diff --git a/.circleci/config.yml b/.circleci/config.yml deleted file mode 100644 index 8d16cb4f..00000000 --- a/.circleci/config.yml +++ /dev/null @@ -1,67 +0,0 @@ -version: 2.1 - -orbs: - python: circleci/python@0.3.2 -jobs: - test: - executor: python/default - steps: - - checkout - - python/load-cache - - python/install-deps - - python/save-cache - - run: pip install cadCAD==0.4.23 - - run: - command: python testing/tests/a_b_tests/multi_model_row_count_0_4_23.py - name: Multi Model Row Count (ver. 0.4.23) - - run: pip install -r requirements.txt --force-reinstall - - run: python setup.py bdist_wheel - - run: pip install dist/*.whl --force-reinstall - - run: - command: python testing/tests/multi_model_row_count.py - name: Multi Model Row Count - - run: - command: python testing/tests/param_sweep.py - name: Parameter sweep - - run: - command: python testing/tests/policy_aggregation.py - name: Policy Aggregation - - run: - command: python testing/tests/timestep1psub0.py - name: Timestep equals 1 instead of 0 for 1st PSUB - - run: - command: python testing/tests/runs_not_zero.py - name: Value Error thrown when Runs < 1 - - run: - command: python testing/tests/run1psub0.py - name: Run Starts at 1 for PSUB 0 - - run: - command: python testing/tests/append_mod_test.py - name: Auto Append Model ID - - run: - command: python testing/tests/cadCAD_exp.py - name: Package Root Experiment and configs object -# - run: -# command: python -m unittest discover -s testing/tests -p "*_test.py" -# name: Test Suite - jupyterServerTest: - docker: - - image: cimg/python:3.9.5 - steps: - - checkout - - python/load-cache - - run: python --version - - run: pip install --upgrade pip - - run: pip install jupyter - - python/save-cache - - run: python setup.py bdist_wheel - - run: pip install dist/*.whl --force-reinstall - - run: - command: python testing/tests/import_cadCAD_test.py - name: cadCAD importable by Jupyter Server - -workflows: - main: - jobs: - - test - - jupyterServerTest diff --git a/.github/workflows/cadcad-ci.yml b/.github/workflows/cadcad-ci.yml new file mode 100644 index 00000000..9ff30705 --- /dev/null +++ b/.github/workflows/cadcad-ci.yml @@ -0,0 +1,61 @@ +# This workflow will install Python dependencies and run tests with multiple versions of Python + +name: cadCAD CI + +on: + push: + branches: [ "master" ] + pull_request: + branches: [ "master" ] + +permissions: + contents: read + +jobs: + build: + continue-on-error: true + + strategy: + matrix: + python-version: ["3.9", "3.10", "3.11", "3.12"] + os: [ubuntu-latest, macos-latest] + + runs-on: ${{ matrix.os }} + + steps: + - uses: actions/checkout@v4 + + - name: Set up Python ${{ matrix.python-version }} + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + cache: 'pip' + + - name: Display Python version + run: python -c "import sys; print(sys.version)" + + - name: Install test and build dependencies + run: | + python -m pip install --upgrade pip + python -m pip install jupyter + pip install -r requirements.txt + + - name: Build cadCAD + run: | + python setup.py bdist_wheel + python -m pip install dist/*.whl --force-reinstall + + - name: Run tests + run: | + python testing/tests/multi_model_row_count.py + python testing/tests/param_sweep.py + python testing/tests/policy_aggregation.py + python testing/tests/timestep1psub0.py + python testing/tests/runs_not_zero.py + python testing/tests/run1psub0.py + python testing/tests/append_mod_test.py + python testing/tests/cadCAD_exp.py + + - name: Run Jupyter test + run: | + python testing/tests/import_cadCAD_test.py diff --git a/AUTHORS.txt b/AUTHORS.txt index 351daeaa..933b38b6 100644 --- a/AUTHORS.txt +++ b/AUTHORS.txt @@ -1,30 +1,41 @@ Authors ======= -cadCAD was implemented by Joshua E. Jodesty and designed by Michael Zargham, Markus B. Koch, and -Matthew V. Barlin from 2018 to 2020. +cadCAD was originally implemented by Joshua E. Jodesty and designed by Michael Zargham, Markus B. Koch, and +Matthew V. Barlin in 2018. Since then, upgrades and improvements were further committed by Danilo L. Bernardineli, Tyler D. Mace +and Emanuel Lima. + -Project Maintainers: -- Joshua E. Jodesty -- Markus B. Koch -- Michael Zargham +Current Project Maintainers: +- Emanuel Lima @emanuellima1 +- Michael Zargham @mzargham -Original Contributors: -- Joshua E. Jodesty -- Markus B. Koch -- Matthew V. Barlin -- Michael Zargham -- Zixuan Zhang -- Charles Rice +Active and Past Contributors: +- Joshua E. Jodesty @JEJodesty +- Markus B. Koch @markusbkoch +- Matthew V. Barlin @matttyb80 +- Michael Zargham @mzargham +- Danilo L. Bernardineli @danlessa +- Tyler D. Mace @tylerdmace +- Emanuel Lima @emanuellima1 +- Zixuan Zhang @zixuanzh +- Charles Rice @charles-rice +- Benjamin Scholz @BenSchZA We’d also like to thank: -- Andrew Clark -- Nick Hirannet -- Jonathan Gabler -- Harry Goodnight +- Andrew Clark @aclarkData +- Nick Hirannet @nick-phl-7 +- Jonathan Gabler +- Harry Goodnight @ - Charlie Hoppes - Nikhil Jamdade - Chris Frazier +- Griff Green @GriffGreen +- Isaac @eenti +- Jonny Dubowsky @jonnydubowsky +- Sem Brestels @sembrestels +- @fjribi +- Andrea Maria Piana @cammellos diff --git a/cadCAD/engine/__init__.py b/cadCAD/engine/__init__.py index c154e72f..59e49d6b 100644 --- a/cadCAD/engine/__init__.py +++ b/cadCAD/engine/__init__.py @@ -1,5 +1,5 @@ from time import time -from typing import Callable, Dict, List, Any, Tuple +from typing import Callable, Dict, List, Any, Tuple, Union from cadCAD.utils import flatten from cadCAD.utils.execution import print_exec_info @@ -39,6 +39,7 @@ def auto_mode_switcher(config_amt: int): class ExecutionContext: def __init__(self, context=ExecutionMode.local_mode, method=None, additional_objs=None) -> None: self.name = context + self.additional_objs = additional_objs if context == 'local_proc': self.method = local_simulations elif context == 'single_proc': @@ -74,6 +75,7 @@ def __init__(self, self.SimExecutor = SimExecutor self.exec_method = exec_context.method self.exec_context = exec_context.name + self.additional_objs = exec_context.additional_objs self.configs = configs self.empty_return = empty_return @@ -174,7 +176,7 @@ def get_final_results(simulations: List[StateHistory], print("Execution Method: " + self.exec_method.__name__) simulations_results = self.exec_method( sim_executors, var_dict_list, states_lists, configs_structs, env_processes_list, Ts, SimIDs, RunIDs, - ExpIDs, SubsetIDs, SubsetWindows, original_N + ExpIDs, SubsetIDs, SubsetWindows, original_N, self.additional_objs ) final_result = get_final_results( diff --git a/cadCAD/engine/execution.py b/cadCAD/engine/execution.py index fdf0452c..febafffe 100644 --- a/cadCAD/engine/execution.py +++ b/cadCAD/engine/execution.py @@ -22,7 +22,8 @@ def single_proc_exec( ExpIDs: List[int], SubsetIDs: List[SubsetID], SubsetWindows: List[SubsetWindow], - configured_n: List[N_Runs] + configured_n: List[N_Runs], + additional_objs=None ): # HACK for making it run with N_Runs=1 @@ -38,7 +39,7 @@ def single_proc_exec( map(lambda x: x.pop(), raw_params) ) result = simulation_exec( - var_dict_list, states_list, config, env_processes, T, sim_id, N, subset_id, subset_window, configured_n + var_dict_list, states_list, config, env_processes, T, sim_id, N, subset_id, subset_window, configured_n, additional_objs ) return flatten(result) @@ -58,7 +59,8 @@ def parallelize_simulations( ExpIDs: List[int], SubsetIDs: List[SubsetID], SubsetWindows: List[SubsetWindow], - configured_n: List[N_Runs] + configured_n: List[N_Runs], + additional_objs=None ): print(f'Execution Mode: parallelized') @@ -96,7 +98,7 @@ def process_executor(params): if len_configs_structs > 1: pp = PPool(processes=len_configs_structs) results = pp.map( - lambda t: t[0](t[1], t[2], t[3], t[4], t[5], t[6], t[7], t[8], t[9], configured_n), params + lambda t: t[0](t[1], t[2], t[3], t[4], t[5], t[6], t[7], t[8], t[9], configured_n, additional_objs), params ) pp.close() pp.join() @@ -123,18 +125,19 @@ def local_simulations( ExpIDs: List[int], SubsetIDs: List[SubsetID], SubsetWindows: List[SubsetWindow], - configured_n: List[N_Runs] + configured_n: List[N_Runs], + additional_objs=None ): config_amt = len(configs_structs) if config_amt == 1: # and configured_n != 1 return single_proc_exec( simulation_execs, var_dict_list, states_lists, configs_structs, env_processes_list, - Ts, SimIDs, Ns, ExpIDs, SubsetIDs, SubsetWindows, configured_n + Ts, SimIDs, Ns, ExpIDs, SubsetIDs, SubsetWindows, configured_n, additional_objs ) elif config_amt > 1: # and configured_n != 1 return parallelize_simulations( simulation_execs, var_dict_list, states_lists, configs_structs, env_processes_list, - Ts, SimIDs, Ns, ExpIDs, SubsetIDs, SubsetWindows, configured_n + Ts, SimIDs, Ns, ExpIDs, SubsetIDs, SubsetWindows, configured_n, additional_objs ) # elif config_amt > 1 and configured_n == 1: diff --git a/cadCAD/engine/simulation.py b/cadCAD/engine/simulation.py index c39a7aa0..d97d083e 100644 --- a/cadCAD/engine/simulation.py +++ b/cadCAD/engine/simulation.py @@ -1,10 +1,12 @@ from typing import Any, Callable, Dict, List, Tuple from copy import deepcopy +from types import MappingProxyType from functools import reduce -from funcy import curry +from funcy import curry # type: ignore from cadCAD.utils import flatten from cadCAD.engine.utils import engine_exception +from cadCAD.types import * id_exception: Callable = curry(engine_exception)(KeyError)(KeyError)(None) @@ -107,20 +109,30 @@ def env_composition(target_field, state_dict, target_value): # mech_step def partial_state_update( self, - sweep_dict: Dict[str, List[Any]], - sub_step: int, - sL, - sH, - state_funcs: List[Callable], - policy_funcs: List[Callable], - env_processes: Dict[str, Callable], + sweep_dict: Parameters, + sub_step: Substep, + sL: list[State], + sH: StateHistory, + state_funcs: List[StateUpdateFunction], + policy_funcs: List[PolicyFunction], + env_processes: EnvProcesses, time_step: int, run: int, additional_objs ) -> List[Dict[str, Any]]: - # last_in_obj: Dict[str, Any] = MappingProxyType(sL[-1]) - last_in_obj: Dict[str, Any] = deepcopy(sL[-1]) + if type(additional_objs) == dict: + if additional_objs.get('deepcopy_off', False) == True: + last_in_obj = MappingProxyType(sL[-1]) + if len(additional_objs) == 1: + additional_objs = None + # XXX: drop the additional objects if only used for deepcopy + # toggling. + else: + last_in_obj = deepcopy(sL[-1]) + else: + last_in_obj = deepcopy(sL[-1]) + _input: Dict[str, Any] = self.policy_update_exception( self.get_policy_input(sweep_dict, sub_step, sH, last_in_obj, policy_funcs, additional_objs) ) @@ -217,18 +229,18 @@ def run_pipeline( def simulation( self, - sweep_dict: Dict[str, List[Any]], - states_list: List[Dict[str, Any]], + sweep_dict: SweepableParameters, + states_list: StateHistory, configs, - env_processes: Dict[str, Callable], - time_seq: range, - simulation_id: int, + env_processes: EnvProcesses, + time_seq: TimeSeq, + simulation_id: SimulationID, run: int, - subset_id, - subset_window, - configured_N, + subset_id: SubsetID, + subset_window: SubsetWindow, + configured_N: int, # remote_ind - additional_objs=None + additional_objs: Union[None, Dict]=None ): run += 1 subset_window.appendleft(subset_id) diff --git a/cadCAD/types.py b/cadCAD/types.py index 78726b5a..d2658e48 100644 --- a/cadCAD/types.py +++ b/cadCAD/types.py @@ -24,8 +24,9 @@ class ConfigurationDict(TypedDict): N: int # Number of MC Runs M: Union[Parameters, SweepableParameters] # Parameters / List of Parameter to Sweep - -EnvProcesses = object +TargetValue = object +EnvProcess: Callable[[State, SweepableParameters, TargetValue], TargetValue] +EnvProcesses = dict[str, Callable] TimeSeq = Iterator SimulationID = int Run = int @@ -33,7 +34,6 @@ class ConfigurationDict(TypedDict): SubsetWindow = Iterator N_Runs = int - ExecutorFunction = Callable[[Parameters, StateHistory, StateUpdateBlocks, EnvProcesses, TimeSeq, SimulationID, Run, SubsetID, SubsetWindow, N_Runs], object] ExecutionParameter = Tuple[ExecutorFunction, Parameters, StateHistory, StateUpdateBlocks, EnvProcesses, TimeSeq, SimulationID, Run, SubsetID, SubsetWindow, N_Runs] @@ -45,4 +45,4 @@ class SessionDict(TypedDict): simulation_id: int run_id: int subset_id: int - subset_window: deque \ No newline at end of file + subset_window: deque diff --git a/requirements.txt b/requirements.txt index 0890a625..a951734a 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,21 +1,13 @@ -i https://pypi.org/simple -matplotlib==3.3.2 -networkx==2.5 -parameterized==0.7.4 -plotly==4.10.0 -pytest==6.0.2 -scikit-learn==0.23.2 -scipy>=1.5.2 -seaborn==0.11.0 -tabulate==0.8.7 -xarray==0.16.0 -wheel==0.38.1 -pandas==1.1.5 -fn==0.4.3 -funcy==1.16 -dill==0.3.4 -pathos==0.2.8 -numpy==1.22.0 -pytz==2021.1 -six>=1.11.0 +parameterized>=0.7.4 +pytest>=6.0.2 +tabulate>=0.8.7 +wheel>=0.38.1 +pandas>=1.1.5 +funcy>=1.16 +dill>=0.3.4 +pathos>=0.2.8 +numpy>=1.22.0 +pytz>=2021.1 +setuptools>=69.0.2 diff --git a/setup.py b/setup.py index fc8ae488..dfd786c4 100644 --- a/setup.py +++ b/setup.py @@ -28,8 +28,8 @@ description=short_description, long_description=long_description, url='https://github.com/cadCAD-org/cadCAD', - author='Joshua E. Jodesty', - author_email='joshua@block.science', + author='cadCAD-org Developers', + author_email='info@block.science', license='LICENSE.txt', packages=find_packages(), install_requires=[ diff --git a/testing/test_additional_objs.py b/testing/test_additional_objs.py new file mode 100644 index 00000000..89cd2995 --- /dev/null +++ b/testing/test_additional_objs.py @@ -0,0 +1,187 @@ +from typing import Dict, List +from cadCAD.engine import Executor, ExecutionContext, ExecutionMode +from cadCAD.configuration import Experiment +from cadCAD.configuration.utils import env_trigger, var_substep_trigger, config_sim, psub_list +from cadCAD.types import * +import pandas as pd # type: ignore +import types +import inspect +import pytest + +def describe_or_return(v: object) -> object: + """ + Thanks @LinuxIsCool! + """ + if isinstance(v, types.FunctionType): + return f'function: {v.__name__}' + elif isinstance(v, types.LambdaType) and v.__name__ == '': + return f'lambda: {inspect.signature(v)}' + else: + return v + + +def select_M_dict(M_dict: Dict[str, object], keys: set) -> Dict[str, object]: + """ + Thanks @LinuxIsCool! + """ + return {k: describe_or_return(v) for k, v in M_dict.items() if k in keys} + + +def select_config_M_dict(configs: list, i: int, keys: set) -> Dict[str, object]: + return select_M_dict(configs[i].sim_config['M'], keys) + + +def drop_substeps(_df): + first_ind = (_df.substep == 0) & (_df.timestep == 0) + last_ind = _df.substep == max(_df.substep) + inds_to_drop = first_ind | last_ind + return _df.copy().loc[inds_to_drop].drop(columns=['substep']) + + +def assign_params(_df: pd.DataFrame, configs) -> pd.DataFrame: + """ + Based on `cadCAD-tools` package codebase, by @danlessa + """ + M_dict = configs[0].sim_config['M'] + params_set = set(M_dict.keys()) + selected_params = params_set + + # Attribute parameters to each row + # 1. Assign the parameter set from the first row first, so that + # columns are created + first_param_dict = select_config_M_dict(configs, 0, selected_params) + + # 2. Attribute parameter on an (simulation, subset, run) basis + df = _df.assign(**first_param_dict).copy() + for i, (_, subset_df) in enumerate(df.groupby(['simulation', 'subset', 'run'])): + df.loc[subset_df.index] = subset_df.assign(**select_config_M_dict(configs, + i, + selected_params)) + return df + + + + +SWEEP_PARAMS: Dict[str, List] = { + 'alpha': [1], + 'beta': [lambda x: 2 * x, lambda x: x], + 'gamma': [3, 4], + 'omega': [7] + } + +SINGLE_PARAMS: Dict[str, object] = { + 'alpha': 1, + 'beta': lambda x: x, + 'gamma': 3, + 'omega': 5 + } + + +def create_experiment(N_RUNS=2, N_TIMESTEPS=3, params: dict=SWEEP_PARAMS): + psu_steps = ['m1', 'm2', 'm3'] + system_substeps = len(psu_steps) + var_timestep_trigger = var_substep_trigger([0, system_substeps]) + env_timestep_trigger = env_trigger(system_substeps) + env_process = {} + + + # ['s1', 's2', 's3', 's4'] + # Policies per Mechanism + def gamma(params: Parameters, substep: Substep, history: StateHistory, state: State, **kwargs): + return {'gamma': params['gamma']} + + + def omega(params: Parameters, substep: Substep, history: StateHistory, state: State, **kwarg): + return {'omega': params['omega']} + + + # Internal States per Mechanism + def alpha(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'alpha_var', params['alpha'] + + + def beta(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'beta_var', params['beta'] + + def gamma_var(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'gamma_var', params['gamma'] + + def omega_var(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'omega_var', params['omega'] + + + def policies(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'policies', _input + + + def sweeped(params: Parameters, substep: Substep, history: StateHistory, state: State, _input: PolicyOutput, **kwargs): + return 'sweeped', {'beta': params['beta'], 'gamma': params['gamma']} + + psu_block: dict = {k: {"policies": {}, "states": {}} for k in psu_steps} + for m in psu_steps: + psu_block[m]['policies']['gamma'] = gamma + psu_block[m]['policies']['omega'] = omega + psu_block[m]["states"]['alpha_var'] = alpha + psu_block[m]["states"]['beta_var'] = beta + psu_block[m]["states"]['gamma_var'] = gamma_var + psu_block[m]["states"]['omega_var'] = omega_var + psu_block[m]['states']['policies'] = policies + psu_block[m]["states"]['sweeped'] = var_timestep_trigger(y='sweeped', f=sweeped) + + + # Genesis States + genesis_states = { + 'alpha_var': 0, + 'beta_var': 0, + 'gamma_var': 0, + 'omega_var': 0, + 'policies': {}, + 'sweeped': {} + } + + # Environment Process + env_process['sweeped'] = env_timestep_trigger(trigger_field='timestep', trigger_vals=[5], funct_list=[lambda _g, x: _g['beta']]) + + sim_config = config_sim( + { + "N": N_RUNS, + "T": range(N_TIMESTEPS), + "M": params, # Optional + } + ) + + # New Convention + partial_state_update_blocks = psub_list(psu_block, psu_steps) + + exp = Experiment() + exp.append_model( + sim_configs=sim_config, + initial_state=genesis_states, + env_processes=env_process, + partial_state_update_blocks=partial_state_update_blocks + ) + return exp + + +def test_deepcopy_off(): + exp = create_experiment() + mode = ExecutionMode().local_mode + exec_context = ExecutionContext(mode, additional_objs={'deepcopy_off': True}) + executor = Executor(exec_context=exec_context, configs=exp.configs) + (records, tensor_field, _) = executor.execute() + df = drop_substeps(assign_params(pd.DataFrame(records), exp.configs)) + + # XXX: parameters should always be of the same type. Else, the test will fail + first_sim_config = exp.configs[0].sim_config['M'] + + + for (i, row) in df.iterrows(): + if row.timestep > 0: + + assert row['alpha_var'] == row['alpha'] + assert type(row['alpha_var']) == type(first_sim_config['alpha']) + assert row['gamma_var'] == row['gamma'] + assert type(row['gamma_var']) == type(first_sim_config['gamma']) + assert row['omega_var'] == row['omega'] + assert type(row['omega_var']) == type(first_sim_config['omega']) +