From a54c45f82812207e3eb9da7b4e5baafb2e7b4441 Mon Sep 17 00:00:00 2001 From: Leif Denby Date: Mon, 19 Aug 2024 15:44:39 +0200 Subject: [PATCH] Refactor codebase into a python package (#32) Make it possible to install `neural-lam` as a package, thereby enabling the possibility to run from anywhere once the package has been installed. This means it is now possible (in theory) to train neural-lam on a `.npy`-file based dataset with the neural-lam package installed into a user's `site-packages` (i.e. in their virtualenv). The primary changes are: - move all `*.py` files that are currently outside of neural_lam/ into that folder, but keep the files the same - change all examples of running the neural-lam "scripts", e.g. `python create_mesh.py` to `python -m neural_lam.create_mesh` in the README - change all absolute imports to package-relative imports, i.e. `from . import utils` rather than `from neural_lam import utils` - add tests that all the CLI entrypoints to neural_lam can be imported and add ci/cd action to run these tests --------- Co-authored-by: SimonKamuk <43374850+SimonKamuk@users.noreply.github.com> Co-authored-by: joeloskarsson Co-authored-by: Leif Denby --- .github/workflows/run_tests.yml | 2 +- .pre-commit-config.yaml | 1 + CHANGELOG.md | 7 ++ README.md | 94 +++++++++---------- neural_lam/__init__.py | 10 ++ .../create_grid_features.py | 4 +- create_mesh.py => neural_lam/create_mesh.py | 4 +- .../create_parameter_weights.py | 5 +- neural_lam/interaction_net.py | 4 +- neural_lam/models/__init__.py | 6 ++ neural_lam/models/ar_model.py | 4 +- neural_lam/models/base_graph_model.py | 8 +- neural_lam/models/base_hi_graph_model.py | 8 +- neural_lam/models/graph_lam.py | 8 +- neural_lam/models/hi_lam.py | 6 +- neural_lam/models/hi_lam_parallel.py | 6 +- train_model.py => neural_lam/train_model.py | 9 +- neural_lam/vis.py | 4 +- neural_lam/weather_dataset.py | 4 +- pyproject.toml | 7 ++ tests/__init__.py | 0 tests/test_cli.py | 18 ++++ tests/test_mllam_dataset.py | 20 ++-- 23 
files changed, 141 insertions(+), 98 deletions(-) create mode 100644 neural_lam/__init__.py rename create_grid_features.py => neural_lam/create_grid_features.py (97%) rename create_mesh.py => neural_lam/create_mesh.py (99%) rename create_parameter_weights.py => neural_lam/create_parameter_weights.py (99%) create mode 100644 neural_lam/models/__init__.py rename train_model.py => neural_lam/train_model.py (97%) delete mode 100644 tests/__init__.py create mode 100644 tests/test_cli.py diff --git a/.github/workflows/run_tests.yml b/.github/workflows/run_tests.yml index 4c677908..810f2b2c 100644 --- a/.github/workflows/run_tests.yml +++ b/.github/workflows/run_tests.yml @@ -35,7 +35,7 @@ jobs: ${{ runner.os }}-meps-reduced-example-data-v0.1.0 - name: Test with pytest run: | - pytest -v -s + python -m pytest -v -s tests/ - name: Save cache data uses: actions/cache/save@v4 with: diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 815a92e1..dfbf8b60 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -35,3 +35,4 @@ repos: hooks: - id: flake8 description: Check Python code for correctness, consistency and adherence to best practices + additional_dependencies: [Flake8-pyproject] diff --git a/CHANGELOG.md b/CHANGELOG.md index dfb186f7..c183888e 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -92,6 +92,13 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 [\#68](https://github.com/mllam/neural-lam/pull/68) @joeloskarsson +- turn `neural-lam` into a python package by moving all `*.py`-files into the + `neural_lam/` source directory and updating imports accordingly. This means + all cli functions are now invoked through the package name, e.g. `python -m + neural_lam.train_model` instead of `python train_model.py` (and can be done + anywhere once the package has been installed). 
+ [\#32](https://github.com/mllam/neural-lam/pull/32), @leifdenby + ## [v0.1.0](https://github.com/joeloskarsson/neural-lam/releases/tag/v0.1.0) First tagged release of `neural-lam`, matching Oskarsson et al 2023 publication diff --git a/README.md b/README.md index 26d844f7..ce8daf69 100644 --- a/README.md +++ b/README.md @@ -48,7 +48,7 @@ Still, some restrictions are inevitable: ## A note on the limited area setting Currently we are using these models on a limited area covering the Nordic region, the so called MEPS area (see [paper](https://arxiv.org/abs/2309.17370)). There are still some parts of the code that is quite specific for the MEPS area use case. -This is in particular true for the mesh graph creation (`create_mesh.py`) and some of the constants set in a `data_config.yaml` file (path specified in `train_model.py --data_config` ). +This is in particular true for the mesh graph creation (`python -m neural_lam.create_mesh`) and some of the constants set in a `data_config.yaml` file (path specified in `python -m neural_lam.train_model --data_config ` ). If there is interest to use Neural-LAM for other areas it is not a substantial undertaking to refactor the code to be fully area-agnostic. We would be happy to support such enhancements. See the issues https://github.com/joeloskarsson/neural-lam/issues/2, https://github.com/joeloskarsson/neural-lam/issues/3 and https://github.com/joeloskarsson/neural-lam/issues/4 for some initial ideas on how this could be done. @@ -62,16 +62,10 @@ Follow the steps below to create the necessary python environment. 1. Install GEOS for your system. For example with `sudo apt-get install libgeos-dev`. This is necessary for the Cartopy requirement. 2. Use python 3.9. 3. Install version 2.0.1 of PyTorch. Follow instructions on the [PyTorch webpage](https://pytorch.org/get-started/previous-versions/) for how to set this up with GPU support on your system. -4. Install required packages specified in `requirements.txt`. -5. 
Install PyTorch Geometric version 2.2.0. This can be done by running +4. Install `neural-lam` with pip: ``` -TORCH="2.0.1" -CUDA="cu117" - -pip install pyg-lib==0.2.0 torch-scatter==2.1.1 torch-sparse==0.6.17 torch-cluster==1.6.1\ - torch-geometric==2.3.1 -f https://pytorch-geometric.com/whl/torch-${TORCH}+${CUDA}.html +pip install -e . ``` -You will have to adjust the `CUDA` variable to match the CUDA version on your system or to run on CPU. See the [installation webpage](https://pytorch-geometric.readthedocs.io/en/latest/install/installation.html) for more information. ## Data Datasets should be stored in a directory called `data`. @@ -80,39 +74,39 @@ See the [repository format section](#format-of-data-directory) for details on th The full MEPS dataset can be shared with other researchers on request, contact us for this. A tiny subset of the data (named `meps_example`) is available in `example_data.zip`, which can be downloaded from [here](https://liuonline-my.sharepoint.com/:f:/g/personal/joeos82_liu_se/EuiUuiGzFIFHruPWpfxfUmYBSjhqMUjNExlJi9W6ULMZ1w?e=97pnGX). Download the file and unzip in the neural-lam directory. -All graphs used in the paper are also available for download at the same link (but can as easily be re-generated using `create_mesh.py`). -Note that this is far too little data to train any useful models, but all scripts can be ran with it. +All graphs used in the paper are also available for download at the same link (but can as easily be re-generated using `python -m neural_lam.create_mesh`). +Note that this is far too little data to train any useful models, but all pre-processing and training steps can be run with it. It should thus be useful to make sure that your python environment is set up correctly and that all the code can be ran without any issues. 
## Pre-processing -An overview of how the different scripts and files depend on each other is given in this figure: +An overview of how the different pre-processing steps, training and files depend on each other is given in this figure:

-In order to start training models at least three pre-processing scripts have to be ran: +In order to start training models at least three pre-processing steps have to be run: -* `create_mesh.py` -* `create_grid_features.py` -* `create_parameter_weights.py` +* `python -m neural_lam.create_mesh` +* `python -m neural_lam.create_grid_features` +* `python -m neural_lam.create_parameter_weights` ### Create graph -Run `create_mesh.py` with suitable options to generate the graph you want to use (see `python create_mesh.py --help` for a list of options). +Run `python -m neural_lam.create_mesh` with suitable options to generate the graph you want to use (see `python -m neural_lam.create_mesh --help` for a list of options). The graphs used for the different models in the [paper](https://arxiv.org/abs/2309.17370) can be created as: -* **GC-LAM**: `python create_mesh.py --graph multiscale` -* **Hi-LAM**: `python create_mesh.py --graph hierarchical --hierarchical 1` (also works for Hi-LAM-Parallel) -* **L1-LAM**: `python create_mesh.py --graph 1level --levels 1` +* **GC-LAM**: `python -m neural_lam.create_mesh --graph multiscale` +* **Hi-LAM**: `python -m neural_lam.create_mesh --graph hierarchical --hierarchical 1` (also works for Hi-LAM-Parallel) +* **L1-LAM**: `python -m neural_lam.create_mesh --graph 1level --levels 1` The graph-related files are stored in a directory called `graphs`. ### Create remaining static features -To create the remaining static files run the scripts `create_grid_features.py` and `create_parameter_weights.py`. +To create the remaining static files run `python -m neural_lam.create_grid_features` and `python -m neural_lam.create_parameter_weights`. ## Weights & Biases Integration The project is fully integrated with [Weights & Biases](https://www.wandb.ai/) (W&B) for logging and visualization, but can just as easily be used without it. 
When W&B is used, training configuration, training/test statistics and plots are sent to the W&B servers and made available in an interactive web interface. If W&B is turned off, logging instead saves everything locally to a directory like `wandb/dryrun...`. -The W&B project name is set to `neural-lam`, but this can be changed in the flags of `train_model.py` (using argsparse). +The W&B project name is set to `neural-lam`, but this can be changed in the flags of `python -m neural_lam.train_model` (using argparse). See the [W&B documentation](https://docs.wandb.ai/) for details. If you would like to login and use W&B, run: @@ -125,8 +119,8 @@ wandb off ``` ## Train Models -Models can be trained using `train_model.py`. -Run `python train_model.py --help` for a full list of training options. +Models can be trained using `python -m neural_lam.train_model`. +Run `python -m neural_lam.train_model --help` for a full list of training options. A few of the key ones are outlined below: * `--dataset`: Which data to train on @@ -145,12 +139,12 @@ This model class is used both for the L1-LAM and GC-LAM models from the [paper]( To train 1L-LAM use ``` -python train_model.py --model graph_lam --graph 1level ... +python -m neural_lam.train_model --model graph_lam --graph 1level ... ``` To train GC-LAM use ``` -python train_model.py --model graph_lam --graph multiscale ... +python -m neural_lam.train_model --model graph_lam --graph multiscale ... ``` ### Hi-LAM @@ -158,7 +152,7 @@ A version of Graph-LAM that uses a hierarchical mesh graph and performs sequenti To train Hi-LAM use ``` -python train_model.py --model hi_lam --graph hierarchical ... +python -m neural_lam.train_model --model hi_lam --graph hierarchical ... ``` ### Hi-LAM-Parallel @@ -167,13 +161,13 @@ Not included in the paper as initial experiments showed worse results than Hi-LA To train Hi-LAM-Parallel use ``` -python train_model.py --model hi_lam_parallel --graph hierarchical ... 
+python -m neural_lam.train_model --model hi_lam_parallel --graph hierarchical ... ``` Checkpoint files for our models trained on the MEPS data are available upon request. ## Evaluate Models -Evaluation is also done using `train_model.py`, but using the `--eval` option. +Evaluation is also done using `python -m neural_lam.train_model`, but using the `--eval` option. Use `--eval val` to evaluate the model on the validation set and `--eval test` to evaluate on test data. Most of the training options are also relevant for evaluation (not `ar_steps`, evaluation always unrolls full forecasts). Some options specifically important for evaluation are: @@ -216,13 +210,13 @@ data │ ├── nwp_xy.npy - Coordinates of grid nodes (part of dataset) │ ├── surface_geopotential.npy - Geopotential at surface of grid nodes (part of dataset) │ ├── border_mask.npy - Mask with True for grid nodes that are part of border (part of dataset) -│ ├── grid_features.pt - Static features of grid nodes (create_grid_features.py) -│ ├── parameter_mean.pt - Means of state parameters (create_parameter_weights.py) -│ ├── parameter_std.pt - Std.-dev. of state parameters (create_parameter_weights.py) -│ ├── diff_mean.pt - Means of one-step differences (create_parameter_weights.py) -│ ├── diff_std.pt - Std.-dev. of one-step differences (create_parameter_weights.py) -│ ├── flux_stats.pt - Mean and std.-dev. of solar flux forcing (create_parameter_weights.py) -│ └── parameter_weights.npy - Loss weights for different state parameters (create_parameter_weights.py) +│ ├── grid_features.pt - Static features of grid nodes (neural_lam.create_grid_features) +│ ├── parameter_mean.pt - Means of state parameters (neural_lam.create_parameter_weights) +│ ├── parameter_std.pt - Std.-dev. of state parameters (neural_lam.create_parameter_weights) +│ ├── diff_mean.pt - Means of one-step differences (neural_lam.create_parameter_weights) +│ ├── diff_std.pt - Std.-dev. 
of one-step differences (neural_lam.create_parameter_weights) +│ ├── flux_stats.pt - Mean and std.-dev. of solar flux forcing (neural_lam.create_parameter_weights) +│ └── parameter_weights.npy - Loss weights for different state parameters (neural_lam.create_parameter_weights) ├── dataset2 ├── ... └── datasetN @@ -234,13 +228,13 @@ The structure is shown with examples below: ``` graphs ├── graph1 - Directory with a graph definition -│ ├── m2m_edge_index.pt - Edges in mesh graph (create_mesh.py) -│ ├── g2m_edge_index.pt - Edges from grid to mesh (create_mesh.py) -│ ├── m2g_edge_index.pt - Edges from mesh to grid (create_mesh.py) -│ ├── m2m_features.pt - Static features of mesh edges (create_mesh.py) -│ ├── g2m_features.pt - Static features of grid to mesh edges (create_mesh.py) -│ ├── m2g_features.pt - Static features of mesh to grid edges (create_mesh.py) -│ └── mesh_features.pt - Static features of mesh nodes (create_mesh.py) +│ ├── m2m_edge_index.pt - Edges in mesh graph (neural_lam.create_mesh) +│ ├── g2m_edge_index.pt - Edges from grid to mesh (neural_lam.create_mesh) +│ ├── m2g_edge_index.pt - Edges from mesh to grid (neural_lam.create_mesh) +│ ├── m2m_features.pt - Static features of mesh edges (neural_lam.create_mesh) +│ ├── g2m_features.pt - Static features of grid to mesh edges (neural_lam.create_mesh) +│ ├── m2g_features.pt - Static features of mesh to grid edges (neural_lam.create_mesh) +│ └── mesh_features.pt - Static features of mesh nodes (neural_lam.create_mesh) ├── graph2 ├── ... └── graphN @@ -250,9 +244,9 @@ graphs To keep track of levels in the mesh graph, a list format is used for the files with mesh graph information. 
In particular, the files ``` -│ ├── m2m_edge_index.pt - Edges in mesh graph (create_mesh.py) -│ ├── m2m_features.pt - Static features of mesh edges (create_mesh.py) -│ ├── mesh_features.pt - Static features of mesh nodes (create_mesh.py) +│ ├── m2m_edge_index.pt - Edges in mesh graph (neural_lam.create_mesh) +│ ├── m2m_features.pt - Static features of mesh edges (neural_lam.create_mesh) +│ ├── mesh_features.pt - Static features of mesh nodes (neural_lam.create_mesh) ``` all contain lists of length `L`, for a hierarchical mesh graph with `L` layers. For non-hierarchical graphs `L == 1` and these are all just singly-entry lists. @@ -263,10 +257,10 @@ In addition, hierarchical mesh graphs (`L > 1`) feature a few additional files w ``` ├── graph1 │ ├── ... -│ ├── mesh_down_edge_index.pt - Downward edges in mesh graph (create_mesh.py) -│ ├── mesh_up_edge_index.pt - Upward edges in mesh graph (create_mesh.py) -│ ├── mesh_down_features.pt - Static features of downward mesh edges (create_mesh.py) -│ ├── mesh_up_features.pt - Static features of upward mesh edges (create_mesh.py) +│ ├── mesh_down_edge_index.pt - Downward edges in mesh graph (neural_lam.create_mesh) +│ ├── mesh_up_edge_index.pt - Upward edges in mesh graph (neural_lam.create_mesh) +│ ├── mesh_down_features.pt - Static features of downward mesh edges (neural_lam.create_mesh) +│ ├── mesh_up_features.pt - Static features of upward mesh edges (neural_lam.create_mesh) │ ├── ... ``` These files have the same list format as the ones above, but each list has length `L-1` (as these edges describe connections between levels). 
diff --git a/neural_lam/__init__.py b/neural_lam/__init__.py new file mode 100644 index 00000000..dd565a26 --- /dev/null +++ b/neural_lam/__init__.py @@ -0,0 +1,10 @@ +# First-party +import neural_lam.config +import neural_lam.interaction_net +import neural_lam.metrics +import neural_lam.models +import neural_lam.utils +import neural_lam.vis + +# Local +from .weather_dataset import WeatherDataset diff --git a/create_grid_features.py b/neural_lam/create_grid_features.py similarity index 97% rename from create_grid_features.py rename to neural_lam/create_grid_features.py index 4f058e17..adabd9dc 100644 --- a/create_grid_features.py +++ b/neural_lam/create_grid_features.py @@ -6,8 +6,8 @@ import numpy as np import torch -# First-party -from neural_lam import config +# Local +from . import config def main(): diff --git a/create_mesh.py b/neural_lam/create_mesh.py similarity index 99% rename from create_mesh.py rename to neural_lam/create_mesh.py index 41557a97..40f7ba0e 100644 --- a/create_mesh.py +++ b/neural_lam/create_mesh.py @@ -12,8 +12,8 @@ import torch_geometric as pyg from torch_geometric.utils.convert import from_networkx -# First-party -from neural_lam import config +# Local +from . import config def plot_graph(graph, title=None): diff --git a/create_parameter_weights.py b/neural_lam/create_parameter_weights.py similarity index 99% rename from create_parameter_weights.py rename to neural_lam/create_parameter_weights.py index c85cd5a3..74058d38 100644 --- a/create_parameter_weights.py +++ b/neural_lam/create_parameter_weights.py @@ -10,9 +10,8 @@ from torch.utils.data.distributed import DistributedSampler from tqdm import tqdm -# First-party -from neural_lam import config -from neural_lam.weather_dataset import WeatherDataset +# Local +from . 
import WeatherDataset, config class PaddedWeatherDataset(torch.utils.data.Dataset): diff --git a/neural_lam/interaction_net.py b/neural_lam/interaction_net.py index 663f27e4..2f45b03f 100644 --- a/neural_lam/interaction_net.py +++ b/neural_lam/interaction_net.py @@ -3,8 +3,8 @@ import torch_geometric as pyg from torch import nn -# First-party -from neural_lam import utils +# Local +from . import utils class InteractionNet(pyg.nn.MessagePassing): diff --git a/neural_lam/models/__init__.py b/neural_lam/models/__init__.py new file mode 100644 index 00000000..f65387ab --- /dev/null +++ b/neural_lam/models/__init__.py @@ -0,0 +1,6 @@ +# Local +from .base_graph_model import BaseGraphModel +from .base_hi_graph_model import BaseHiGraphModel +from .graph_lam import GraphLAM +from .hi_lam import HiLAM +from .hi_lam_parallel import HiLAMParallel diff --git a/neural_lam/models/ar_model.py b/neural_lam/models/ar_model.py index 6ced211f..e94de8c6 100644 --- a/neural_lam/models/ar_model.py +++ b/neural_lam/models/ar_model.py @@ -8,8 +8,8 @@ import torch import wandb -# First-party -from neural_lam import config, metrics, utils, vis +# Local +from .. import config, metrics, utils, vis class ARModel(pl.LightningModule): diff --git a/neural_lam/models/base_graph_model.py b/neural_lam/models/base_graph_model.py index 256d4adc..99629073 100644 --- a/neural_lam/models/base_graph_model.py +++ b/neural_lam/models/base_graph_model.py @@ -1,10 +1,10 @@ # Third-party import torch -# First-party -from neural_lam import utils -from neural_lam.interaction_net import InteractionNet -from neural_lam.models.ar_model import ARModel +# Local +from .. 
import utils +from ..interaction_net import InteractionNet +from .ar_model import ARModel class BaseGraphModel(ARModel): diff --git a/neural_lam/models/base_hi_graph_model.py b/neural_lam/models/base_hi_graph_model.py index 3fd30579..a2ebcc1b 100644 --- a/neural_lam/models/base_hi_graph_model.py +++ b/neural_lam/models/base_hi_graph_model.py @@ -1,10 +1,10 @@ # Third-party from torch import nn -# First-party -from neural_lam import utils -from neural_lam.interaction_net import InteractionNet -from neural_lam.models.base_graph_model import BaseGraphModel +# Local +from .. import utils +from ..interaction_net import InteractionNet +from .base_graph_model import BaseGraphModel class BaseHiGraphModel(BaseGraphModel): diff --git a/neural_lam/models/graph_lam.py b/neural_lam/models/graph_lam.py index f767fba0..d73f7ad8 100644 --- a/neural_lam/models/graph_lam.py +++ b/neural_lam/models/graph_lam.py @@ -1,10 +1,10 @@ # Third-party import torch_geometric as pyg -# First-party -from neural_lam import utils -from neural_lam.interaction_net import InteractionNet -from neural_lam.models.base_graph_model import BaseGraphModel +# Local +from .. 
import utils +from ..interaction_net import InteractionNet +from .base_graph_model import BaseGraphModel class GraphLAM(BaseGraphModel): diff --git a/neural_lam/models/hi_lam.py b/neural_lam/models/hi_lam.py index 4d7eb94c..4f3aec05 100644 --- a/neural_lam/models/hi_lam.py +++ b/neural_lam/models/hi_lam.py @@ -1,9 +1,9 @@ # Third-party from torch import nn -# First-party -from neural_lam.interaction_net import InteractionNet -from neural_lam.models.base_hi_graph_model import BaseHiGraphModel +# Local +from ..interaction_net import InteractionNet +from .base_hi_graph_model import BaseHiGraphModel class HiLAM(BaseHiGraphModel): diff --git a/neural_lam/models/hi_lam_parallel.py b/neural_lam/models/hi_lam_parallel.py index 740824e1..b40a9424 100644 --- a/neural_lam/models/hi_lam_parallel.py +++ b/neural_lam/models/hi_lam_parallel.py @@ -2,9 +2,9 @@ import torch import torch_geometric as pyg -# First-party -from neural_lam.interaction_net import InteractionNet -from neural_lam.models.base_hi_graph_model import BaseHiGraphModel +# Local +from ..interaction_net import InteractionNet +from .base_hi_graph_model import BaseHiGraphModel class HiLAMParallel(BaseHiGraphModel): diff --git a/train_model.py b/neural_lam/train_model.py similarity index 97% rename from train_model.py rename to neural_lam/train_model.py index 03863275..39f7aecd 100644 --- a/train_model.py +++ b/neural_lam/train_model.py @@ -9,12 +9,9 @@ import torch from lightning_fabric.utilities import seed -# First-party -from neural_lam import config, utils -from neural_lam.models.graph_lam import GraphLAM -from neural_lam.models.hi_lam import HiLAM -from neural_lam.models.hi_lam_parallel import HiLAMParallel -from neural_lam.weather_dataset import WeatherDataset +# Local +from . 
import WeatherDataset, config, utils +from .models import GraphLAM, HiLAM, HiLAMParallel MODELS = { "graph_lam": GraphLAM, diff --git a/neural_lam/vis.py b/neural_lam/vis.py index 8c9ca77c..2f22bef1 100644 --- a/neural_lam/vis.py +++ b/neural_lam/vis.py @@ -3,8 +3,8 @@ import matplotlib.pyplot as plt import numpy as np -# First-party -from neural_lam import utils +# Local +from . import utils @matplotlib.rc_context(utils.fractional_plot_bundle(1)) diff --git a/neural_lam/weather_dataset.py b/neural_lam/weather_dataset.py index 3288ed67..29977789 100644 --- a/neural_lam/weather_dataset.py +++ b/neural_lam/weather_dataset.py @@ -7,8 +7,8 @@ import numpy as np import torch -# First-party -from neural_lam import utils +# Local +from . import utils class WeatherDataset(torch.utils.data.Dataset): diff --git a/pyproject.toml b/pyproject.toml index b513a258..c482abc9 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,3 +1,10 @@ +[project] +name = "neural-lam" +version = "0.1.0" + +[tool.setuptools] +py-modules = ["neural_lam"] + [tool.black] line-length = 80 diff --git a/tests/__init__.py b/tests/__init__.py deleted file mode 100644 index e69de29b..00000000 diff --git a/tests/test_cli.py b/tests/test_cli.py new file mode 100644 index 00000000..e90daa04 --- /dev/null +++ b/tests/test_cli.py @@ -0,0 +1,18 @@ +# First-party +import neural_lam +import neural_lam.create_grid_features +import neural_lam.create_mesh +import neural_lam.create_parameter_weights +import neural_lam.train_model + + +def test_import(): + """ + This test just ensures that each cli entry-point can be imported for now, + eventually we should test their execution too + """ + assert neural_lam is not None + assert neural_lam.create_mesh is not None + assert neural_lam.create_grid_features is not None + assert neural_lam.create_parameter_weights is not None + assert neural_lam.train_model is not None diff --git a/tests/test_mllam_dataset.py b/tests/test_mllam_dataset.py index f91170c9..e12a57ae 100644 
--- a/tests/test_mllam_dataset.py +++ b/tests/test_mllam_dataset.py @@ -1,15 +1,17 @@ # Standard library import os +from pathlib import Path # Third-party import pooch +import pytest # First-party -from create_mesh import main as create_mesh from neural_lam.config import Config +from neural_lam.create_mesh import main as create_mesh +from neural_lam.train_model import main as train_model from neural_lam.utils import load_static_data from neural_lam.weather_dataset import WeatherDataset -from train_model import main as train_model # Disable weights and biases to avoid unnecessary logging # and to avoid having to deal with authentication @@ -25,7 +27,8 @@ ) -def test_retrieve_data_ewc(): +@pytest.fixture(scope="module") +def meps_example_reduced_filepath(): # Download and unzip test data into data/meps_example_reduced pooch.retrieve( url=S3_FULL_PATH, @@ -34,16 +37,17 @@ def test_retrieve_data_ewc(): path="data", fname="meps_example_reduced.zip", ) + return Path("data/meps_example_reduced") -def test_load_reduced_meps_dataset(): +def test_load_reduced_meps_dataset(meps_example_reduced_filepath): # The data_config.yaml file is downloaded and extracted in # test_retrieve_data_ewc together with the dataset itself - data_config_file = "data/meps_example_reduced/data_config.yaml" - dataset_name = "meps_example_reduced" + data_config_file = meps_example_reduced_filepath / "data_config.yaml" + dataset_name = meps_example_reduced_filepath.name - dataset = WeatherDataset(dataset_name="meps_example_reduced") - config = Config.from_file(data_config_file) + dataset = WeatherDataset(dataset_name=dataset_name) + config = Config.from_file(str(data_config_file)) var_names = config.values["dataset"]["var_names"] var_units = config.values["dataset"]["var_units"]