fix project_slug error.

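Replace the hard-coded `ml_pipeline` name with `{{cookiecutter.project_name}}` or `{{cookiecutter.module_name}}` from cookiecutter.json, and move the files left under `{{cookiecutter.project_slug}}/` into `{{cookiecutter.project_name}}/`.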
2024-04-06 15:48:29 -07:00 · 2024-04-06 15:48:29 -07:00 · 6eed08d1ba
parent 727f16df57
commit 6eed08d1ba
43 changed files with 81 additions and 95 deletions
--- a/cookiecutter.json
+++ b/cookiecutter.json
@ -4,5 +4,8 @@
    "module_name": "{{ cookiecutter.repo_name }}",
    "author_name": "Your name (or your organization/company/team)",
    "description": "A short description of the project.",
-    "open_source_license": ["MIT", "BSD-3-Clause", "No license file"]
+    "open_source_license": ["MIT", "BSD-3-Clause", "No license file"],
    "_copy_without_render": [
        "docs/book"
    ]
 }
--- a/{{cookiecutter.project_name}}/.env.example
+++ b/{{cookiecutter.project_name}}/.env.example
@ -0,0 +1,7 @@
 MODEL__IN_CHANNELS=1
 MODEL__NUM_CLASSES=10
 DATA__TRAIN_PATH=/path/to/{{cookiecutter.project_name}}/data/mnist_train.csv
 DATA__TEST_PATH=/path/to/{{cookiecutter.project_name}}/data/mnist_test.csv
 PATHS__APP=/path/to/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/
 PATHS__ROOT=/path/to/{{cookiecutter.project_name}}/
 PATHS__DATA=/path/to/{{cookiecutter.project_name}}/data/
--- a/{{cookiecutter.project_name}}/LICENCE
+++ b/{{cookiecutter.project_name}}/LICENCE
--- a/{{cookiecutter.project_name}}/Makefile
+++ b/{{cookiecutter.project_name}}/Makefile
@ -1,30 +1,36 @@
-APP_NAME=ml_pipeline
+APP_NAME={{cookiecutter.module_name}}
 PYTHON=.venv/bin/python3
 INTERPRETER=/usr/bin/python3
 .PHONY: help test
-all: run
+all: help
 init: ## create a venv
 	$(INTERPRETER) -m venv .venv
-
+	cp .env.example .env
 run: ## run the pipeline (train)
 	$(PYTHON) -m $(APP_NAME) pipeline:train 
 data: ## download the mnist data
 	$(PYTHON) -m $(APP_NAME) data:download 
 	# wget https://pjreddie.com/media/files/mnist_train.csv -O data/mnist_train.csv
 	# wget https://pjreddie.com/media/files/mnist_test.csv -O data/mnist_test.csv
 test:
 	find . -iname "*.py" | entr -c pytest
 serve:
 	$(PYTHON) -m $(APP_NAME) app:serve
 install:
 	$(PYTHON) -m pip install -r requirements.txt
 data: ## download the mnist data
 	$(PYTHON) -m $(APP_NAME) data:download 
 run: ## run the pipeline (train)
 	$(PYTHON) -m $(APP_NAME) pipeline:train 
 serve: ## start fastapi uvicorn server
 	$(PYTHON) -m $(APP_NAME) app:serve
 docs: ## serve the mdbook docs directory
 	mdbook serve docs
 test: ## run pytest tests
 	$(PYTHON) -m pytest
 test-watch: ## run pytest on .py changes
 	find . -iname "*.py" | entr -c $(PYTHON) -m pytest
 help: ## display this help message
-	@grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | sort | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36m%-30s\033[0m %s\n", $$1, $$2}'
+	@echo "available commands:"
 	@grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | sort | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36mmake %-30s\033[0m %s\n", $$1, $$2}'
--- a/{{cookiecutter.project_name}}/README.md
+++ b/{{cookiecutter.project_name}}/README.md
--- a/{{cookiecutter.project_name}}/docs/.gitignore
+++ b/{{cookiecutter.project_name}}/docs/.gitignore
--- a/{{cookiecutter.project_name}}/docs/book.toml
+++ b/{{cookiecutter.project_name}}/docs/book.toml
@ -3,4 +3,4 @@ authors = ["publicmatt"]
 language = "en"
 multilingual = false
 src = "src"
-title = "ml_pipeline"
+title = "{{cookiecutter.project_name}}"
--- a/{{cookiecutter.project_name}}/docs/src/SUMMARY.md
+++ b/{{cookiecutter.project_name}}/docs/src/SUMMARY.md
--- a/{{cookiecutter.project_name}}/docs/src/chapter_1.md
+++ b/{{cookiecutter.project_name}}/docs/src/chapter_1.md
--- a/{{cookiecutter.project_name}}/docs/src/index.md
+++ b/{{cookiecutter.project_name}}/docs/src/index.md
--- a/{{cookiecutter.project_name}}/pyproject.toml
+++ b/{{cookiecutter.project_name}}/pyproject.toml
@ -3,7 +3,7 @@ requires = ["setuptools", "wheel"]
 build-backend = "setuptools.build_meta"
 [project]
-name = "ml_pipeline"
+name = "{{cookiecutter.project_name}}"
 version = "0.1.0"
 authors = [
    {name = "publicmatt", email = "git@publicmatt.com"},
@ -18,7 +18,6 @@ dependencies = [
    "numpy==1.26.4",
    "pytest==8.1.1",
    "pytest-cov==5.0.0",
    "python-dotenv==1.0.1",
    "requests==2.31.0",
    "torch==2.2.2",
    "torchvision==0.17.2",
@ -37,11 +36,11 @@ repository = "https://example.com/my_project/repo"
 documentation = "https://example.com/my_project/docs"
 [tool.setuptools]
-packages = ["ml_pipeline"]
+packages = ["{{cookiecutter.module_name}}"]
 [tool.pytest.ini_options]
 # Measure coverage of the package with pytest-cov and print the report to the terminal
-addopts = "--cov=ml_pipeline --cov-report=term"
+addopts = "--cov={{cookiecutter.module_name}} --cov-report=term"
 # Specify the paths to look for tests
 testpaths = [
    "test",
--- a/{{cookiecutter.project_name}}/requirements.txt
+++ b/{{cookiecutter.project_name}}/requirements.txt
--- a/{{cookiecutter.project_name}}/test/.env.test
+++ b/{{cookiecutter.project_name}}/test/.env.test
--- a/{{cookiecutter.project_name}}/test/test_cnn.py
+++ b/{{cookiecutter.project_name}}/test/test_cnn.py
@ -0,0 +1,6 @@
 from {{cookiecutter.module_name}} import config
 from {{cookiecutter.module_name}}.model.cnn import VGG11
 def test_in_channels():
    assert config.model.name == 'vgg11' 
--- a/{{cookiecutter.project_name}}/test/test_inputs.py
+++ b/{{cookiecutter.project_name}}/test/test_inputs.py
@ -1,5 +1,5 @@
-from ml_pipeline.data.dataset import MnistDataset
+from {{cookiecutter.module_name}}.data.dataset import MnistDataset
-from ml_pipeline import config
+from {{cookiecutter.module_name}} import config
 from pathlib import Path
 import pytest
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/__init__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/__init__.py
@ -5,7 +5,7 @@ pwd = Path(__file__).parent
 config_path = pwd / 'config'
 root_path = pwd.parent
 config = ConfigurationSet(
-    config_from_env(prefix="ML_PIPELINE", separator="__", lowercase_keys=True),
+    config_from_env(prefix="{{cookiecutter.module_name.upper()}}", separator="__", lowercase_keys=True),
    config_from_dotenv(root_path / ".env", read_from_file=True, lowercase_keys=True, interpolate=True, interpolate_type=1),
    config_from_toml(config_path / "training.toml", read_from_file=True),
    config_from_toml(config_path / "data.toml", read_from_file=True),
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/__main__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/__main__.py
@ -0,0 +1,5 @@
 from {{cookiecutter.module_name}}.cli import cli
 if __name__ == "__main__":
    cli()
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/app/__init__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/app/__init__.py
@ -0,0 +1,11 @@
 from {{cookiecutter.module_name}} import config
 from fastapi import FastAPI, Response
 import logging
 import uvicorn
 app = FastAPI()
 logger = logging.getLogger(__name__)
 def run():
    uvicorn.run("{{cookiecutter.module_name}}.app:app", host=config.app.host, port=config.app.port, proxy_headers=True)
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/batch.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/batch.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/cli.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/cli.py
@ -4,38 +4,38 @@ import click
@click.version_option()
 def cli():
    """
-    ml_pipeline: a template for building, training and running pytorch models.
+    build, train and run machine learning models.
    """
@cli.command("pipeline:train")
 def pipeline_train():
    """run the training pipeline with train data"""
-    from ml_pipeline.training import pipeline
+    from {{cookiecutter.module_name}}.training import pipeline
    pipeline.run(evaluate=False)
@cli.command("pipeline:evaluate")
 def pipeline_evaluate():
    """run the training pipeline with test data"""
-    from ml_pipeline.training import pipeline
+    from {{cookiecutter.module_name}}.training import pipeline
    pipeline.run(evaluate=True)
@cli.command("app:serve")
 def app_serve():
    """run the api server pipeline with pretrained model"""
-    from ml_pipeline import app
+    from {{cookiecutter.module_name}} import app
    app.run()
@cli.command("data:download")
 def data_download():
    """download the train and test data"""
-    from ml_pipeline import data
+    from {{cookiecutter.module_name}} import data
-    from ml_pipeline import config
+    from {{cookiecutter.module_name}} import config
    from pathlib import Path
    data.download(Path(config.paths.data))
@cli.command("data:debug")
 def data_debug():
    """debug the dataset class"""
-    from ml_pipeline.data import dataset
+    from {{cookiecutter.module_name}}.data import dataset
    dataset.debug()
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/common.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/common.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/app.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/app.toml
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/config.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/config.toml
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/data.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/data.toml
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/model.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/model.toml
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/paths.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/paths.toml
@ -1,4 +1,4 @@
 [paths]
 repo = "/path/to/root"
-app = "/path/to/root/ml_pipeline"
+app = "/path/to/root/{{cookiecutter.module_name}}"
 data = "/path/to/root/data"
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/training.toml
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/config/training.toml
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/__init__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/__init__.py
@ -1,7 +1,7 @@
 from pathlib import Path
 import requests
 import logging
-from ml_pipeline import config
+from {{cookiecutter.module_name}} import config
 logger = logging.getLogger(__name__)
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/dataset.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/dataset.py
@ -5,7 +5,7 @@ import csv
 import torch
 from pathlib import Path
 from typing import Tuple
-from ml_pipeline import config, logger
+from {{cookiecutter.module_name}} import config, logger
 class MnistDataset(Dataset):
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/make.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/make.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/spark.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/data/spark.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/features/make.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/features/make.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/__init__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/__init__.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/cnn.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/cnn.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/linear.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/model/linear.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/notebooks/features.ipynb
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/notebooks/features.ipynb
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/notebooks/main.ipynb
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/notebooks/main.ipynb
@ -8,7 +8,7 @@
   "outputs": [],
   "source": [
    "# Now you can import your package\n",
-    "import ml_pipeline"
+    "import {{cookiecutter.module_name}}"
   ]
  },
  {
@ -18,7 +18,7 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "from ml_pipeline.data.dataset import MnistDataset"
+    "from {{cookiecutter.module_name}}.data.dataset import MnistDataset"
   ]
  },
  {
@ -28,38 +28,9 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "from ml_pipeline import config"
+    "from {{cookiecutter.module_name}} import config"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "c8ce7920-c056-44ac-93df-b25bae870592",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<ConfigurationSet: 0x7fcf70fc1a50>"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "config"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "83293ef7-37b3-452f-8de5-13bee633d099",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/__init__.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/__init__.py
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/pipeline.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/pipeline.py
@ -1,8 +1,8 @@
 from torch.utils.data import DataLoader
 from torch.optim import AdamW
-from ml_pipeline.training.runner import Runner
+from {{cookiecutter.module_name}}.training.runner import Runner
-from ml_pipeline import config, logger
+from {{cookiecutter.module_name}} import config, logger
 def run(evaluate=False):
@ -30,8 +30,8 @@ def run(evaluate=False):
            logger.info(f"{step}")
 def get_model(name='vgg11'):
-    from ml_pipeline.model.linear import DNN
+    from {{cookiecutter.module_name}}.model.linear import DNN
-    from ml_pipeline.model.cnn import VGG11
+    from {{cookiecutter.module_name}}.model.cnn import VGG11
    if name == 'vgg11':
        return VGG11(config.data.in_channels, config.data.num_classes)
    else:
@ -43,7 +43,7 @@ def get_model(name='vgg11'):
 def get_dataset(evaluate=False):
    # Usage
-    from ml_pipeline.data.dataset import MnistDataset
+    from {{cookiecutter.module_name}}.data.dataset import MnistDataset
    from torchvision import transforms
    csv_file_path = config.data.train_path if not evaluate else config.data.test_path
    transform = transforms.Compose([
--- a/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/runner.py
+++ b/{{cookiecutter.project_name}}/{{cookiecutter.module_name}}/training/runner.py
--- a/{{cookiecutter.project_slug}}/test/test_cnn.py
+++ b/{{cookiecutter.project_slug}}/test/test_cnn.py
@ -1,6 +0,0 @@
 from ml_pipeline import config
 from ml_pipeline.model.cnn import VGG11
 def test_in_channels():
    assert config.model.name == 'vgg11' 
--- a/{{cookiecutter.project_slug}}/{{cookiecutter.module_name}}/__main__.py
+++ b/{{cookiecutter.project_slug}}/{{cookiecutter.module_name}}/__main__.py
@ -1,5 +0,0 @@
 from ml_pipeline.cli import cli
 if __name__ == "__main__":
    cli()
--- a/{{cookiecutter.project_slug}}/{{cookiecutter.module_name}}/app/__init__.py
+++ b/{{cookiecutter.project_slug}}/{{cookiecutter.module_name}}/app/__init__.py
@ -1,11 +0,0 @@
 from ml_pipeline import config
 from fastapi import FastAPI, Response
 import logging
 import uvicorn
 app = FastAPI()
 logger = logging.getLogger(__name__)
 def run():
    uvicorn.run("ml_pipeline.app:app", host=config.app.host, port=config.app.port, proxy_headers=True)