From fda4ac90e610e09f3f87288deff8fee05fbc77b2 Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Thu, 14 Nov 2024 17:23:15 -0500 Subject: [PATCH 01/11] update python --- .github/workflows/tests.yml | 8 ++++---- README.md | 2 +- setup.py | 9 ++++++--- tox.ini | 8 ++++---- 4 files changed, 15 insertions(+), 12 deletions(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 0eb0022..7aa16ec 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -32,7 +32,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: [3.6, 3.7, 3.8] + python-version: ['3.8', '3.9', '3.10', '3.11'] os: [ubuntu-20.04, macos-latest] steps: - uses: actions/checkout@v1 @@ -53,7 +53,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: ['3.6', '3.7', '3.8', '3.9', '3.10', '3.11'] + python-version: ['3.8', '3.9', '3.10', '3.11', '3.12', '3.13'] os: [ubuntu-20.04, macos-latest] steps: - uses: actions/checkout@v1 @@ -70,7 +70,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: [3.6, 3.7, 3.8] + python-version: ['3.8', '3.9', '3.10', '3.11'] os: [ubuntu-20.04, macos-latest] steps: - uses: actions/checkout@v1 @@ -91,7 +91,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: [3.6, 3.7, 3.8] + python-version: ['3.8', '3.9', '3.10', '3.11'] os: [ubuntu-20.04] steps: - uses: actions/checkout@v1 diff --git a/README.md b/README.md index 662a3ed..541d8d1 100644 --- a/README.md +++ b/README.md @@ -50,7 +50,7 @@ Features include: ## Requirements -**MLBlocks** has been developed and tested on [Python 3.6, 3.7, 3.8, 3.9, and 3.10](https://www.python.org/downloads/) +**MLBlocks** has been developed and tested on [Python 3.6, 3.7, 3.8, 3.9, 3.10, 3.11, 3.12, 3.13](https://www.python.org/downloads/) ## Install with `pip` diff --git a/setup.py b/setup.py index c741ead..6510a13 100644 --- a/setup.py +++ b/setup.py @@ -14,8 +14,8 @@ install_requires = [ 'graphviz>=0.9,<1', - 'numpy>=1.17.1,<2', - 'psutil>=5,<6', + 'numpy>=1.17.1,<3', + 'psutil>=5,<7', ] @@ -99,6 +99,9 @@ 'Programming Language :: Python :: 3.9', 'Programming Language :: Python :: 3.10', 'Programming Language :: Python :: 3.11', + 'Programming Language :: Python :: 3.12', + 'Programming Language :: Python :: 3.13', + ], description='Pipelines and primitives for machine learning and data science.', extras_require={ @@ -116,7 +119,7 @@ long_description_content_type='text/markdown', name='mlblocks', packages=find_packages(include=['mlblocks', 'mlblocks.*']), - python_requires='>=3.6,<3.12', + python_requires='>=3.6,<3.14', setup_requires=setup_requires, test_suite='tests', tests_require=tests_require, diff --git a/tox.ini b/tox.ini index 27e499e..cdaadc2 100644 --- a/tox.ini +++ b/tox.ini @@ -3,12 +3,12 @@ envlist = py3{6,7,8,9,10,11}, test-devel [travis] python = - 3.11: py11 - 3.10: py10 + 3.13: py313 + 3.12: py312 + 3.11: py311 + 3.10: py310 3.9: py39 3.8: py38, test-devel - 3.7: py37 - 3.6: py36 [testenv] passenv = CI TRAVIS TRAVIS_* From 72df9bb0eb75cb1ac8116ee4b2af04707a09444b Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Thu, 14 Nov 2024 17:32:59 -0500 Subject: [PATCH 02/11] update dependencies --- setup.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/setup.py b/setup.py index 6510a13..3091819 100644 --- a/setup.py +++ b/setup.py @@ -20,15 +20,15 @@ mlprimitives_requires = [ - 'mlprimitives>=0.3.0,<0.4', - 'h5py<2.11.0,>=2.10.0', # <- tensorflow 2.3.2 conflict - 'matplotlib<3.2.2,>=2.2.2', # <- copulas 0.3.3 + 'mlprimitives>=0.4.0,<0.5', + 'h5py<4,>=2.10.0', # <- tensorflow 2.3.2 conflict + 'matplotlib<4,>=2.2.2', # <- copulas 0.3.3 'protobuf<4', # <- importlib ] examples_require = mlprimitives_requires + [ 'jupyter==1.0.0', - 'baytune>=0.4.0,<0.5', + 'baytune>=0.4.0,<0.6', ] @@ -50,7 +50,7 @@ # general 'bumpversion>=0.5.3,<0.6', 'pip>=9.0.1', - 'watchdog>=0.8.3,<0.11', + 'watchdog>=0.8.3,<5', # docs 'm2r>=0.2.0,<0.3', From 1c7210538271368696327724a1fdb1d8bcd1e21e Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Thu, 14 Nov 2024 17:51:30 -0500 Subject: [PATCH 03/11] mute simpleimputer for now --- README.md | 2 +- examples/tutorials/1. Using and MLPipeline.ipynb | 2 +- examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb | 2 +- examples/tutorials/4. Saving and Loading a Pipeline.ipynb | 2 +- .../tutorials/5. Partial execution and pipeline debugging.ipynb | 2 +- examples/tutorials/6. Flexible outputs specification.ipynb | 2 +- setup.py | 1 + 7 files changed, 7 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index 541d8d1..431f1c7 100644 --- a/README.md +++ b/README.md @@ -99,7 +99,7 @@ X_train, X_test, y_train, y_test = train_test_split(dataset, label, stratify=lab primitives = [ 'mlprimitives.custom.preprocessing.ClassEncoder', 'mlprimitives.custom.feature_extraction.CategoricalEncoder', - 'sklearn.impute.SimpleImputer', + # 'sklearn.impute.SimpleImputer', 'xgboost.XGBClassifier', 'mlprimitives.custom.preprocessing.ClassDecoder' ] diff --git a/examples/tutorials/1. Using and MLPipeline.ipynb b/examples/tutorials/1. Using and MLPipeline.ipynb index 901cc50..bc25fe9 100644 --- a/examples/tutorials/1. Using and MLPipeline.ipynb +++ b/examples/tutorials/1. Using and MLPipeline.ipynb @@ -361,7 +361,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " 'sklearn.impute.SimpleImputer',\n", + " # 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb b/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb index 7aa0ab2..6aacc15 100644 --- a/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb +++ b/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb @@ -54,7 +54,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " 'sklearn.impute.SimpleImputer',\n", + " # 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/4. Saving and Loading a Pipeline.ipynb b/examples/tutorials/4. Saving and Loading a Pipeline.ipynb index ec1c6f9..35c42df 100644 --- a/examples/tutorials/4. Saving and Loading a Pipeline.ipynb +++ b/examples/tutorials/4. Saving and Loading a Pipeline.ipynb @@ -60,7 +60,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " 'sklearn.impute.SimpleImputer',\n", + " # 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/5. Partial execution and pipeline debugging.ipynb b/examples/tutorials/5. Partial execution and pipeline debugging.ipynb index 769a69c..96adb0e 100644 --- a/examples/tutorials/5. Partial execution and pipeline debugging.ipynb +++ b/examples/tutorials/5. Partial execution and pipeline debugging.ipynb @@ -275,7 +275,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " 'sklearn.impute.SimpleImputer',\n", + " # 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/6. Flexible outputs specification.ipynb b/examples/tutorials/6. Flexible outputs specification.ipynb index 6ecad5a..c1fc84b 100644 --- a/examples/tutorials/6. Flexible outputs specification.ipynb +++ b/examples/tutorials/6. Flexible outputs specification.ipynb @@ -62,7 +62,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " 'sklearn.impute.SimpleImputer',\n", + " # 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/setup.py b/setup.py index 3091819..850b8d0 100644 --- a/setup.py +++ b/setup.py @@ -57,6 +57,7 @@ 'Sphinx>=1.7.1,<3', 'sphinx_rtd_theme>=0.2.4,<0.5', 'docutils>=0.12,<0.18', + 'lxml_html_clean>=0.2.2', 'ipython>=6.5.0', 'autodocsumm>=0.1.10', 'Jinja2>=2,<3', # >=3 makes sphinx theme fail From 4f4c94ae256d748f00cd44de4f78e2bc90295692 Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Thu, 14 Nov 2024 18:04:00 -0500 Subject: [PATCH 04/11] edit docs --- examples/tutorials/6. Flexible outputs specification.ipynb | 2 +- setup.py | 3 +-- 2 files changed, 2 insertions(+), 3 deletions(-) diff --git a/examples/tutorials/6. Flexible outputs specification.ipynb b/examples/tutorials/6. Flexible outputs specification.ipynb index c1fc84b..5a1ba1d 100644 --- a/examples/tutorials/6. Flexible outputs specification.ipynb +++ b/examples/tutorials/6. Flexible outputs specification.ipynb @@ -432,7 +432,7 @@ ], "source": [ "output_spec = [\n", - " 'sklearn.impute.SimpleImputer#1.X',\n", + " # 'sklearn.impute.SimpleImputer#1.X',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.y',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.classes',\n", "]\n", diff --git a/setup.py b/setup.py index 850b8d0..e54291b 100644 --- a/setup.py +++ b/setup.py @@ -53,11 +53,10 @@ 'watchdog>=0.8.3,<5', # docs - 'm2r>=0.2.0,<0.3', + 'm2r2>=0.2.5,<0.3', 'Sphinx>=1.7.1,<3', 'sphinx_rtd_theme>=0.2.4,<0.5', 'docutils>=0.12,<0.18', - 'lxml_html_clean>=0.2.2', 'ipython>=6.5.0', 'autodocsumm>=0.1.10', 'Jinja2>=2,<3', # >=3 makes sphinx theme fail From 1d8879dd1490e73c080c92bfad96f6d940957324 Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Thu, 14 Nov 2024 18:11:22 -0500 Subject: [PATCH 05/11] change image --- .github/workflows/tests.yml | 2 +- .../tutorials/6. Flexible outputs specification.ipynb | 8 ++++---- setup.py | 6 ++---- 3 files changed, 7 insertions(+), 9 deletions(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 7aa16ec..854ebaf 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -12,7 +12,7 @@ jobs: strategy: matrix: python-version: [3.8] - os: [ubuntu-latest] + os: [ubuntu-20.04] steps: - uses: actions/checkout@v1 - name: Set up Python ${{ matrix.python-version }} diff --git a/examples/tutorials/6. Flexible outputs specification.ipynb b/examples/tutorials/6. Flexible outputs specification.ipynb index 5a1ba1d..fee2cba 100644 --- a/examples/tutorials/6. Flexible outputs specification.ipynb +++ b/examples/tutorials/6. Flexible outputs specification.ipynb @@ -436,7 +436,7 @@ " 'mlprimitives.custom.preprocessing.ClassEncoder#1.y',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.classes',\n", "]\n", - "X, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" + "y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" ] }, { @@ -463,11 +463,11 @@ "source": [ "output_spec = [\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder#1.X',\n", - " 'sklearn.impute.SimpleImputer#1.X',\n", + " # 'sklearn.impute.SimpleImputer#1.X',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.y',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.classes',\n", "]\n", - "X_1, X_2, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" + "X_1, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" ] }, { @@ -507,7 +507,7 @@ } ], "source": [ - "X_2.shape" + "X_1.shape" ] } ], diff --git a/setup.py b/setup.py index e54291b..51974f0 100644 --- a/setup.py +++ b/setup.py @@ -53,7 +53,7 @@ 'watchdog>=0.8.3,<5', # docs - 'm2r2>=0.2.5,<0.3', + 'm2r>=0.2.0,<0.3', 'Sphinx>=1.7.1,<3', 'sphinx_rtd_theme>=0.2.4,<0.5', 'docutils>=0.12,<0.18', @@ -93,8 +93,6 @@ 'License :: OSI Approved :: MIT License', 'Natural Language :: English', 'Programming Language :: Python :: 3', - 'Programming Language :: Python :: 3.6', - 'Programming Language :: Python :: 3.7', 'Programming Language :: Python :: 3.8', 'Programming Language :: Python :: 3.9', 'Programming Language :: Python :: 3.10', @@ -119,7 +117,7 @@ long_description_content_type='text/markdown', name='mlblocks', packages=find_packages(include=['mlblocks', 'mlblocks.*']), - python_requires='>=3.6,<3.14', + python_requires='>=3.8,<3.14', setup_requires=setup_requires, test_suite='tests', tests_require=tests_require, From 298ee434403477295dd6e1e5c0fdb7c78fa34bf0 Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 11:47:51 -0500 Subject: [PATCH 06/11] restore tutorials --- README.md | 2 +- examples/tutorials/1. Using and MLPipeline.ipynb | 2 +- .../3. Setting MLPipeline Hyperparameters.ipynb | 2 +- .../tutorials/4. Saving and Loading a Pipeline.ipynb | 2 +- ...5. Partial execution and pipeline debugging.ipynb | 2 +- .../6. Flexible outputs specification.ipynb | 12 ++++++------ 6 files changed, 11 insertions(+), 11 deletions(-) diff --git a/README.md b/README.md index 431f1c7..541d8d1 100644 --- a/README.md +++ b/README.md @@ -99,7 +99,7 @@ X_train, X_test, y_train, y_test = train_test_split(dataset, label, stratify=lab primitives = [ 'mlprimitives.custom.preprocessing.ClassEncoder', 'mlprimitives.custom.feature_extraction.CategoricalEncoder', - # 'sklearn.impute.SimpleImputer', + 'sklearn.impute.SimpleImputer', 'xgboost.XGBClassifier', 'mlprimitives.custom.preprocessing.ClassDecoder' ] diff --git a/examples/tutorials/1. Using and MLPipeline.ipynb b/examples/tutorials/1. Using and MLPipeline.ipynb index bc25fe9..901cc50 100644 --- a/examples/tutorials/1. Using and MLPipeline.ipynb +++ b/examples/tutorials/1. Using and MLPipeline.ipynb @@ -361,7 +361,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " # 'sklearn.impute.SimpleImputer',\n", + " 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb b/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb index 6aacc15..7aa0ab2 100644 --- a/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb +++ b/examples/tutorials/3. Setting MLPipeline Hyperparameters.ipynb @@ -54,7 +54,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " # 'sklearn.impute.SimpleImputer',\n", + " 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/4. Saving and Loading a Pipeline.ipynb b/examples/tutorials/4. Saving and Loading a Pipeline.ipynb index 35c42df..ec1c6f9 100644 --- a/examples/tutorials/4. Saving and Loading a Pipeline.ipynb +++ b/examples/tutorials/4. Saving and Loading a Pipeline.ipynb @@ -60,7 +60,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " # 'sklearn.impute.SimpleImputer',\n", + " 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/5. Partial execution and pipeline debugging.ipynb b/examples/tutorials/5. Partial execution and pipeline debugging.ipynb index 96adb0e..769a69c 100644 --- a/examples/tutorials/5. Partial execution and pipeline debugging.ipynb +++ b/examples/tutorials/5. Partial execution and pipeline debugging.ipynb @@ -275,7 +275,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " # 'sklearn.impute.SimpleImputer',\n", + " 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", diff --git a/examples/tutorials/6. Flexible outputs specification.ipynb b/examples/tutorials/6. Flexible outputs specification.ipynb index fee2cba..6ecad5a 100644 --- a/examples/tutorials/6. Flexible outputs specification.ipynb +++ b/examples/tutorials/6. Flexible outputs specification.ipynb @@ -62,7 +62,7 @@ "primitives = [\n", " 'mlprimitives.custom.preprocessing.ClassEncoder',\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder',\n", - " # 'sklearn.impute.SimpleImputer',\n", + " 'sklearn.impute.SimpleImputer',\n", " 'xgboost.XGBClassifier',\n", " 'mlprimitives.custom.preprocessing.ClassDecoder'\n", "]\n", @@ -432,11 +432,11 @@ ], "source": [ "output_spec = [\n", - " # 'sklearn.impute.SimpleImputer#1.X',\n", + " 'sklearn.impute.SimpleImputer#1.X',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.y',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.classes',\n", "]\n", - "y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" + "X, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" ] }, { @@ -463,11 +463,11 @@ "source": [ "output_spec = [\n", " 'mlprimitives.custom.feature_extraction.CategoricalEncoder#1.X',\n", - " # 'sklearn.impute.SimpleImputer#1.X',\n", + " 'sklearn.impute.SimpleImputer#1.X',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.y',\n", " 'mlprimitives.custom.preprocessing.ClassEncoder#1.classes',\n", "]\n", - "X_1, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" + "X_1, X_2, y, classes = pipeline.fit(X_train, y_train, output_=output_spec)" ] }, { @@ -507,7 +507,7 @@ } ], "source": [ - "X_1.shape" + "X_2.shape" ] } ], From a7bc200399e56366f1984ca23148e82902f913e6 Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 11:48:10 -0500 Subject: [PATCH 07/11] fix devel tests --- .github/workflows/tests.yml | 6 +++--- setup.py | 9 +++++++++ 2 files changed, 12 insertions(+), 3 deletions(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 854ebaf..e2aaf6a 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -11,8 +11,8 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: [3.8] - os: [ubuntu-20.04] + python-version: [3.10] + os: [ubuntu-latest] steps: - uses: actions/checkout@v1 - name: Set up Python ${{ matrix.python-version }} @@ -20,7 +20,7 @@ jobs: with: python-version: ${{ matrix.python-version }} - name: Upgrade pip - run: pip install -U pip setuptools wheel + run: pip install -U "pip<=24.1" setuptools wheel - name: Install lightfm run: python -m pip install --no-use-pep517 'lightfm<2' - name: Install package diff --git a/setup.py b/setup.py index 51974f0..6599e69 100644 --- a/setup.py +++ b/setup.py @@ -62,6 +62,15 @@ 'Jinja2>=2,<3', # >=3 makes sphinx theme fail 'markupsafe<2.1.0', + # fails on Sphinx < v3.4 + 'alabaster<=0.7.12', + # fails on Sphins < v5.0 + 'sphinxcontrib-applehelp<1.0.8', + 'sphinxcontrib-devhelp<1.0.6', + 'sphinxcontrib-htmlhelp<2.0.5', + 'sphinxcontrib-serializinghtml<1.1.10', + 'sphinxcontrib-qthelp<1.0.7', + # style check 'flake8>=3.7.7,<4', 'isort>=4.3.4,<5', From 3a061cde399bf63608caa62196f5511e94cf065e Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 12:15:29 -0500 Subject: [PATCH 08/11] change btb to baytune --- examples/tutorials/7. Tuning a Pipeline.ipynb | 4 ++-- .../8. Searching for the best pipeline with BTBSession.ipynb | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/examples/tutorials/7. Tuning a Pipeline.ipynb b/examples/tutorials/7. Tuning a Pipeline.ipynb index 7a288a4..a87c54e 100644 --- a/examples/tutorials/7. Tuning a Pipeline.ipynb +++ b/examples/tutorials/7. Tuning a Pipeline.ipynb @@ -242,7 +242,7 @@ "metadata": {}, "outputs": [], "source": [ - "from btb.tuning import Tunable\n", + "from baytune.tuning import Tunable\n", "\n", "tunable = Tunable.from_dict(tunable_hyperparameters)" ] @@ -265,7 +265,7 @@ "metadata": {}, "outputs": [], "source": [ - "from btb.tuning import GPTuner\n", + "from baytune.tuning import GPTuner\n", "\n", "tuner = GPTuner(tunable)" ] diff --git a/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb b/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb index 80ad93f..65071ea 100644 --- a/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb +++ b/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb @@ -286,7 +286,7 @@ "metadata": {}, "outputs": [], "source": [ - "from btb.session import BTBSession\n", + "from baytune.session import BTBSession\n", "\n", "session = BTBSession(tunables, cross_validate, verbose=True)" ] From 97f3177b66f0f9b38baca72852f927d3d7b174aa Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 12:16:35 -0500 Subject: [PATCH 09/11] fix python specification --- .github/workflows/tests.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index e2aaf6a..cbadf80 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -11,7 +11,7 @@ jobs: runs-on: ${{ matrix.os }} strategy: matrix: - python-version: [3.10] + python-version: ['3.10'] os: [ubuntu-latest] steps: - uses: actions/checkout@v1 From 6950d4d453a35c627e8a0fdac255b80990c5988a Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 13:05:29 -0500 Subject: [PATCH 10/11] cap copulas at 0.11 --- examples/tutorials/7. Tuning a Pipeline.ipynb | 27 +- ...or the best pipeline with BTBSession.ipynb | 239 ++++++------------ setup.py | 6 +- 3 files changed, 94 insertions(+), 178 deletions(-) diff --git a/examples/tutorials/7. Tuning a Pipeline.ipynb b/examples/tutorials/7. Tuning a Pipeline.ipynb index a87c54e..484e0b2 100644 --- a/examples/tutorials/7. Tuning a Pipeline.ipynb +++ b/examples/tutorials/7. Tuning a Pipeline.ipynb @@ -181,7 +181,7 @@ { "data": { "text/plain": [ - "0.8639171383183359" + "0.863978563379761" ] }, "execution_count": 6, @@ -210,7 +210,7 @@ { "data": { "text/plain": [ - "0.8686773872402614" + "0.868554574842" ] }, "execution_count": 7, @@ -345,16 +345,15 @@ "output_type": "stream", "text": [ "scoring pipeline 1\n", + "New best found: 0.871994161365419\n", "scoring pipeline 2\n", + "New best found: 0.8723319756253888\n", "scoring pipeline 3\n", "scoring pipeline 4\n", - "New best found: 0.8642241881762839\n", "scoring pipeline 5\n", "scoring pipeline 6\n", "scoring pipeline 7\n", - "New best found: 0.8644390957265209\n", "scoring pipeline 8\n", - "New best found: 0.8679095503945804\n", "scoring pipeline 9\n", "scoring pipeline 10\n" ] @@ -395,13 +394,13 @@ "data": { "text/plain": [ "{('mlprimitives.custom.feature_extraction.CategoricalEncoder#1',\n", - " 'max_labels'): 39,\n", - " ('sklearn.impute.SimpleImputer#1', 'strategy'): 'most_frequent',\n", - " ('xgboost.XGBClassifier#1', 'n_estimators'): 70,\n", - " ('xgboost.XGBClassifier#1', 'max_depth'): 6,\n", - " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.07406443671152008,\n", - " ('xgboost.XGBClassifier#1', 'gamma'): 0.9244108160038952,\n", - " ('xgboost.XGBClassifier#1', 'min_child_weight'): 1}" + " 'max_labels'): 60,\n", + " ('sklearn.impute.SimpleImputer#1', 'strategy'): 'mean',\n", + " ('xgboost.XGBClassifier#1', 'n_estimators'): 190,\n", + " ('xgboost.XGBClassifier#1', 'max_depth'): 5,\n", + " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.13575511242790694,\n", + " ('xgboost.XGBClassifier#1', 'gamma'): 0.6326488945712287,\n", + " ('xgboost.XGBClassifier#1', 'min_child_weight'): 8}" ] }, "execution_count": 13, @@ -443,7 +442,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -457,7 +456,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.9" + "version": "3.10.15" } }, "nbformat": 4, diff --git a/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb b/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb index 65071ea..a7e9d69 100644 --- a/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb +++ b/examples/tutorials/8. Searching for the best pipeline with BTBSession.ipynb @@ -157,7 +157,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 6, @@ -314,12 +314,12 @@ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "342fe40f08024adcb5b60eea25f49d37", + "model_id": "00c20e4b982f42a1873c0d12f550ee4b", "version_major": 2, "version_minor": 0 }, "text/plain": [ - "HBox(children=(FloatProgress(value=0.0, max=5.0), HTML(value='')))" + " 0%| | 0/5 [00:00\", line 11, in cross_validate\n", + " File \"/var/folders/by/d1f3gk0x14v54qggfxmjbn1c0000gn/T/ipykernel_19852/2674531477.py\", line 11, in cross_validate\n", " pipeline.fit(X_train, y_train)\n", - " File \"/home/xals/Projects/MIT/MLBlocks.clean/mlblocks/mlpipeline.py\", line 754, in fit\n", - " block, block_name, context, output_variables, outputs, debug_info)\n", - " File \"/home/xals/Projects/MIT/MLBlocks.clean/mlblocks/mlpipeline.py\", line 645, in _produce_block\n", + " File \"/Users/sarah/Documents/git-repos/MLBlocks/mlblocks/mlpipeline.py\", line 805, in fit\n", + " self._produce_block(\n", + " File \"/Users/sarah/Documents/git-repos/MLBlocks/mlblocks/mlpipeline.py\", line 679, in _produce_block\n", " block_outputs = block.produce(**produce_args)\n", - " File \"/home/xals/Projects/MIT/MLBlocks.clean/mlblocks/mlblock.py\", line 322, in produce\n", + " File \"/Users/sarah/Documents/git-repos/MLBlocks/mlblocks/mlblock.py\", line 331, in produce\n", " return getattr(self.instance, self.produce_method)(**produce_kwargs)\n", - " File \"/home/xals/.virtualenvs/MLBlocks.clean/lib/python3.6/site-packages/mlprimitives/custom/text.py\", line 111, in produce\n", + " File \"/Users/sarah/Documents/git-repos/MLPrimitives/mlprimitives/custom/text.py\", line 111, in produce\n", " texts = X[self.column]\n", - " File \"/home/xals/.virtualenvs/MLBlocks.clean/lib/python3.6/site-packages/pandas/core/frame.py\", line 2927, in __getitem__\n", + " File \"/opt/anaconda3/envs/py10/lib/python3.10/site-packages/pandas/core/frame.py\", line 3807, in __getitem__\n", " indexer = self.columns.get_loc(key)\n", - " File \"/home/xals/.virtualenvs/MLBlocks.clean/lib/python3.6/site-packages/pandas/core/indexes/base.py\", line 2659, in get_loc\n", - " return self._engine.get_loc(self._maybe_cast_indexer(key))\n", - " File \"pandas/_libs/index.pyx\", line 108, in pandas._libs.index.IndexEngine.get_loc\n", - " File \"pandas/_libs/index.pyx\", line 132, in pandas._libs.index.IndexEngine.get_loc\n", - " File \"pandas/_libs/hashtable_class_helper.pxi\", line 1601, in pandas._libs.hashtable.PyObjectHashTable.get_item\n", - " File \"pandas/_libs/hashtable_class_helper.pxi\", line 1608, in pandas._libs.hashtable.PyObjectHashTable.get_item\n", + " File \"/opt/anaconda3/envs/py10/lib/python3.10/site-packages/pandas/core/indexes/base.py\", line 3804, in get_loc\n", + " raise KeyError(key) from err\n", "KeyError: 'text'\n", - "2020-09-16 16:32:46,587 - WARNING - btb.session - Too many errors: 1. Removing tunable single_table.classification.text\n", - "2020-09-16 16:32:46,589 - INFO - btb.session - Creating Tunable instance from dict.\n", - "2020-09-16 16:32:46,589 - INFO - btb.session - Obtaining default configuration for single_table.classification.xgb\n", - "2020-09-16 16:32:52,100 - INFO - btb.session - Generating new proposal configuration for single_table.classification\n", - "2020-09-16 16:33:28,900 - INFO - btb.session - New optimal found: single_table.classification - 0.8728234138413778\n", - "2020-09-16 16:33:28,904 - INFO - btb.session - Generating new proposal configuration for single_table.classification.xgb\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n" + "Too many errors: 1. Removing tunable single_table.classification.text\n" ] }, { "data": { "text/plain": [ - "{'id': '7e662f9b90f0e123939b7532ecc221c7',\n", - " 'name': 'single_table.classification',\n", + "{'id': '0ebe8af9c06a05f39821de36d6c9ffc2',\n", + " 'name': 'single_table.classification.xgb',\n", " 'config': {('mlprimitives.custom.feature_extraction.CategoricalEncoder#1',\n", - " 'max_labels'): 63,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'lowercase'): True,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'binary'): True,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'max_features'): 7315,\n", + " 'max_labels'): 52,\n", " ('sklearn.impute.SimpleImputer#1', 'strategy'): 'median',\n", - " ('xgboost.XGBClassifier#1', 'n_estimators'): 879,\n", - " ('xgboost.XGBClassifier#1', 'max_depth'): 3,\n", - " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.23231879890615814,\n", - " ('xgboost.XGBClassifier#1', 'gamma'): 0.5474914147721585,\n", - " ('xgboost.XGBClassifier#1', 'min_child_weight'): 3},\n", - " 'score': 0.8728234138413778}" + " ('xgboost.XGBClassifier#1', 'n_estimators'): 313,\n", + " ('xgboost.XGBClassifier#1', 'max_depth'): 5,\n", + " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.7119589664956909,\n", + " ('xgboost.XGBClassifier#1', 'gamma'): 0.944854007471167,\n", + " ('xgboost.XGBClassifier#1', 'min_child_weight'): 10},\n", + " 'score': 0.8641320270062784}" ] }, "execution_count": 11, @@ -489,23 +458,17 @@ { "data": { "text/plain": [ - "{'id': '7e662f9b90f0e123939b7532ecc221c7',\n", - " 'name': 'single_table.classification',\n", + "{'id': '0ebe8af9c06a05f39821de36d6c9ffc2',\n", + " 'name': 'single_table.classification.xgb',\n", " 'config': {('mlprimitives.custom.feature_extraction.CategoricalEncoder#1',\n", - " 'max_labels'): 63,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'lowercase'): True,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'binary'): True,\n", - " ('mlprimitives.custom.feature_extraction.StringVectorizer#1',\n", - " 'max_features'): 7315,\n", + " 'max_labels'): 52,\n", " ('sklearn.impute.SimpleImputer#1', 'strategy'): 'median',\n", - " ('xgboost.XGBClassifier#1', 'n_estimators'): 879,\n", - " ('xgboost.XGBClassifier#1', 'max_depth'): 3,\n", - " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.23231879890615814,\n", - " ('xgboost.XGBClassifier#1', 'gamma'): 0.5474914147721585,\n", - " ('xgboost.XGBClassifier#1', 'min_child_weight'): 3},\n", - " 'score': 0.8728234138413778}" + " ('xgboost.XGBClassifier#1', 'n_estimators'): 313,\n", + " ('xgboost.XGBClassifier#1', 'max_depth'): 5,\n", + " ('xgboost.XGBClassifier#1', 'learning_rate'): 0.7119589664956909,\n", + " ('xgboost.XGBClassifier#1', 'gamma'): 0.944854007471167,\n", + " ('xgboost.XGBClassifier#1', 'min_child_weight'): 10},\n", + " 'score': 0.8641320270062784}" ] }, "execution_count": 12, @@ -539,71 +502,31 @@ { "data": { "application/vnd.jupyter.widget-view+json": { - "model_id": "8dd5d4626f304c279b2b368a671b6cb7", + "model_id": "a0dbe69a0340455a937f7376f7723ec4", "version_major": 2, "version_minor": 0 }, "text/plain": [ - "HBox(children=(FloatProgress(value=0.0, max=20.0), HTML(value='')))" + " 0%| | 0/10 [00:00=0.4.0,<0.6', + 'baytune>=0.5.0,<0.6', + 'copulas<0.12', ] @@ -105,10 +106,9 @@ 'Programming Language :: Python :: 3.8', 'Programming Language :: Python :: 3.9', 'Programming Language :: Python :: 3.10', - 'Programming Language :: Python :: 3.11', + 'Programming Language :: Python :: 3.11', 'Programming Language :: Python :: 3.12', 'Programming Language :: Python :: 3.13', - ], description='Pipelines and primitives for machine learning and data science.', extras_require={ From 80448670693f0a01de77c995c70c3c86965a155f Mon Sep 17 00:00:00 2001 From: Sarah Alnegheimish Date: Fri, 15 Nov 2024 13:42:02 -0500 Subject: [PATCH 11/11] update readme --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 541d8d1..fb5ba34 100644 --- a/README.md +++ b/README.md @@ -50,7 +50,7 @@ Features include: ## Requirements -**MLBlocks** has been developed and tested on [Python 3.6, 3.7, 3.8, 3.9, 3.10, 3.11, 3.12, 3.13](https://www.python.org/downloads/) +**MLBlocks** has been developed and tested on [Python 3.8, 3.9, 3.10, 3.11, 3.12, 3.13](https://www.python.org/downloads/) ## Install with `pip`