diff --git a/CHANGELOG.md b/CHANGELOG.md index 3181cd9..5c7080a 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,8 @@ # Changelog +## [Version 0.2.0](https://github.com/dataiku/dss-plugin-nlp-analysis/releases/tag/v0.2.0) +- Add support for python v3.8 to v3.10 + ## [Version 0.1.1](https://github.com/dataiku/dss-plugin-nlp-analysis/releases/tag/v0.1.1) - Fix sudachipy version not being compatible with python 3.6 anymore diff --git a/LICENSE b/LICENSE index 7bd383d..d0b2a96 100644 --- a/LICENSE +++ b/LICENSE @@ -186,7 +186,7 @@ same "printed page" as the copyright notice for easier identification within third-party archives. - Copyright 2021 Dataiku + Copyright 2023 Dataiku Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. diff --git a/code-env/python/desc.json b/code-env/python/desc.json index 21d8a3f..c2494d8 100644 --- a/code-env/python/desc.json +++ b/code-env/python/desc.json @@ -1,10 +1,13 @@ { "acceptedPythonInterpreters": [ "PYTHON36", - "PYTHON37" + "PYTHON37", + "PYTHON38", + "PYTHON39", + "PYTHON310" ], "forceConda": false, "installCorePackages": true, "installJupyterSupport": true, - "corePackagesSet": "PANDAS10" + "corePackagesSet": "AUTO" } diff --git a/plugin.json b/plugin.json index fd9fd48..7a34ff0 100644 --- a/plugin.json +++ b/plugin.json @@ -1,6 +1,6 @@ { "id": "nlp-analysis", - "version": "0.1.1", + "version": "0.2.0", "meta": { "label": "Text Analysis", "category": "Natural Language Processing", diff --git a/python-lib/nlp/spacy_tokenizer.py b/python-lib/nlp/spacy_tokenizer.py index 51bcfb5..7940f90 100644 --- a/python-lib/nlp/spacy_tokenizer.py +++ b/python-lib/nlp/spacy_tokenizer.py @@ -26,7 +26,6 @@ SPACY_LANGUAGE_MODELS_MORPHOLOGIZER, ) from utils.cleaning_utils import generate_unique, truncate_text_list -from utils.cleaning_utils import truncate_text_list # Setting custom spaCy token extensions to allow for easier filtering in downstream tasks 
# Register the custom `is_hashtag` token extension: True when the token text begins with "#".
# `str.startswith` is used rather than indexing `text[0]` so that a token whose text is empty
# evaluates to False instead of raising IndexError.
Token.set_extension("is_hashtag", getter=lambda token: token.text.startswith("#"), force=True)