From 10a7388c394c6a87cd63da438dd691734cd19a8a Mon Sep 17 00:00:00 2001 From: JP Hwang Date: Wed, 3 Jul 2024 20:21:54 +0100 Subject: [PATCH 1/3] Add kagome_kr to docstring --- weaviate/collections/classes/config.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/weaviate/collections/classes/config.py b/weaviate/collections/classes/config.py index 0b6fb881b..10ce2a096 100644 --- a/weaviate/collections/classes/config.py +++ b/weaviate/collections/classes/config.py @@ -137,6 +137,8 @@ class Tokenization(str, Enum): Tokenize using GSE (for Chinese and Japanese). `TRIGRAM` Tokenize into trigrams. + `KAGOME_KR` + Tokenize using the 'Kagome' tokenizer and a Korean MeCab dictionary (for Korean). """ WORD = "word" From 28871f892cbea02bb31278cf8e98d15144e32332 Mon Sep 17 00:00:00 2001 From: JP Hwang Date: Mon, 1 Jul 2024 16:06:47 +0100 Subject: [PATCH 2/3] Add kagome validation --- weaviate/collections/classes/config.py | 1 + 1 file changed, 1 insertion(+) diff --git a/weaviate/collections/classes/config.py b/weaviate/collections/classes/config.py index 10ce2a096..49384402a 100644 --- a/weaviate/collections/classes/config.py +++ b/weaviate/collections/classes/config.py @@ -147,6 +147,7 @@ class Tokenization(str, Enum): FIELD = "field" GSE = "gse" TRIGRAM = "trigram" + KAGOME_KR = "kagome_kr" class GenerativeSearches(str, Enum): From 640db5cee8d8c2c637fb9d89172948b7c073a6b1 Mon Sep 17 00:00:00 2001 From: Dirk Kulawiak Date: Fri, 19 Jul 2024 06:10:24 +0200 Subject: [PATCH 3/3] changelog and embedded increase --- docs/changelog.rst | 12 ++++++++++++ weaviate/embedded.py | 2 +- 2 files changed, 13 insertions(+), 1 deletion(-) diff --git a/docs/changelog.rst b/docs/changelog.rst index b87c5e466..2afe9c7f8 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -1,6 +1,18 @@ Changelog ========= +Version 4.6.7 +-------------- + +This patch version includes: + +- Fix batching with references. 
Under some circumstances a reference could be added before its ``to``-object and the reference would be lost. +- Fix node status for timed-out nodes +- Fix parsing the year 0. While Weaviate allows adding dates with year zero ("0000-01-30T00:00:00Z"), the datetime library is based on the Gregorian calendar, which does not have a year zero. The client will parse dates with year 0 as the minimum date that is possible in datetime (``datetime.datetime(1, 1, 1, 0, 0)``) and emit a warning. +- Support for custom rerankers and generative modules using ``Configure.Generative.custom()`` and ``Configure.Reranker.custom()`` +- Add support for kagome_kr tokenizer. Requires Weaviate 1.25.8 +- Increase default embedded version to 1.25.8 + Version 4.6.6 -------------- diff --git a/weaviate/embedded.py b/weaviate/embedded.py index d737ec182..a7d2064bb 100644 --- a/weaviate/embedded.py +++ b/weaviate/embedded.py @@ -35,7 +35,7 @@ class EmbeddedOptions: persistence_data_path: str = os.environ.get("XDG_DATA_HOME", DEFAULT_PERSISTENCE_DATA_PATH) binary_path: str = os.environ.get("XDG_CACHE_HOME", DEFAULT_BINARY_PATH) - version: str = "1.23.7" + version: str = "1.25.8" port: int = DEFAULT_PORT hostname: str = "127.0.0.1" additional_env_vars: Optional[Dict[str, str]] = None