From e5685b0f0abccab077fde69551c36aec5a943db1 Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Thu, 20 Jun 2024 14:16:39 -0600 Subject: [PATCH 1/6] Clean up query-building logic --- README.md | 6 +++++- pylib/embedding/pgvector.py | 7 ++++--- pylib/embedding/pgvector_data.py | 22 +++++++++++----------- 3 files changed, 20 insertions(+), 15 deletions(-) diff --git a/README.md b/README.md index e21da6f..9e5d78a 100644 --- a/README.md +++ b/README.md @@ -156,6 +156,10 @@ pytest test If you want to make contributions to the project, please [read these notes](https://github.com/OoriData/OgbujiPT/wiki/Notes-for-contributors). +# Resources + +* [Against mixing environment setup with code](https://huggingface.co/blog/ucheog/separate-env-setup-from-code) + # License Apache 2. For tha culture! @@ -189,7 +193,7 @@ I mentioned the bias to software engineering, but what does this mean? ## Does this support GPU for locally-hosted models -Yes, but you have to make sure you set up your back end LLm server (llama.cpp or text-generation-webui) with GPU, and properly configure the model you load into it. If you can use the webui to query your model and get GPU usage, that will also apply here in OgbujiPT. +Yes, but you have to make sure you set up your back end LLM server (llama.cpp or text-generation-webui) with GPU, and properly configure the model you load into it. Many install guides I've found for Mac, Linux and Windows touch on enabling GPU, but the ecosystem is still in its early days, and helpful resouces can feel scattered. diff --git a/pylib/embedding/pgvector.py b/pylib/embedding/pgvector.py index 86563d0..c09b7e6 100644 --- a/pylib/embedding/pgvector.py +++ b/pylib/embedding/pgvector.py @@ -93,9 +93,6 @@ def __init__(self, embedding_model, table_name: str, pool): else: raise ValueError('embedding_model must be a SentenceTransformer object or None') - self.table_name = table_name - self.pool = pool - @classmethod async def from_conn_params(cls, embedding_model, table_name, host, port, db_name, user, password) -> 'PGVectorHelper': # noqa: E501 ''' @@ -117,6 +114,10 @@ async def from_conn_params(cls, embedding_model, table_name, host, port, db_name async def init_pool(conn): ''' Initialize vector extension for a connection from a pool + + Can be invoked from upstream if they're managing the connection pool themselves + + If they choose to have us create a connection pool (e.g. from_conn_params), it will use this ''' await conn.execute('CREATE EXTENSION IF NOT EXISTS vector;') await register_vector(conn) diff --git a/pylib/embedding/pgvector_data.py b/pylib/embedding/pgvector_data.py index 9063d44..1cb6672 100644 --- a/pylib/embedding/pgvector_data.py +++ b/pylib/embedding/pgvector_data.py @@ -184,22 +184,17 @@ async def search( query_embedding = list(self._embedding_model.encode(text)) # Build where clauses - if threshold is None: - # No where clauses, so don't bother with the WHERE keyword - where_clauses = [] - query_args = [query_embedding] - else: # construct where clauses - where_clauses = [] - query_args = [query_embedding] - if threshold is not None: - query_args.append(threshold) - where_clauses.append(THRESHOLD_WHERE_CLAUSE.format(query_threshold=f'${len(query_args)+1}')) + query_args = [query_embedding] + where_clauses = [] + if threshold is not None: + query_args.append(threshold) + where_clauses.append(THRESHOLD_WHERE_CLAUSE.format(query_threshold=f'${len(query_args)}')) for mf in meta_filter: assert callable(mf), 'All meta_filter items must be callable' clause, pval = mf() - where_clauses.append(clause.format(len(query_args)+1)) query_args.append(pval) + where_clauses.append(clause.format(len(query_args))) where_clauses_str = 'WHERE\n' + 'AND\n'.join(where_clauses) if where_clauses else '' @@ -208,6 +203,11 @@ async def search( else: limit_clause = '' + # print(QUERY_DATA_TABLE.format(table_name=self.table_name, where_clauses=where_clauses_str, + # limit_clause=limit_clause, + # )) + # print(query_args) + # Execute the search via SQL async with self.pool.acquire() as conn: # Uncomment to debug From 0c071116260febdd6485e91728214828423753cc Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Sun, 23 Jun 2024 22:12:01 -0600 Subject: [PATCH 2/6] Explicit Python 3.12 support --- pylib/llm_wrapper.py | 3 +-- pyproject.toml | 4 ++-- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/pylib/llm_wrapper.py b/pylib/llm_wrapper.py index 9f2f9ef..6c97cf7 100644 --- a/pylib/llm_wrapper.py +++ b/pylib/llm_wrapper.py @@ -190,8 +190,7 @@ async def __call__(self, prompt, api_func=None, **kwargs): kwargs (dict, optional): Extra parameters to pass to the model via API. See Completions.create in OpenAI API, but in short, these: best_of, echo, frequency_penalty, logit_bias, logprobs, max_tokens, n - presence_penalty, seed, stop, stream, suffix, temperature, top_p, user -q + presence_penalty, seed, stop, stream, suffix, temperature, top_p, userq Returns: dict: JSON response from the LLM ''' diff --git a/pyproject.toml b/pyproject.toml index 749bec8..4f80c89 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -21,12 +21,12 @@ classifiers = [ "Programming Language :: Python", "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: 3.12", "Programming Language :: Python :: Implementation :: CPython", "Programming Language :: Python :: Implementation :: PyPy", ] dependencies = [ "openai>=1.1.0", - "python-dotenv", "tomli", "amara3.iri" ] @@ -78,7 +78,7 @@ cov = [ ] [[tool.hatch.envs.all.matrix]] -python = ["3.10", "3.11"] +python = ["3.10", "3.11", "3.12"] [tool.hatch.envs.lint] detached = true From 95fb488aa19d3956e66d548080114ac96e1530fd Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Mon, 24 Jun 2024 00:42:29 -0600 Subject: [PATCH 3/6] Update llm_wrapper.llm_response objects to handle tool calls. Clean up deprecated methods. --- pylib/llm_wrapper.py | 50 ++++++++------------------------------------ 1 file changed, 9 insertions(+), 41 deletions(-) diff --git a/pylib/llm_wrapper.py b/pylib/llm_wrapper.py index 6c97cf7..c449e1b 100644 --- a/pylib/llm_wrapper.py +++ b/pylib/llm_wrapper.py @@ -12,6 +12,7 @@ ''' import os +import json import asyncio import concurrent.futures from functools import partial @@ -70,8 +71,14 @@ def from_openai_chat(response): if 'message' in c: c['message'] = llm_response(c['message']) rc1 = resp['choices'][0] - # print(f'from_openai_chat: {rc1 =}') - resp['first_choice_text'] = rc1['text'] if 'text' in rc1 else rc1['message']['content'] + # No response message content if a tool call is invoked + if 'tool_calls' in rc1['message']: + # Why the hell does OpenAI have these arguments properties as plain text? Seems like a massive layering violation + for tc in rc1['message']['tool_calls']: + tc['function']['arguments_obj'] = json.loads(tc['function']['arguments']) + else: + resp['first_choice_text'] = rc1['text'] if 'text' in rc1 else rc1['message']['content'] + print('GRIPPO', f'from_openai_chat: {rc1 =}') else: resp['first_choice_text'] = resp['content'] return resp @@ -244,19 +251,6 @@ def available_models(self) -> List[str]: raise RuntimeError(f'Unexpected response from {self.base_url}/models:\n{repr(resp)}') return [ i['id'] for i in resp['data'] ] - @staticmethod - def first_choice_text(response): - ''' - Given an OpenAI-compatible API simple completion response, return the first choice text - ''' - warnings.warn('The first_choice_text method is deprecated; use the first_choice_text attribute or key instead', DeprecationWarning, stacklevel=2) # noqa E501 - try: - return response.choices[0].text - except AttributeError: - raise RuntimeError( - f'''Response does not appear to be an OpenAI API completion structure, as expected: -{repr(response)}''') - class openai_chat_api(openai_api): ''' @@ -322,19 +316,6 @@ async def __call__(self, prompt, api_func=None, **kwargs): # Haven't implemented any OpenAI API calls that are async, so just call the sync version return self.call(prompt, api_func, **kwargs) - @staticmethod - def first_choice_message(response): - ''' - Given an OpenAI-compatible API chat completion response, return the first choice message content - ''' - warnings.warn('The first_choice_message method is deprecated; use the first_choice_text attribute or key instead', DeprecationWarning, stacklevel=2) # noqa E501 - try: - return response.choices[0].message.content - except AttributeError: - raise RuntimeError( - f'''Response does not appear to be an OpenAI API chat-style completion structure, as expected: -{repr(response)}''') - class llama_cpp_http(llm_wrapper): ''' @@ -465,19 +446,6 @@ async def __call__(self, messages, req='/v1/chat/completions', timeout=30.0, api else: raise RuntimeError(f'Unexpected response from {self.base_url}{req}:\n{repr(result)}') - @staticmethod - def first_choice_message(response): - ''' - Given an OpenAI-compatible API chat completion response, return the first choice message content - ''' - warnings.warn('The first_choice_message method is deprecated; use the first_choice_text attribute or key instead', DeprecationWarning, stacklevel=2) # noqa E501 - try: - return response['choices'][0]['message']['content'] - except (IndexError, KeyError): - raise RuntimeError( - f'''Response does not appear to be a llama.cpp API chat-style completion structure, as expected: -{repr(response)}''') - class ctransformer: ''' From b2ea02af59a2944d08be312bf264287303b630e9 Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Mon, 24 Jun 2024 10:42:21 -0600 Subject: [PATCH 4/6] Index word loom items by their literal default language text, as well --- pylib/__about__.py | 2 +- pylib/word_loom.py | 13 ++++++++++--- 2 files changed, 11 insertions(+), 4 deletions(-) diff --git a/pylib/__about__.py b/pylib/__about__.py index 91abf7b..c328666 100644 --- a/pylib/__about__.py +++ b/pylib/__about__.py @@ -3,4 +3,4 @@ # SPDX-License-Identifier: Apache-2.0 # ogbujipt.about -__version__ = '0.9.2' +__version__ = '0.10.0' diff --git a/pylib/word_loom.py b/pylib/word_loom.py index 26385b6..c43740b 100644 --- a/pylib/word_loom.py +++ b/pylib/word_loom.py @@ -86,7 +86,9 @@ def clone(self, value=None, deflang=None, altlang=None, meta=None, markers=None) def load(fp_or_str, lang='en', preserve_key=False): ''' Read a word loom and return the tables as top-level result mapping - Loads the TOML, then selects text by given language + Loads the TOML + + Return a dict of the language items, indexed by the TOML key as well as its default language text fp_or_str - file-like object or string containing TOML lang - select oly texts in this language (default: 'en') @@ -97,9 +99,12 @@ def load(fp_or_str, lang='en', preserve_key=False): >>> loom = word_loom.load(fp) >>> loom['test_prompt_joke'].meta {'tag': 'humor', 'updated': '2024-01-01'} - >>> str(loom['test_prompt_joke']) + >>> actual_text = loom['test_prompt_joke'] + >>> str(actual_text) + 'Tell me a funny joke about {topic}\n' + >>> str(loom[str(actual_text)]) 'Tell me a funny joke about {topic}\n' - >>> loom['test_prompt_joke'].in_lang('fr') + >>> loom[str(actual_text)].in_lang('fr') 'Dites-moi une blague drôle sur {topic}\n' ''' # Ensure we have a file-like object @@ -136,4 +141,6 @@ def load(fp_or_str, lang='en', preserve_key=False): if preserve_key: meta['_key'] = k texts[k] = T(text, lang, altlang=altlang, meta=meta, markers=markers) + # Also index by literal text + texts[text] = T(text, lang, altlang=altlang, meta=meta, markers=markers) return texts From 7500e2ef37596ebc1d2afdb467106833919d3fad Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Mon, 24 Jun 2024 11:16:06 -0600 Subject: [PATCH 5/6] Fix tests --- pylib/llm_wrapper.py | 6 ++---- test/test_ogbujipt.py | 6 +++--- test/test_word_loom.py | 24 +++++++++++++++++------- 3 files changed, 22 insertions(+), 14 deletions(-) diff --git a/pylib/llm_wrapper.py b/pylib/llm_wrapper.py index c449e1b..9490ef7 100644 --- a/pylib/llm_wrapper.py +++ b/pylib/llm_wrapper.py @@ -17,7 +17,6 @@ import concurrent.futures from functools import partial from typing import List -import warnings from amara3 import iri @@ -72,13 +71,12 @@ def from_openai_chat(response): c['message'] = llm_response(c['message']) rc1 = resp['choices'][0] # No response message content if a tool call is invoked - if 'tool_calls' in rc1['message']: - # Why the hell does OpenAI have these arguments properties as plain text? Seems like a massive layering violation + if rc1.get('message', {}).get('tool_calls'): + # WTH does OpenAI have these arguments properties as plain text? Seems a massive layering violation for tc in rc1['message']['tool_calls']: tc['function']['arguments_obj'] = json.loads(tc['function']['arguments']) else: resp['first_choice_text'] = rc1['text'] if 'text' in rc1 else rc1['message']['content'] - print('GRIPPO', f'from_openai_chat: {rc1 =}') else: resp['first_choice_text'] = resp['content'] return resp diff --git a/test/test_ogbujipt.py b/test/test_ogbujipt.py index 2cc1ede..f8b460a 100644 --- a/test/test_ogbujipt.py +++ b/test/test_ogbujipt.py @@ -12,14 +12,14 @@ # import pytest -from ogbujipt.llm_wrapper import openai_chat_api +from ogbujipt.llm_wrapper import llm_response #, openai_chat_api def test_oapi_first_choice_text(OPENAI_TEXT_RESPONSE_OBJECT): - text1 = openai_chat_api.first_choice_text(OPENAI_TEXT_RESPONSE_OBJECT) + text1 = llm_response.from_openai_chat(OPENAI_TEXT_RESPONSE_OBJECT).first_choice_text assert text1 == '…is an exceptional employee who has made significant contributions to our company.' def test_oapi_first_choice_message(OPENAI_MSG_RESPONSE_OBJECT): - msg1 = openai_chat_api.first_choice_message(OPENAI_MSG_RESPONSE_OBJECT) + msg1 = llm_response.from_openai_chat(OPENAI_MSG_RESPONSE_OBJECT).first_choice_text assert msg1 == '…is an exceptional employee who has made significant contributions to our company.' diff --git a/test/test_word_loom.py b/test/test_word_loom.py index b22dcfe..5034a87 100644 --- a/test/test_word_loom.py +++ b/test/test_word_loom.py @@ -12,7 +12,7 @@ import os import sys -# import pkgutil +from itertools import chain import pytest @@ -49,9 +49,19 @@ def test_load_fp_vs_str(SAMPLE_TOML_STR, SAMPLE_TOML_FP): def test_sample_texts_check(SAMPLE_TOML_STR): # print(SAMPLE_TOML) loom = word_loom.load(SAMPLE_TOML_STR) - assert list(sorted(loom.keys())) == ['davinci3_instruct_system', 'hello_translated', 'i18n_context', 'write_i18n_advocacy'] - assert list(sorted([v[:20] for v in loom.values()])) == ['Hello', 'Internationalization', 'Obey the instruction', '{davinci3_instruct_s'] - assert [v.markers or [] for v in loom.values()] == [[], [], ['davinci3_instruct_system', 'i18n_context'], []] + # default language text is also a key + assert len(loom.keys()) == 8 + for k in ['davinci3_instruct_system', 'hello_translated', 'i18n_context', 'write_i18n_advocacy']: + assert k in loom.keys() + assert 'Hello' in loom.keys() + + # loom_dlt = set([v[:20] for v in loom.values()]) + + assert len(set(loom.values())) == 4 + for k in ['Hello', 'Internationalization', 'Obey the instruction', '{davinci3_instruct_s']: + assert k in [v[:20] for v in loom.values()] + + assert [v.markers or [] for v in loom.values()] == [[], [], [], [], ['davinci3_instruct_system', 'i18n_context'], ['davinci3_instruct_system', 'i18n_context'], [], []] assert loom['davinci3_instruct_system'].lang == 'en' # Default language is English @@ -59,9 +69,9 @@ def test_sample_texts_check(SAMPLE_TOML_STR): assert loom1 == loom loom = word_loom.load(SAMPLE_TOML_STR, lang='fr') - assert list(sorted(loom.keys())) == ['goodbye_translated', 'hardcoded_food', 'translate_request'] - assert list(sorted([v[:20] for v in loom.values()])) == ['Adieu', 'Comment dit-on en an', 'pomme de terre'] - assert [v.markers or [] for v in loom.values()] == [['hardcoded_food'], [], []] + assert list(sorted(loom.keys())) == ['Adieu', 'Comment dit-on en anglais: {hardcoded_food}?', 'goodbye_translated', 'hardcoded_food', 'pomme de terre', 'translate_request'] + assert list(sorted(set([v[:20] for v in loom.values()]))) == ['Adieu', 'Comment dit-on en an', 'pomme de terre'] + assert [v.markers or [] for v in loom.values()] == [['hardcoded_food'], ['hardcoded_food'], [], [], [], []] assert loom['hardcoded_food'].lang == 'fr' From b2ed163829a8e750d0601800687dea308f981554 Mon Sep 17 00:00:00 2001 From: Uche Ogbuji Date: Mon, 24 Jun 2024 11:41:05 -0600 Subject: [PATCH 6/6] CHANGELOG --- CHANGELOG.md | 21 +++++++++++++++++++++ pylib/__about__.py | 2 +- pylib/word_loom.py | 5 +++++ test/test_word_loom.py | 2 +- 4 files changed, 28 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 3d0cb00..d6a2539 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -7,6 +7,27 @@ Notable changes to Format based on [Keep a Changelog](https://keepachangelog.co --> +## [0.9.2] - 20240625 + +### Added + +- `joiner` param to `text_helper.text_split()` for better control of regex separator handling +- query filter mix-in, `embedding.pgvector.match_oneof()`, for use with `meta_filter` argument to `DB.search` + +### Changed + +- Index word loom items by their literal default language text, as well +- Cleaned up PGVector query-building logic + +### Fixed + +- `llm_wrapper.llm_response` objects to handle tool calls +- failure of some matching scenarios in `embedding.pgvector.match_exact()` + +### Removed + +- Previously deprecated `first_choice_text` & `first_choice_message` methods + ## [0.9.1] - 20240604 ### Fixed diff --git a/pylib/__about__.py b/pylib/__about__.py index c328666..91abf7b 100644 --- a/pylib/__about__.py +++ b/pylib/__about__.py @@ -3,4 +3,4 @@ # SPDX-License-Identifier: Apache-2.0 # ogbujipt.about -__version__ = '0.10.0' +__version__ = '0.9.2' diff --git a/pylib/word_loom.py b/pylib/word_loom.py index c43740b..711d71d 100644 --- a/pylib/word_loom.py +++ b/pylib/word_loom.py @@ -140,7 +140,12 @@ def load(fp_or_str, lang='en', preserve_key=False): meta = {kk: vv for kk, vv in v.items() if (not kk.startswith('_') and kk not in ('text', 'markers'))} if preserve_key: meta['_key'] = k + if k in texts: + warnings.warn(f'Key {k} duplicates an existing item, which will be overwritten') texts[k] = T(text, lang, altlang=altlang, meta=meta, markers=markers) # Also index by literal text + if text in texts: + warnings.warn( + f'Item default language text {text[:20]} duplicates an existing item, which will be overwritten') texts[text] = T(text, lang, altlang=altlang, meta=meta, markers=markers) return texts diff --git a/test/test_word_loom.py b/test/test_word_loom.py index 5034a87..136ead3 100644 --- a/test/test_word_loom.py +++ b/test/test_word_loom.py @@ -12,7 +12,7 @@ import os import sys -from itertools import chain +# from itertools import chain import pytest