Skip to content

Commit

Permalink
Register full embedding model names (#654)
Browse files Browse the repository at this point in the history
Provide backward-compatible aliases.
This makes available the same model names that ttok uses.
  • Loading branch information
web-sst authored Jan 23, 2025
1 parent 5998374 commit 6f7ea40
Show file tree
Hide file tree
Showing 3 changed files with 9 additions and 9 deletions.
12 changes: 6 additions & 6 deletions llm/default_plugins/openai_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -134,14 +134,14 @@ def register_models(register):
@hookimpl
def register_embedding_models(register):
register(
OpenAIEmbeddingModel("ada-002", "text-embedding-ada-002"), aliases=("ada",)
OpenAIEmbeddingModel("text-embedding-ada-002", "text-embedding-ada-002"), aliases=("ada","ada-002",)
)
register(OpenAIEmbeddingModel("3-small", "text-embedding-3-small"))
register(OpenAIEmbeddingModel("3-large", "text-embedding-3-large"))
register(OpenAIEmbeddingModel("text-embedding-3-small", "text-embedding-3-small"), aliases=("3-small",))
register(OpenAIEmbeddingModel("text-embedding-3-large", "text-embedding-3-large"), aliases=("3-large",))
# With varying dimensions
register(OpenAIEmbeddingModel("3-small-512", "text-embedding-3-small", 512))
register(OpenAIEmbeddingModel("3-large-256", "text-embedding-3-large", 256))
register(OpenAIEmbeddingModel("3-large-1024", "text-embedding-3-large", 1024))
register(OpenAIEmbeddingModel("text-embedding-3-small-512", "text-embedding-3-small", 512), aliases=("3-small-512",))
register(OpenAIEmbeddingModel("text-embedding-3-large-256", "text-embedding-3-large", 256), aliases=("3-large-256",))
register(OpenAIEmbeddingModel("text-embedding-3-large-1024", "text-embedding-3-large", 1024), aliases=("3-large-1024",))


class OpenAIEmbeddingModel(EmbeddingModel):
Expand Down
4 changes: 2 additions & 2 deletions tests/test_aliases.py
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@ def test_cli_aliases_list(args):
"gpt4 : gpt-4\n"
"4-32k : gpt-4-32k\n"
"e-demo : embed-demo (embedding)\n"
"ada : ada-002 (embedding)\n"
"ada : text-embedding-ada-002 (embedding)\n"
).split("\n"):
line = line.strip()
if not line:
Expand All @@ -65,7 +65,7 @@ def test_cli_aliases_list_json(args):
"4": "gpt-4",
"gpt4": "gpt-4",
"4-32k": "gpt-4-32k",
"ada": "ada-002",
"ada": "text-embedding-ada-002",
"e-demo": "embed-demo",
}.items()
)
Expand Down
2 changes: 1 addition & 1 deletion tests/test_embed_cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -554,7 +554,7 @@ def test_default_embedding_model():
assert result2.exit_code == 0
result3 = runner.invoke(cli, ["embed-models", "default"])
assert result3.exit_code == 0
assert result3.output == "ada-002\n"
assert result3.output == "text-embedding-ada-002\n"
result4 = runner.invoke(cli, ["embed-models", "default", "--remove-default"])
assert result4.exit_code == 0
result5 = runner.invoke(cli, ["embed-models", "default"])
Expand Down

0 comments on commit 6f7ea40

Please sign in to comment.