Show details for query tokens (#1392)

2024-07-05 00:10:56 +05:30
parent ea09b5f7f0
commit 4880557d51
25 changed files with 1825 additions and 517 deletions
--- a/tests/llm/test_cohere.py
+++ b/tests/llm/test_cohere.py
@@ -9,7 +9,7 @@ from embedchain.llm.cohere import CohereLlm
@pytest.fixture
 def cohere_llm_config():
    os.environ["COHERE_API_KEY"] = "test_api_key"
-    config = BaseLlmConfig(model="gptd-instruct-tft", max_tokens=50, temperature=0.7, top_p=0.8)
+    config = BaseLlmConfig(model="command-r", max_tokens=100, temperature=0.7, top_p=0.8, token_usage=False)
    yield config
    os.environ.pop("COHERE_API_KEY")

@@ -36,10 +36,35 @@ def test_get_llm_model_answer(cohere_llm_config, mocker):
    assert answer == "Test answer"


+def test_get_llm_model_answer_with_token_usage(cohere_llm_config, mocker):
+    test_config = BaseLlmConfig(
+        temperature=cohere_llm_config.temperature,
+        max_tokens=cohere_llm_config.max_tokens,
+        top_p=cohere_llm_config.top_p,
+        model=cohere_llm_config.model,
+        token_usage=True,
+    )
+    mocker.patch(
+        "embedchain.llm.cohere.CohereLlm._get_answer",
+        return_value=("Test answer", {"input_tokens": 1, "output_tokens": 2}),
+    )
+
+    llm = CohereLlm(test_config)
+    answer, token_info = llm.get_llm_model_answer("Test query")
+
+    assert answer == "Test answer"
+    assert token_info == {
+        "prompt_tokens": 1,
+        "completion_tokens": 2,
+        "total_tokens": 3,
+        "total_cost": 3.5e-06,
+        "cost_currency": "USD",
+    }
+
+
 def test_get_answer_mocked_cohere(cohere_llm_config, mocker):
-    mocked_cohere = mocker.patch("embedchain.llm.cohere.Cohere")
-    mock_instance = mocked_cohere.return_value
-    mock_instance.invoke.return_value = "Mocked answer"
+    mocked_cohere = mocker.patch("embedchain.llm.cohere.ChatCohere")
+    mocked_cohere.return_value.invoke.return_value.content = "Mocked answer"

    llm = CohereLlm(cohere_llm_config)
    prompt = "Test query"