Fix rc and add async tests (#407)

* Fix type
* Add async tests
* Drop tests.yml
* Add chat stream tests
cohere-ai · Mar 18, 2024 · 77e0087 · 77e0087
1 parent 372bb05
commit 77e0087
Show file tree

Hide file tree

Showing 5 changed files with 332 additions and 45 deletions.
diff --git a/.fernignore b/.fernignore
@@ -4,4 +4,5 @@ README.md
 src/cohere/client.py
 tests
 .github/workflows/ci.yml
-LICENSE
+LICENSE
+.github/workflows/tests.yml
diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
diff --git a/src/cohere/client.py b/src/cohere/client.py
@@ -3,7 +3,7 @@
 import httpx
 
 from .base_client import BaseCohere, AsyncBaseCohere
-from .environment import CohereEnvironment
+from .environment import ClientEnvironment
 
 # Use NoReturn as Never type for compatibility
 Never = typing.NoReturn
@@ -59,7 +59,7 @@ def __init__(
             api_key: typing.Union[str, typing.Callable[[], str]],
             *,
             base_url: typing.Optional[str] = None,
-            environment: CohereEnvironment = CohereEnvironment.PRODUCTION,
+            environment: ClientEnvironment = ClientEnvironment.PRODUCTION,
             client_name: typing.Optional[str] = None,
             timeout: typing.Optional[float] = 60,
             httpx_client: typing.Optional[httpx.Client] = None,
@@ -128,7 +128,7 @@ def __init__(
             api_key: typing.Union[str, typing.Callable[[], str]],
             *,
             base_url: typing.Optional[str] = None,
-            environment: CohereEnvironment = CohereEnvironment.PRODUCTION,
+            environment: ClientEnvironment = ClientEnvironment.PRODUCTION,
             client_name: typing.Optional[str] = None,
             timeout: typing.Optional[float] = 60,
             httpx_client: typing.Optional[httpx.AsyncClient] = None,

diff --git a/tests/test_async_client.py b/tests/test_async_client.py
@@ -0,0 +1,310 @@
+import os
+import unittest
+from time import sleep
+
+import cohere
+from cohere import ChatMessage, ChatConnector, ClassifyExample, CreateConnectorServiceAuth, Tool, \
+    ToolParameterDefinitionsValue, ChatRequestToolResultsItem
+
+co = cohere.AsyncClient(os.environ['COHERE_API_KEY'], timeout=10000)
+
+package_dir = os.path.dirname(os.path.abspath(__file__))
+embed_job = os.path.join(package_dir, 'embed_job.jsonl')
+
+
+class TestClient(unittest.TestCase):
+
+    async def test_chat(self) -> None:
+        chat = await co.chat(
+            chat_history=[
+                ChatMessage(role="USER",
+                            message="Who discovered gravity?"),
+                ChatMessage(role="CHATBOT", message="The man who is widely credited with discovering "
+                                                    "gravity is Sir Isaac Newton")
+            ],
+            message="What year was he born?",
+            connectors=[ChatConnector(id="web-search")]
+        )
+
+        print(chat)
+
+    async def test_chat_stream(self) -> None:
+        stream = co.chat_stream(
+            chat_history=[
+                ChatMessage(role="USER",
+                            message="Who discovered gravity?"),
+                ChatMessage(role="CHATBOT", message="The man who is widely credited with discovering "
+                                                    "gravity is Sir Isaac Newton")
+            ],
+            message="What year was he born?",
+            connectors=[ChatConnector(id="web-search")]
+        )
+
+        async for chat_event in stream:
+            if chat_event.event_type == "text-generation":
+                print(chat_event.text)
+
+    async def test_stream_equals_true(self) -> None:
+        with self.assertRaises(ValueError):
+            await co.chat(
+                stream=True,  # type: ignore
+                message="What year was he born?",
+            )
+
+    async def test_deprecated_fn(self) -> None:
+        with self.assertRaises(ValueError):
+            await co.check_api_key("dummy", dummy="dummy")  # type: ignore
+
+    async def test_moved_fn(self) -> None:
+        with self.assertRaises(ValueError):
+            await co.list_connectors("dummy", dummy="dummy")  # type: ignore
+
+    async def test_generate(self) -> None:
+        response = await co.generate(
+            prompt='Please explain to me how LLMs work',
+        )
+        print(response)
+
+    async def test_embed(self) -> None:
+        response = await co.embed(
+            texts=['hello', 'goodbye'],
+            model='embed-english-v3.0',
+            input_type="classification"
+        )
+        print(response)
+
+    async def test_embed_job_crud(self) -> None:
+        dataset = await co.datasets.create(
+            name="test",
+            type="embed-input",
+            data=open(embed_job, 'rb'),
+        )
+
+        while True:
+            ds = await co.datasets.get(dataset.id or "")
+            sleep(2)
+            print(ds, flush=True)
+            if ds.dataset.validation_status != "processing":
+                break
+
+        # start an embed job
+        job = await co.embed_jobs.create(
+            dataset_id=dataset.id or "",
+            input_type="search_document",
+            model='embed-english-v3.0')
+
+        print(job)
+
+        # list embed jobs
+        my_embed_jobs = await co.embed_jobs.list()
+
+        print(my_embed_jobs)
+
+        while True:
+            em = await co.embed_jobs.get(job.job_id)
+            sleep(2)
+            print(em, flush=True)
+            if em.status != "processing":
+                break
+
+        await co.embed_jobs.cancel(job.job_id)
+
+        await co.datasets.delete(dataset.id or "")
+
+    async def test_rerank(self) -> None:
+        docs = [
+            'Carson City is the capital city of the American state of Nevada.',
+            'The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean. Its capital is Saipan.',
+            'Washington, D.C. (also known as simply Washington or D.C., and officially as the District of Columbia) is the capital of the United States. It is a federal district.',
+            'Capital punishment (the death penalty) has existed in the United States since beforethe United States was a country. As of 2017, capital punishment is legal in 30 of the 50 states.']
+
+        response = await co.rerank(
+            model='rerank-english-v2.0',
+            query='What is the capital of the United States?',
+            documents=docs,
+            top_n=3,
+        )
+
+        print(response)
+
+    async def test_classify(self) -> None:
+        examples = [
+            ClassifyExample(text="Dermatologists don't like her!", label="Spam"),
+            ClassifyExample(text="'Hello, open to this?'", label="Spam"),
+            ClassifyExample(
+                text="I need help please wire me $1000 right now", label="Spam"),
+            ClassifyExample(text="Nice to know you ;)", label="Spam"),
+            ClassifyExample(text="Please help me?", label="Spam"),
+            ClassifyExample(
+                text="Your parcel will be delivered today", label="Not spam"),
+            ClassifyExample(
+                text="Review changes to our Terms and Conditions", label="Not spam"),
+            ClassifyExample(text="Weekly sync notes", label="Not spam"),
+            ClassifyExample(
+                text="'Re: Follow up from today's meeting'", label="Not spam"),
+            ClassifyExample(text="Pre-read for tomorrow", label="Not spam"),
+        ]
+        inputs = [
+            "Confirm your email address",
+            "hey i need u to send some $",
+        ]
+        response = await co.classify(
+            inputs=inputs,
+            examples=examples,
+        )
+        print(response)
+
+    async def test_datasets_crud(self) -> None:
+        my_dataset = await co.datasets.create(
+            name="test",
+            type="embed-input",
+            data=open(embed_job, 'rb'),
+        )
+
+        print(my_dataset)
+
+        my_datasets = await co.datasets.list()
+
+        print(my_datasets)
+
+        dataset = await co.datasets.get(my_dataset.id or "")
+
+        print(dataset)
+
+        await co.datasets.delete(my_dataset.id or "")
+
+    async def test_summarize(self) -> None:
+        text = (
+            "Ice cream is a sweetened frozen food typically eaten as a snack or dessert. "
+            "It may be made from milk or cream and is flavoured with a sweetener, "
+            "either sugar or an alternative, and a spice, such as cocoa or vanilla, "
+            "or with fruit such as strawberries or peaches. "
+            "It can also be made by whisking a flavored cream base and liquid nitrogen together. "
+            "Food coloring is sometimes added, in addition to stabilizers. "
+            "The mixture is cooled below the freezing point of water and stirred to incorporate air spaces "
+            "and to prevent detectable ice crystals from forming. The result is a smooth, "
+            "semi-solid foam that is solid at very low temperatures (below 2 °C or 35 °F). "
+            "It becomes more malleable as its temperature increases.\n\n"
+            "The meaning of the name \"ice cream\" varies from one country to another. "
+            "In some countries, such as the United States, \"ice cream\" applies only to a specific variety, "
+            "and most governments regulate the commercial use of the various terms according to the "
+            "relative quantities of the main ingredients, notably the amount of cream. "
+            "Products that do not meet the criteria to be called ice cream are sometimes labelled "
+            "\"frozen dairy dessert\" instead. In other countries, such as Italy and Argentina, "
+            "one word is used fo\r all variants. Analogues made from dairy alternatives, "
+            "such as goat's or sheep's milk, or milk substitutes "
+            "(e.g., soy, cashew, coconut, almond milk or tofu), are available for those who are "
+            "lactose intolerant, allergic to dairy protein or vegan."
+        )
+
+        response = await co.summarize(
+            text=text,
+        )
+
+        print(response)
+
+    async def test_tokenize(self) -> None:
+        response = await co.tokenize(
+            text='tokenize me! :D',
+            model='command'
+        )
+        print(response)
+
+    async def test_detokenize(self) -> None:
+        response = await co.detokenize(
+            tokens=[10104, 12221, 1315, 34, 1420, 69],
+            model="command"
+        )
+        print(response)
+
+    async def test_connectors_crud(self) -> None:
+        created_connector = await co.connectors.create(
+            name="Example connector",
+            url="https://dummy-connector-o5btz7ucgq-uc.a.run.app/search",
+            service_auth=CreateConnectorServiceAuth(
+                token="dummy-connector-token",
+                type="bearer",
+            )
+        )
+        print(created_connector)
+
+        connector = await co.connectors.get(created_connector.connector.id)
+
+        print(connector)
+
+        updated_connector = await co.connectors.update(
+            id=connector.connector.id, name="new name")
+
+        print(updated_connector)
+
+        await co.connectors.delete(created_connector.connector.id)
+
+    async def test_tool_use(self) -> None:
+        tools = [
+            Tool(
+                name="sales_database",
+                description="Connects to a database about sales volumes",
+                parameter_definitions={
+                    "day": ToolParameterDefinitionsValue(
+                        description="Retrieves sales data from this day, formatted as YYYY-MM-DD.",
+                        type="str",
+                        required=True
+                    )}
+            )
+        ]
+
+        tool_parameters_response = await co.chat(
+            message="How good were the sales on September 29?",
+            tools=tools,
+            model="command-nightly",
+            preamble="""
+                ## Task Description
+                You help people answer their questions and other requests interactively. You will be asked a very wide array of requests on all kinds of topics. You will be equipped with a wide range of search engines or similar tools to help you, which you use to research your answer. You should focus on serving the user's needs as best you can, which will be wide-ranging.
+    
+                ## Style Guide
+                Unless the user asks for a different style of answer, you should answer in full sentences, using proper grammar and spelling.
+            """
+        )
+
+        if tool_parameters_response.tool_calls is not None:
+            self.assertEqual(tool_parameters_response.tool_calls[0].name, "sales_database")
+            self.assertEqual(tool_parameters_response.tool_calls[0].parameters, {"day": "2023-09-29"})
+        else:
+            raise ValueError("Expected tool calls to be present")
+
+        local_tools = {
+            "sales_database": lambda day: {
+                "number_of_sales": 120,
+                "total_revenue": 48500,
+                "average_sale_value": 404.17,
+                "date": "2023-09-29"
+            }
+        }
+
+        tool_results = []
+        for tool_call in tool_parameters_response.tool_calls:
+            output = local_tools[tool_call.name](**tool_call.parameters)
+            outputs = [output]
+
+            tool_results.append(ChatRequestToolResultsItem(
+                call=tool_call,
+                outputs=outputs
+            ))
+
+        cited_response = await co.chat(
+            message="How good were the sales on September 29?",
+            tools=tools,
+            tool_results=tool_results,
+            model="command-nightly",
+        )
+
+        self.assertEqual(cited_response.documents, [
+            {
+                "tool_name": "sales_database",
+                "average_sale_value": "404.17",
+                "date": "2023-09-29",
+                "id": "sales_database:0:0",
+                "number_of_sales": "120",
+                "total_revenue": "48500",
+            }
+        ])