improve tests

Josephrp · Josephrp · commit ada155a4a307 · 2024-07-19T17:54:24.000+02:00
diff --git a/docs/api/llm/01ai.md b/docs/api/llm/01ai.md
@@ -1,3 +1,3 @@
 # 01ai API
 
-::: distilabel.llms.oneai
+::: distilabel.llms.oneai
diff --git a/docs/sections/how_to_guides/basic/llm/index.md b/docs/sections/how_to_guides/basic/llm/index.md
@@ -142,4 +142,4 @@ To create custom LLMs, subclass either [`LLM`][distilabel.llms.LLM] for synchron
 
 ## Available LLMs
 
-[Our LLM gallery](/distilabel/components-gallery/llms/) shows a list of the available LLMs that can be used within the `distilabel` library.
+[Our LLM gallery](/distilabel/components-gallery/llms/) shows a list of the available LLMs that can be used within the `distilabel` library.
diff --git a/tests/unit/llms/test_01ai.py b/tests/unit/llms/test_01ai.py
@@ -1,171 +1,163 @@
-from distilabel.llms.oneai import OneAI
-from typing import Any, Dict
-from unittest import mock
-from unittest.mock import AsyncMock, MagicMock, Mock, patch
-
-import nest_asyncio
-import pytest
-from .utils import DummyUserDetail
-
-
-@patch("openai.AsyncOpenAI")
-class TestOneAI:
-    model_id: str = "gpt-4"
-
-    def test_oneai_llm(self, _: MagicMock) -> None:
-        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore
-
-        assert isinstance(llm, OneAI)
-        assert llm.model_name == self.model_id
-
-    def test_oneai_llm_env_vars(self, _: MagicMock) -> None:
-        with mock.patch.dict(os.environ, clear=True):
-            os.environ["01AI_API_KEY"] = "another.api.key"
-            os.environ["01AI_BASE_URL"] = "https://example.com"
-
-            llm = OneAI(model=self.model_id)
-
-            assert isinstance(llm, OneAI)
-            assert llm.model_name == self.model_id
-            assert llm.base_url == "https://example.com"
-            assert llm.api_key.get_secret_value() == "another.api.key"  # type: ignore
-
-    @pytest.mark.asyncio
-    async def test_agenerate(self, mock_openai: MagicMock) -> None:
-        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore
-        llm._aclient = mock_openai
-
-        mocked_completion = Mock(
-            choices=[Mock(message=Mock(content=" Aenean hendrerit aliquam velit. ..."))]
-        )
-        llm._aclient.chat.completions.create = AsyncMock(return_value=mocked_completion)
-
-        await llm.agenerate(
-            input=[
-                {"role": "system", "content": ""},
-                {
-                    "role": "user",
-                    "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",
-                },
-            ]
-        )
-
-    @pytest.mark.asyncio
-    async def test_agenerate_structured(self, mock_openai: MagicMock) -> None:
-        llm = OneAI(
-            model=self.model_id,
-            api_key="api.key",
-            structured_output={
-                "schema": DummyUserDetail,
-                "mode": "tool_call",
-                "max_retries": 1,
-            },
-        )  # type: ignore
-        llm._aclient = mock_openai
-
-        sample_user = DummyUserDetail(name="John Doe", age=30)
-
-        llm._aclient.chat.completions.create = AsyncMock(return_value=sample_user)
-
-        generation = await llm.agenerate(
-            input=[
-                {"role": "system", "content": ""},
-                {
-                    "role": "user",
-                    "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",
-                },
-            ]
-        )
-        assert generation[0] == sample_user.model_dump_json()
-
-    @pytest.mark.skipif(
-        sys.version_info < (3, 9), reason="`mistralai` requires Python 3.9 or higher"
-    )
-    @pytest.mark.asyncio
-    async def test_generate(self, mock_openai: MagicMock) -> None:
-        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore
-        llm._aclient = mock_openai
-
-        mocked_completion = Mock(
-            choices=[Mock(message=Mock(content=" Aenean hendrerit aliquam velit. ..."))]
-        )
-        llm._aclient.chat.completions.create = AsyncMock(return_value=mocked_completion)
-
-        nest_asyncio.apply()
-
-        llm.generate(
-            inputs=[
-                [
-                    {"role": "system", "content": ""},
-                    {
-                        "role": "user",
-                        "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",
-                    },
-                ]
-            ]
-        )
-
-        with pytest.raises(ValueError):
-            llm.generate(
-                inputs=[
-                    [
-                        {"role": "system", "content": ""},
-                        {
-                            "role": "user",
-                            "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",
-                        },
-                    ]
-                ],
-                response_format="unkown_format",
-            )
-
-    @pytest.mark.parametrize(
-        "structured_output, dump",
-        [
-            (
-                None,
-                {
-                    "model": "gpt-4",
-                    "generation_kwargs": {},
-                    "max_retries": 6,
-                    "base_url": "https://api.openai.com/v1",
-                    "timeout": 120,
-                    "structured_output": None,
-                    "type_info": {
-                        "module": "distilabel.llms.oneai",
-                        "name": "OneAI",
-                    },
-                },
-            ),
-            (
-                {
-                    "schema": DummyUserDetail.model_json_schema(),
-                    "mode": "tool_call",
-                    "max_retries": 1,
-                },
-                {
-                    "model": "gpt-4",
-                    "generation_kwargs": {},
-                    "max_retries": 6,
-                    "base_url": "https://api.openai.com/v1",
-                    "timeout": 120,
-                    "structured_output": {
-                        "schema": DummyUserDetail.model_json_schema(),
-                        "mode": "tool_call",
-                        "max_retries": 1,
-                    },
-                    "type_info": {
-                        "module": "distilabel.llms.oneai",
-                        "name": "OneAI",
-                    },
-                },
-            ),
-        ],
-    )
-    def test_serialization(
-        self, _: MagicMock, structured_output: Dict[str, Any], dump: Dict[str, Any]
-    ) -> None:
-        llm = OneAI(model=self.model_id, structured_output=structured_output)
-
-        assert llm.dump() == dump
-        assert isinstance(OneAI.from_dict(dump), OneAI)
+# tests/test_oneai.py  
+  
+import os  
+import sys  
+from typing import Any, Dict  
+from unittest import mock  
+from unittest.mock import AsyncMock, MagicMock, Mock, patch  
+  
+import nest_asyncio  
+import pytest  
+  
+from distilabel.llms.oneai import OneAI  
+from .utils import DummyUserDetail  
+  
+  
+@patch("openai.AsyncOpenAI")  
+class TestOneAI:  
+    model_id: str = "yi-large"  
+  
+    def test_oneai_llm(self, _: MagicMock) -> None:  
+        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore  
+        assert isinstance(llm, OneAI)  
+        assert llm.model_name == self.model_id  
+  
+    def test_oneai_llm_env_vars(self, _: MagicMock) -> None:  
+        with mock.patch.dict(os.environ, clear=True):  
+            os.environ["01AI_API_KEY"] = "another.api.key"  
+            os.environ["01AI_BASE_URL"] = "https://api.01.ai/v1/chat/completions"  
+            llm = OneAI(model=self.model_id)  
+            assert isinstance(llm, OneAI)  
+            assert llm.model_name == self.model_id  
+            assert llm.base_url == "https://api.01.ai/v1/chat/completions"  
+            assert llm.api_key.get_secret_value() == "another.api.key"  # type: ignore  
+  
+    @pytest.mark.asyncio  
+    async def test_agenerate(self, mock_openai: MagicMock) -> None:  
+        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore  
+        llm._aclient = mock_openai  
+        mocked_completion = Mock(  
+            choices=[Mock(message=Mock(content=" Aenean hendrerit aliquam velit. ..."))]  
+        )  
+        llm._aclient.chat.completions.create = AsyncMock(return_value=mocked_completion)  
+        await llm.agenerate(  
+            input=[  
+                {"role": "system", "content": ""},  
+                {  
+                    "role": "user",  
+                    "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",  
+                },  
+            ]  
+        )  
+  
+    @pytest.mark.asyncio  
+    async def test_agenerate_structured(self, mock_openai: MagicMock) -> None:  
+        llm = OneAI(  
+            model=self.model_id,  
+            api_key="api.key",  
+            structured_output={  
+                "schema": DummyUserDetail,  
+                "mode": "tool_call",  
+                "max_retries": 1,  
+            },  
+        )  # type: ignore  
+        llm._aclient = mock_openai  
+        sample_user = DummyUserDetail(name="John Doe", age=30)  
+        llm._aclient.chat.completions.create = AsyncMock(return_value=sample_user)  
+        generation = await llm.agenerate(  
+            input=[  
+                {"role": "system", "content": ""},  
+                {  
+                    "role": "user",  
+                    "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",  
+                },  
+            ]  
+        )  
+        assert generation[0] == sample_user.model_dump_json()  
+  
+    @pytest.mark.skipif(  
+        sys.version_info < (3, 9), reason="`01ai` requires Python 3.9 or higher"  
+    )  
+    @pytest.mark.asyncio  
+    async def test_generate(self, mock_openai: MagicMock) -> None:  
+        llm = OneAI(model=self.model_id, api_key="api.key")  # type: ignore  
+        llm._aclient = mock_openai  
+        mocked_completion = Mock(  
+            choices=[Mock(message=Mock(content=" Aenean hendrerit aliquam velit. ..."))]  
+        )  
+        llm._aclient.chat.completions.create = AsyncMock(return_value=mocked_completion)  
+        nest_asyncio.apply()  
+        llm.generate(  
+            inputs=[  
+                [  
+                    {"role": "system", "content": ""},  
+                    {  
+                        "role": "user",  
+                        "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",  
+                    },  
+                ]  
+            ]  
+        )  
+        with pytest.raises(ValueError):  
+            llm.generate(  
+                inputs=[  
+                    [  
+                        {"role": "system", "content": ""},  
+                        {  
+                            "role": "user",  
+                            "content": "Lorem ipsum dolor sit amet, consectetur adipiscing elit.",  
+                        },  
+                    ]  
+                ],  
+                response_format="unknown_format",  
+            )  
+  
+    @pytest.mark.parametrize(  
+        "structured_output, dump",  
+        [  
+            (  
+                None,  
+                {  
+                    "model": "yi-large",  
+                    "generation_kwargs": {},  
+                    "max_retries": 6,  
+                    "base_url": "https://api.01.ai/v1/chat/completions",  
+                    "timeout": 120,  
+                    "structured_output": None,  
+                    "type_info": {  
+                        "module": "distilabel.llms.oneai",  
+                        "name": "OneAI",  
+                    },  
+                },  
+            ),  
+            (  
+                {  
+                    "schema": DummyUserDetail.model_json_schema(),  
+                    "mode": "tool_call",  
+                    "max_retries": 1,  
+                },  
+                {  
+                    "model": "gpt-4",  
+                    "generation_kwargs": {},  
+                    "max_retries": 6,  
+                    "base_url": "https://api.01.ai/v1/chat/completions",  
+                    "timeout": 120,  
+                    "structured_output": {  
+                        "schema": DummyUserDetail.model_json_schema(),  
+                        "mode": "tool_call",  
+                        "max_retries": 1,  
+                    },  
+                    "type_info": {  
+                        "module": "distilabel.llms.oneai",  
+                        "name": "OneAI",  
+                    },  
+                },  
+            ),  
+        ],  
+    )  
+    def test_serialization(  
+        self, _: MagicMock, structured_output: Dict[str, Any], dump: Dict[str, Any]  
+    ) -> None:  
+        llm = OneAI(model=self.model_id, structured_output=structured_output)  
+        assert llm.dump() == dump  
+        assert isinstance(OneAI.from_dict(dump), OneAI)  

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,3 @@`
`1`	`1`	`# 01ai API`
`2`	`2`
`3`		`-::: distilabel.llms.oneai`
	`3`	`+::: distilabel.llms.oneai`
Original file line number	Diff line number	Diff line change
@@ -142,4 +142,4 @@ To create custom LLMs, subclass either [`LLM`][distilabel.llms.LLM] for synchron
`142`	`142`
`143`	`143`	`## Available LLMs`
`144`	`144`
`145`		-[Our LLM gallery](/distilabel/components-gallery/llms/) shows a list of the available LLMs that can be used within the `distilabel` library.
	`145`	+[Our LLM gallery](/distilabel/components-gallery/llms/) shows a list of the available LLMs that can be used within the `distilabel` library.