diff --git a/README.md b/README.md index b0f1ba089..ce36df5d7 100644 --- a/README.md +++ b/README.md @@ -56,6 +56,7 @@ The following plugins are available today: | [livekit-plugins-anthropic](https://pypi.org/project/livekit-plugins-anthropic/) | LLM | | [livekit-plugins-azure](https://pypi.org/project/livekit-plugins-azure/) | STT, TTS | | [livekit-plugins-deepgram](https://pypi.org/project/livekit-plugins-deepgram/) | STT | +| [livekit-plugins-dify](https://pypi.org/project/livekit-plugins-dify/) | LLM | | [livekit-plugins-cartesia](https://pypi.org/project/livekit-plugins-cartesia/) | TTS | | [livekit-plugins-elevenlabs](https://pypi.org/project/livekit-plugins-elevenlabs/) | TTS | | [livekit-plugins-playht](https://pypi.org/project/livekit-plugins-playht/) | TTS | diff --git a/livekit-plugins/livekit-plugins-dify/CHANGELOG.md b/livekit-plugins/livekit-plugins-dify/CHANGELOG.md new file mode 100644 index 000000000..8c42e2d52 --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/CHANGELOG.md @@ -0,0 +1,10 @@ +Changelog + +- v0.3.0 +Remove sleep to speed up the response + +- v0.2.0 +Fix bug + +- v0.1.0 +Init Project \ No newline at end of file diff --git a/livekit-plugins/livekit-plugins-dify/README.md b/livekit-plugins/livekit-plugins-dify/README.md new file mode 100644 index 000000000..e55c1c22b --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/README.md @@ -0,0 +1,21 @@ +# LiveKit Plugins Dify + +LLM inference implemention from Dify API + +Usage: +``` + agent = VoicePipelineAgent( + vad=ctx.proc.userdata["vad"], + stt=deepgram.STT(model=dg_model), + llm=dify.LLM( + base_url="Your dify API", + api_key="Your Dify App API Key", + ), + tts=openai.TTS(), + chat_ctx=initial_ctx, + ) +``` + +Notes: Do not use `initial_ctx = llm.ChatContext().append` to add system prompt or context. Implement these in your Dify. + +Only 'Chatflow' is supported. \ No newline at end of file diff --git a/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/__init__.py b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/__init__.py new file mode 100644 index 000000000..24d073513 --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/__init__.py @@ -0,0 +1,32 @@ +from livekit.agents import Plugin + +from .log import logger +from .version import __version__ +from .llm import LLM, LLMStream +from .models import ChatModels + + +__all__ = [ + "LLM", + "LLMStream", + "logger", + "__version__", +] + +class DifyPlugin(Plugin): + def __init__(self): + super().__init__(__name__, __version__, __package__, logger) + +Plugin.register_plugin(DifyPlugin()) +_module = dir() +NOT_IN_ALL = [m for m in _module if m not in __all__] + +__pdoc__ = {} + +for n in NOT_IN_ALL: + __pdoc__[n] = False + +def greet(): + return 'hi, im dify' + + diff --git a/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/llm.py b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/llm.py new file mode 100644 index 000000000..40bb67edc --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/llm.py @@ -0,0 +1,226 @@ +# Copyright 2024 Riino.Site (https://riino.site) + +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from __future__ import annotations + +import base64 +import inspect +import json +import os +from dataclasses import dataclass +from typing import Any, Awaitable, List, Tuple, get_args, get_origin +import asyncio +import httpx +from livekit import rtc +from livekit.agents import llm, utils +from .models import ( + ChatModels, +) +from .log import logger + +def build_message(msg: llm.Message) -> dict: + + return { + "role": msg.role, + "content": msg.content + } + +@dataclass +class LLMOptions: + model: str | ChatModels + user: str | None + temperature: float | None + +class LLM(llm.LLM): + def __init__( + self, + *, + model: str | ChatModels = "dify",#will not be used + api_key: str | None = None, + base_url: str | None = "https://api.dify.ai/v1", + user: str | None = None, + client: httpx.AsyncClient | None = None, + temperature: float | None = None,#will not be used + ) -> None: + """ + Create a new instance of Telnyx LLM. + + ``api_key`` must be set to your Dify App API key, either using the argument or by setting + the ``DIFY_API_KEY`` environmental variable. + """ + api_key = api_key or os.environ.get("DIFY_API_KEY") + if api_key is None: + raise ValueError("Please") + self.base_url = base_url or "https://api.dify.ai/v1" + self._opts = LLMOptions( + model=model, + user=user, + temperature=temperature + ) + + self._client = client or httpx.AsyncClient( + base_url=base_url, + headers={ + 'Authorization': f'Bearer {api_key}', + 'Content-Type': 'application/json' + }, + # timeout=httpx.Timeout(connect=15.0, read=5.0, write=5.0, pool=5.0), + follow_redirects=True, + timeout=httpx.Timeout( + connect=15.0, # Connect Timeout + read=300.0, # 5-min Read Timeout + write=30.0, # Write Timeout + pool=5.0 + ), + limits=httpx.Limits( + max_connections=50, + max_keepalive_connections=50, + keepalive_expiry=120, + ), + ) + self._conversation_id = "" + + def chat( + self, + *, + chat_ctx: llm.ChatContext, + fnc_ctx: llm.FunctionContext | None = None, + temperature: float | None = None, + n: int | None = None, + parallel_tool_calls: bool | None = None, + ) -> "LLMStream": + last_message = chat_ctx.messages[-1] if chat_ctx.messages else None + + request_data = { + "inputs": {}, + "query": last_message.content if last_message else "", + "response_mode": "streaming",#must be streaming + "conversation_id": self._conversation_id, + "user": self._opts.user or "livekit-plugin-dify", + #no temperature + } + + stream = self._client.post( + '/chat-messages', + json=request_data, + ) + + return LLMStream( + dify_stream=stream, + chat_ctx=chat_ctx, + fnc_ctx=fnc_ctx, + conversation_id_callback=self._update_conversation_id # pass callback to update conversation_id + ) + + def _update_conversation_id(self, new_id: str) -> None: + """ + Callback for conversation id update + """ + self._conversation_id = new_id + + async def close(self) -> None: + """Close Connection""" + if self._client: + await self._client.aclose() + +class LLMStream(llm.LLMStream): + def __init__( + self, + *, + dify_stream, + chat_ctx: llm.ChatContext, + fnc_ctx: llm.FunctionContext | None, + conversation_id_callback: callable, + ) -> None: + super().__init__(chat_ctx=chat_ctx, fnc_ctx=fnc_ctx) + self._awaitable_dify_stream = dify_stream + self._dify_stream = None + self._conversation_id_callback = conversation_id_callback + self._conversation_id_updated = False + self._current_count = 0 + self._skip_interval = 1 + + async def aclose(self) -> None: + if self._dify_stream: + await self._dify_stream.close() + return await super().aclose() + + async def __anext__(self): + if not self._dify_stream: + # print("Initializing stream...") + self._dify_stream = await self._awaitable_dify_stream + # print("Stream initialized.") + + async for chunk in self._dify_stream.aiter_lines(): + + if not chunk.strip(): + # await asyncio.sleep(0.1) #remove this sleep after testing. + continue + + # print(f"Received chunk: {chunk.strip()}") + + self._current_count += 1 + # print(f"Current count: {self._current_count}, Skip interval: {self._skip_interval}") + + if self._current_count < self._skip_interval: + # print("Skipping this chunk.") + continue + else: + # print("Processing this chunk.") + self._current_count = 0 + + event_data = chunk[len("data: "):].strip() + try: + message = json.loads(event_data) + # print(f"Parsed message: {message}") + except json.JSONDecodeError: + # print("Failed to parse JSON, skipping this chunk.") + logger.warning( + "Failed to parse JSON, skipping this chunk." + ) + continue + + if 'answer' in message: + chat_chunk = self._parse_message(message) + if chat_chunk is not None: + self._skip_interval += 1 + return chat_chunk + else: + pass + # print("No 'answer' key found in message, skipping.") + + # print("No more chunks to process, stopping iteration.") + raise StopAsyncIteration + + + + def _parse_message(self, message: dict) -> llm.ChatChunk | None: + if not self._conversation_id_updated and "conversation_id" in message: + self._conversation_id_callback(message["conversation_id"]) + self._conversation_id_updated = True + + if message.get("event") == "message": + return llm.ChatChunk( + choices=[ + llm.Choice( + delta=llm.ChoiceDelta( + content=message["answer"], + role="assistant" + ), + index=0 + ) + ] + ) + else: + return None \ No newline at end of file diff --git a/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/log.py b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/log.py new file mode 100644 index 000000000..209033185 --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/log.py @@ -0,0 +1,3 @@ +import logging + +logger = logging.getLogger("livekit.plugins.dify") diff --git a/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/models.py b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/models.py new file mode 100644 index 000000000..2db18f53a --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/models.py @@ -0,0 +1,5 @@ +from typing import Literal + +ChatModels = Literal[ + "dify", +] diff --git a/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/version.py b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/version.py new file mode 100644 index 000000000..7078e1a58 --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/livekit/plugins/dify/version.py @@ -0,0 +1,15 @@ +# Copyright 2024 Riino.Site (https://riino.site) + +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +__version__ = "0.3.0" diff --git a/livekit-plugins/livekit-plugins-dify/package.json b/livekit-plugins/livekit-plugins-dify/package.json new file mode 100644 index 000000000..97477084a --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/package.json @@ -0,0 +1,8 @@ +{ + "name": "livekit-plugins-dify", + "private": true, + "version": "0.2.0", + "dependencies": { + "livekit-plugins-dify": "file:" + } +} diff --git a/livekit-plugins/livekit-plugins-dify/pyproject.toml b/livekit-plugins/livekit-plugins-dify/pyproject.toml new file mode 100644 index 000000000..8cf32563a --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/pyproject.toml @@ -0,0 +1,3 @@ +[build-system] +requires = ["setuptools>=61.0"] +build-backend = "setuptools.build_meta" \ No newline at end of file diff --git a/livekit-plugins/livekit-plugins-dify/setup.py b/livekit-plugins/livekit-plugins-dify/setup.py new file mode 100644 index 000000000..647564aed --- /dev/null +++ b/livekit-plugins/livekit-plugins-dify/setup.py @@ -0,0 +1,59 @@ +# Copyright 2024 Riino.Site +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import os +import pathlib + +import setuptools +import setuptools.command.build_py + +here = pathlib.Path(__file__).parent.resolve() +about = {} +with open(os.path.join(here, "livekit", "plugins", "dify", "version.py"), "r") as f: + exec(f.read(), about) + + +setuptools.setup( + name="livekit-plugins-dify", + author = 'sorphwer@riino.site', + author_email='sorphwer@gmail.com', + version=about["__version__"], + description="Dify plugin for LiveKit Agents", + long_description=(here / "README.md").read_text(encoding="utf-8"), + long_description_content_type="text/markdown", + url="https://github.com/livekit/agents", + cmdclass={}, + classifiers=[ + "Intended Audience :: Developers", + "License :: OSI Approved :: Apache Software License", + "Topic :: Multimedia :: Sound/Audio", + "Topic :: Multimedia :: Video", + "Topic :: Scientific/Engineering :: Artificial Intelligence", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3 :: Only", + ], + keywords=["webrtc", "realtime", "audio", "video", "livekit","dify"], + license="Apache-2.0", + packages=setuptools.find_namespace_packages(include=["livekit.*"]), + python_requires=">=3.9.0", + install_requires=["livekit-agents>=0.8.0.dev0"], + package_data={"livekit.plugins.dify": ["py.typed"]}, + project_urls={ + "Documentation": "https://docs.livekit.io", + "Website": "https://livekit.io/", + "Source": "https://github.com/livekit/agents", + }, +)