src/inference/plugins/llm/base.py
373 bytes · 16 lines · capsule://quake0day/[email protected]
raw on github
from abc import abstractmethod
from typing import AsyncIterator
from inference.core.types import LLMResponseChunk
from inference.plugins.base import CyberVersePlugin
class LLMPlugin(CyberVersePlugin):
    """Base interface for LLM plugins that stream their responses.

    Declares the abstract ``generate_stream`` hook and a ``supports_images``
    class flag that subclasses may override.
    """

    # Class-level flag, off by default.
    # NOTE(review): presumably tells callers whether image content may be
    # included in ``messages`` -- confirm against the code that reads it.
    supports_images = False

    @abstractmethod
    async def generate_stream(self, messages: list[dict]) -> AsyncIterator[LLMResponseChunk]:
        """Produce the response to ``messages`` as a stream of chunks.

        Args:
            messages: Conversation payload as a list of dicts.
                NOTE(review): the dict schema is not defined here -- verify
                against the concrete plugins.

        Returns:
            An async iterator of ``LLMResponseChunk`` objects, per the
            annotation.

        NOTE(review): this declaration has no ``yield``, so the base method
        itself is a plain coroutine function rather than an async generator;
        implementations are presumably async generators consumed with
        ``async for`` -- confirm before calling it through ``super()``.
        """