Source code for intelligence_layer.examples.qa.long_context_qa

from pydantic import BaseModel

from intelligence_layer.connectors.retrievers.base_retriever import Document
from intelligence_layer.connectors.retrievers.qdrant_in_memory_retriever import (
    QdrantInMemoryRetriever,
)
from intelligence_layer.core import (
    Chunk,
    ChunkInput,
    ChunkOutput,
    ControlModel,
    Language,
    LuminousControlModel,
    Task,
    TaskSpan,
    TextChunk,
)
from intelligence_layer.examples.qa.multiple_chunk_qa import (
    MultipleChunkQa,
    MultipleChunkQaInput,
    MultipleChunkQaOutput,
)
from intelligence_layer.examples.search.search import Search, SearchInput


[docs] class LongContextQaInput(BaseModel): """The input for a `LongContextQa` task. Attributes: text: Text of arbitrary length on the basis of which the question is to be answered. question: The question for the text. language: The desired language of the answer. ISO 619 str with language e.g. en, fr, etc. """ text: str question: str language: Language = Language("en")
[docs] class LongContextQa(Task[LongContextQaInput, MultipleChunkQaOutput]): """Answer a question on the basis of a (lengthy) document. Best for answering a question on the basis of a long document, where the length of text exceeds the context length of a model (e.g. 2048 tokens for the luminous models). Note: - Creates instance of `InMemoryRetriever` on the fly. - `model` provided should be a control-type model. Args: multi_chunk_qa: task used to produce answers for each relevant chunk generated by the chunk-task for the given input. Defaults to :class:`MultipleChunkQa` . chunk: task used to chunk the input. Defaults to :class:`Chunk` . k: The number of top relevant chunks to retrieve. model: The model used in the task. Example: >>> from intelligence_layer.core import InMemoryTracer, LuminousControlModel >>> from intelligence_layer.examples import LongContextQa, LongContextQaInput >>> model = LuminousControlModel("luminous-base-control") >>> task = LongContextQa(model=model) >>> input = LongContextQaInput(text="Lengthy text goes here...", ... question="Where does the text go?") >>> tracer = InMemoryTracer() >>> output = task.run(input, tracer) """ def __init__( self, multi_chunk_qa: Task[MultipleChunkQaInput, MultipleChunkQaOutput] | None = None, chunk: Task[ChunkInput, ChunkOutput] | None = None, k: int = 4, model: ControlModel | None = None, ): super().__init__() self._model = model or LuminousControlModel("luminous-supreme-control") self._chunk_task = chunk or Chunk(self._model, 1024) self._multi_chunk_qa = multi_chunk_qa or MultipleChunkQa( merge_answers_model=self._model ) self._k = k
[docs] def do_run( self, input: LongContextQaInput, task_span: TaskSpan ) -> MultipleChunkQaOutput: chunk_output = self._chunk_task.run(ChunkInput(text=input.text), task_span) retriever = QdrantInMemoryRetriever( client=self._model._client, documents=[ Document( text=c, ) for c in chunk_output.chunks ], k=self._k, threshold=0.5, ) search_output = Search(retriever).run( SearchInput(query=input.question), task_span ) multi_chunk_qa_input = MultipleChunkQaInput( chunks=[ TextChunk(result.document_chunk.text) for result in search_output.results ], question=input.question, language=input.language, ) qa_output = self._multi_chunk_qa.run(multi_chunk_qa_input, task_span) return qa_output