logdetective 0.4.0__py3-none-any.whl → 2.11.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39)
  1. logdetective/constants.py +33 -12
  2. logdetective/extractors.py +137 -68
  3. logdetective/logdetective.py +102 -33
  4. logdetective/models.py +99 -0
  5. logdetective/prompts-summary-first.yml +20 -0
  6. logdetective/prompts-summary-only.yml +13 -0
  7. logdetective/prompts.yml +90 -0
  8. logdetective/remote_log.py +67 -0
  9. logdetective/server/compressors.py +186 -0
  10. logdetective/server/config.py +78 -0
  11. logdetective/server/database/base.py +34 -26
  12. logdetective/server/database/models/__init__.py +33 -0
  13. logdetective/server/database/models/exceptions.py +17 -0
  14. logdetective/server/database/models/koji.py +143 -0
  15. logdetective/server/database/models/merge_request_jobs.py +623 -0
  16. logdetective/server/database/models/metrics.py +427 -0
  17. logdetective/server/emoji.py +148 -0
  18. logdetective/server/exceptions.py +37 -0
  19. logdetective/server/gitlab.py +451 -0
  20. logdetective/server/koji.py +159 -0
  21. logdetective/server/llm.py +309 -0
  22. logdetective/server/metric.py +75 -30
  23. logdetective/server/models.py +426 -23
  24. logdetective/server/plot.py +432 -0
  25. logdetective/server/server.py +580 -468
  26. logdetective/server/templates/base_response.html.j2 +59 -0
  27. logdetective/server/templates/gitlab_full_comment.md.j2 +73 -0
  28. logdetective/server/templates/gitlab_short_comment.md.j2 +62 -0
  29. logdetective/server/utils.py +98 -32
  30. logdetective/skip_snippets.yml +12 -0
  31. logdetective/utils.py +187 -73
  32. logdetective-2.11.0.dist-info/METADATA +568 -0
  33. logdetective-2.11.0.dist-info/RECORD +40 -0
  34. {logdetective-0.4.0.dist-info → logdetective-2.11.0.dist-info}/WHEEL +1 -1
  35. logdetective/server/database/models.py +0 -88
  36. logdetective-0.4.0.dist-info/METADATA +0 -333
  37. logdetective-0.4.0.dist-info/RECORD +0 -19
  38. {logdetective-0.4.0.dist-info → logdetective-2.11.0.dist-info}/entry_points.txt +0 -0
  39. {logdetective-0.4.0.dist-info → logdetective-2.11.0.dist-info/licenses}/LICENSE +0 -0
--- /dev/null
+++ b/logdetective/server/llm.py
@@ -0,0 +1,309 @@
+import os
+import asyncio
+import random
+import time
+from typing import List, Tuple, Dict
+
+import backoff
+from fastapi import HTTPException
+from pydantic import ValidationError
+
+import aiohttp
+from openai import AsyncStream
+from openai.types.chat import ChatCompletionChunk
+
+from logdetective.utils import (
+    compute_certainty,
+    prompt_to_messages,
+    format_snippets,
+    mine_logs,
+)
+from logdetective.server.config import (
+    LOG,
+    SERVER_CONFIG,
+    PROMPT_CONFIG,
+    CLIENT,
+)
+from logdetective.server.models import (
+    AnalyzedSnippet,
+    InferenceConfig,
+    Explanation,
+    StagedResponse,
+    SnippetAnalysis,
+    RatedSnippetAnalysis,
+    Response,
+)
+from logdetective.server.utils import (
+    format_analyzed_snippets,
+    should_we_giveup,
+    we_give_up,
+    filter_snippets,
+    construct_final_prompt,
+)
+
+
+LLM_CPP_SERVER_TIMEOUT = os.environ.get("LLAMA_CPP_SERVER_TIMEOUT", 600)
+
+
+@backoff.on_exception(
+    lambda: backoff.constant([10, 30, 120]),
+    aiohttp.ClientResponseError,
+    max_tries=4,  # 4 tries and 3 retries
+    jitter=lambda wait_gen_value: random.uniform(wait_gen_value, wait_gen_value + 30),
+    giveup=should_we_giveup,
+    raise_on_giveup=False,
+    on_giveup=we_give_up,
+)
+async def call_llm(
+    messages: List[Dict[str, str]],
+    inference_cfg: InferenceConfig,
+    stream: bool = False,
+    structured_output: dict | None = None,
+) -> Explanation:
+    """Submit prompt to LLM.
+    inference_cfg: The configuration section from the config.json representing
+    the relevant inference server for this request.
+    """
+    LOG.info("Analyzing the text")
+
+    LOG.info("Submitting to /v1/chat/completions endpoint")
+
+    kwargs = {}
+
+    # OpenAI API does not guarantee that the behavior for parameter set to `None`
+    # and parameter not given at all is the same.
+    # We build a dictionary of parameters based on the configuration.
+    if inference_cfg.log_probs:
+        LOG.info("Requesting log probabilities from LLM")
+        kwargs["logprobs"] = inference_cfg.log_probs
+    if structured_output:
+        LOG.info("Requesting structured output from LLM")
+        response_format = {
+            "type": "json_schema",
+            "json_schema": {
+                "name": "rated-snippet-analysis",
+                "schema": structured_output,
+            },
+        }
+        kwargs["response_format"] = response_format
+
+    async with inference_cfg.get_limiter():
+        response = await CLIENT.chat.completions.create(
+            messages=messages,
+            max_tokens=inference_cfg.max_tokens,
+            stream=stream,
+            model=inference_cfg.model,
+            temperature=inference_cfg.temperature,
+            **kwargs,
+        )
+
+    if not response.choices[0].message.content:
+        LOG.error("No response content received from %s", inference_cfg.url)
+        raise RuntimeError()
+
+    message_content = response.choices[0].message.content
+
+    if response.choices[0].logprobs and response.choices[0].logprobs.content:
+        logprobs = [e.to_dict() for e in response.choices[0].logprobs.content]
+    else:
+        logprobs = None
+
+    return Explanation(
+        text=message_content,
+        logprobs=logprobs,
+    )
+
+
+@backoff.on_exception(
+    lambda: backoff.constant([10, 30, 120]),
+    aiohttp.ClientResponseError,
+    max_tries=4,  # 4 tries and 3 retries
+    jitter=lambda wait_gen_value: random.uniform(wait_gen_value, wait_gen_value + 30),
+    giveup=should_we_giveup,
+    raise_on_giveup=False,
+    on_giveup=we_give_up,
+)
+async def call_llm_stream(
+    messages: List[Dict[str, str]],
+    inference_cfg: InferenceConfig,
+    stream: bool = False,
+) -> AsyncStream[ChatCompletionChunk]:
+    """Submit prompt to LLM and receive stream of tokens as a result.
+    inference_cfg: The configuration section from the config.json representing
+    the relevant inference server for this request.
+    """
+    LOG.info("Analyzing the text")
+
+    LOG.info("Submitting to /v1/chat/completions endpoint")
+
+    async with inference_cfg.get_limiter():
+        response = await CLIENT.chat.completions.create(
+            messages=messages,
+            max_tokens=inference_cfg.max_tokens,
+            logprobs=inference_cfg.log_probs,
+            stream=stream,
+            model=inference_cfg.model,
+            temperature=inference_cfg.temperature,
+        )
+
+    return response
+
+
+async def analyze_snippets(
+    log_summary: List[Tuple[int, str]], structured_output: dict | None = None
+) -> List[SnippetAnalysis | RatedSnippetAnalysis]:
+    """Submit log file snippets to the LLM and gather results"""
+    # Process snippets asynchronously
+    awaitables = [
+        call_llm(
+            prompt_to_messages(
+                PROMPT_CONFIG.snippet_prompt_template.format(s),
+                PROMPT_CONFIG.snippet_system_prompt,
+                SERVER_CONFIG.inference.system_role,
+                SERVER_CONFIG.inference.user_role,
+            ),
+            inference_cfg=SERVER_CONFIG.snippet_inference,
+            structured_output=structured_output,
+        )
+        for s in log_summary
+    ]
+    gathered_responses = await asyncio.gather(*awaitables)
+    analyzed_snippets = []
+
+    for response in gathered_responses:
+        if structured_output:
+            try:
+                snippet = RatedSnippetAnalysis.model_validate_json(response.text)
+            except ValidationError as ex:
+                LOG.error("Invalid data structure returned `%s`", response.text)
+                raise ex
+        else:
+            snippet = SnippetAnalysis(text=response.text)
+        analyzed_snippets.append(snippet)
+
+    return analyzed_snippets
+
+
+async def perfrom_analysis(log_text: str) -> Response:
+    """Submit log file snippets in aggregate to LLM and retrieve results"""
+    log_summary = mine_logs(log_text, SERVER_CONFIG.extractor.get_extractors())
+    log_summary = format_snippets(log_summary)
+
+    final_prompt = construct_final_prompt(log_summary, PROMPT_CONFIG.prompt_template)
+
+    messages = prompt_to_messages(
+        final_prompt,
+        PROMPT_CONFIG.default_system_prompt,
+        SERVER_CONFIG.inference.system_role,
+        SERVER_CONFIG.inference.user_role,
+    )
+    response = await call_llm(
+        messages,
+        inference_cfg=SERVER_CONFIG.inference,
+    )
+    certainty = 0
+
+    if response.logprobs is not None:
+        try:
+            certainty = compute_certainty(response.logprobs)
+        except ValueError as ex:
+            LOG.error("Error encountered while computing certainty: %s", ex)
+            raise HTTPException(
+                status_code=400,
+                detail=f"Couldn't compute certainty with data:\n{response.logprobs}",
+            ) from ex
+
+    return Response(explanation=response, response_certainty=certainty)
+
+
+async def perform_analyis_stream(log_text: str) -> AsyncStream:
+    """Submit log file snippets in aggregate and return a stream of tokens"""
+    log_summary = mine_logs(log_text, SERVER_CONFIG.extractor.get_extractors())
+    log_summary = format_snippets(log_summary)
+
+    final_prompt = construct_final_prompt(log_summary, PROMPT_CONFIG.prompt_template)
+
+    messages = prompt_to_messages(
+        final_prompt,
+        PROMPT_CONFIG.default_system_prompt,
+        SERVER_CONFIG.inference.system_role,
+        SERVER_CONFIG.inference.user_role,
+    )
+
+    stream = call_llm_stream(
+        messages,
+        inference_cfg=SERVER_CONFIG.inference,
+    )
+
+    # we need to figure out a better response here, this is how it looks rn:
+    # b'data: {"choices":[{"finish_reason":"stop","index":0,"delta":{}}],
+    # "created":1744818071,"id":"chatcmpl-c9geTxNcQO7M9wR...
+    return stream
+
+
+async def perform_staged_analysis(log_text: str) -> StagedResponse:
+    """Submit the log file snippets to the LLM and retrieve their results"""
+    log_summary = mine_logs(log_text, SERVER_CONFIG.extractor.get_extractors())
+    start = time.time()
+    if SERVER_CONFIG.general.top_k_snippets:
+        rated_snippets = await analyze_snippets(
+            log_summary=log_summary,
+            structured_output=RatedSnippetAnalysis.model_json_schema(),
+        )
+
+        # Extract original text and line number from `log_summary`
+        processed_snippets = [
+            AnalyzedSnippet(line_number=e[0][0], text=e[0][1], explanation=e[1])
+            for e in zip(log_summary, rated_snippets)
+        ]
+        processed_snippets = filter_snippets(
+            processed_snippets=processed_snippets,
+            top_k=SERVER_CONFIG.general.top_k_snippets,
+        )
+        LOG.info(
+            "Keeping %d of original %d snippets",
+            len(processed_snippets),
+            len(rated_snippets),
+        )
+    else:
+        processed_snippets = await analyze_snippets(log_summary=log_summary)

+        # Extract original text and line number from `log_summary`
+        processed_snippets = [
+            AnalyzedSnippet(line_number=e[0][0], text=e[0][1], explanation=e[1])
+            for e in zip(log_summary, processed_snippets)
+        ]
+    delta = time.time() - start
+    LOG.info("Snippet analysis performed in %f s", delta)
+    log_summary = format_analyzed_snippets(processed_snippets)
+    final_prompt = construct_final_prompt(log_summary, PROMPT_CONFIG.prompt_template_staged)
+
+    messages = prompt_to_messages(
+        final_prompt,
+        PROMPT_CONFIG.staged_system_prompt,
+        SERVER_CONFIG.inference.system_role,
+        SERVER_CONFIG.inference.user_role,
+    )
+    final_analysis = await call_llm(
+        messages,
+        inference_cfg=SERVER_CONFIG.inference,
+    )
+
+    certainty = 0
+
+    if final_analysis.logprobs:
+        try:
+            certainty = compute_certainty(final_analysis.logprobs)
+        except ValueError as ex:
+            LOG.error("Error encountered while computing certainty: %s", ex)
+            raise HTTPException(
+                status_code=400,
+                detail=f"Couldn't compute certainty with data:\n"
+                f"{final_analysis.logprobs}",
+            ) from ex
+
+    return StagedResponse(
+        explanation=final_analysis,
+        snippets=processed_snippets,
+        response_certainty=certainty,
+    )
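
Note on the retry policy above: both call_llm and call_llm_stream retry failed chat-completion requests on aiohttp.ClientResponseError with waits of roughly 10 s, 30 s and 120 s plus up to 30 s of random jitter, for at most four attempts, and hand control to we_give_up instead of re-raising once they give up. The following is a minimal, self-contained sketch of the same backoff pattern; the give-up predicate here is a hypothetical stand-in, not the package's should_we_giveup implementation.

import random

import aiohttp
import backoff


def giveup_on_client_error(exc: aiohttp.ClientResponseError) -> bool:
    # Hypothetical stand-in for logdetective.server.utils.should_we_giveup:
    # stop retrying on 4xx responses other than 429, keep retrying otherwise.
    return 400 <= exc.status < 500 and exc.status != 429


@backoff.on_exception(
    lambda: backoff.constant([10, 30, 120]),  # waits before retries 1, 2 and 3
    aiohttp.ClientResponseError,
    max_tries=4,  # one initial attempt plus three retries
    jitter=lambda wait: random.uniform(wait, wait + 30),  # add up to 30 s on top
    giveup=giveup_on_client_error,
    raise_on_giveup=False,  # on give-up the call returns None instead of raising
)
async def flaky_inference_call() -> str:
    # Placeholder for CLIENT.chat.completions.create(...); always fails here,
    # so awaiting it exercises the full 10/30/120 s retry schedule.
    raise aiohttp.ClientResponseError(request_info=None, history=(), status=503)

backoff.constant accepts an iterable, so the lambda produces a fresh generator of the three waits for every decorated call; once the waits are exhausted or max_tries is reached, the on_giveup hook (we_give_up in the real module) runs.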
--- a/logdetective/server/metric.py
+++ b/logdetective/server/metric.py
@@ -1,35 +1,54 @@
-import datetime
 import inspect
-from typing import Union
+import datetime
+
+from typing import Optional, Union
 from functools import wraps
 
+import aiohttp
+
 from starlette.responses import StreamingResponse
-from logdetective.server.database.models import EndpointType, AnalyzeRequestMetrics
 from logdetective.server import models
+from logdetective.remote_log import RemoteLog
+from logdetective.server.config import LOG
+from logdetective.server.compressors import LLMResponseCompressor, RemoteLogCompressor
+from logdetective.server.database.models import EndpointType, AnalyzeRequestMetrics
+from logdetective.server.exceptions import LogDetectiveMetricsError
 
 
-def add_new_metrics(
-    api_name: str, build_log: models.BuildLog, received_at: datetime.datetime = None
+async def add_new_metrics(
+    api_name: EndpointType,
+    url: Optional[str] = None,
+    http_session: Optional[aiohttp.ClientSession] = None,
+    received_at: Optional[datetime.datetime] = None,
+    compressed_log_content: Optional[bytes] = None,
 ) -> int:
     """Add a new database entry for a received request.
 
     This will store the time when this function is called,
     the endpoint from where the request was received,
-    and the log for which analysis is requested.
+    and the log (in a zip format) for which analysis is requested.
     """
-    return AnalyzeRequestMetrics.create(
+    if not compressed_log_content:
+        if not (url and http_session):
+            raise LogDetectiveMetricsError(
+                f"""Remote log can not be retrieved without URL and http session.
+                URL: {url}, http session:{http_session}""")
+        remote_log = RemoteLog(url, http_session)
+        compressed_log_content = await RemoteLogCompressor(remote_log).zip_content()
+
+    return await AnalyzeRequestMetrics.create(
         endpoint=EndpointType(api_name),
-        log_url=build_log.url,
+        compressed_log=compressed_log_content,
         request_received_at=received_at
         if received_at
         else datetime.datetime.now(datetime.timezone.utc),
     )
 
 
-def update_metrics(
+async def update_metrics(
     metrics_id: int,
     response: Union[models.Response, models.StagedResponse, StreamingResponse],
-    sent_at: datetime.datetime = None,
+    sent_at: Optional[datetime.datetime] = None,
 ) -> None:
     """Update a database metric entry for a received request,
     filling data for the given response.
@@ -37,46 +56,72 @@ def update_metrics(
     This will add to the database entry the time when the response was sent,
     the length of the created response and the certainty for it.
     """
+    try:
+        compressed_response = LLMResponseCompressor(response).zip_response()
+    except AttributeError as e:
+        compressed_response = None
+        LOG.warning(
+            "Given response can not be serialized "
+            "and saved in db (probably a StreamingResponse): %s.",
+            e,
+        )
+
     response_sent_at = (
         sent_at if sent_at else datetime.datetime.now(datetime.timezone.utc)
     )
     response_length = None
-    if hasattr(response, "explanation") and "choices" in response.explanation:
-        response_length = sum(
-            len(choice["text"])
-            for choice in response.explanation["choices"]
-            if "text" in choice
-        )
+    if hasattr(response, "explanation") and isinstance(
+        response.explanation, models.Explanation
+    ):
+        response_length = len(response.explanation.text)
     response_certainty = (
         response.response_certainty if hasattr(response, "response_certainty") else None
     )
-    AnalyzeRequestMetrics.update(
-        metrics_id, response_sent_at, response_length, response_certainty
+    await AnalyzeRequestMetrics.update(
+        id_=metrics_id,
+        response_sent_at=response_sent_at,
+        response_length=response_length,
+        response_certainty=response_certainty,
+        compressed_response=compressed_response,
     )
 
 
-def track_request():
+def track_request(name=None):
     """
-    Decorator to track requests metrics
+    Decorator to track requests/responses metrics
+
+    On entering the decorated function, it registers the time for the request
+    and saves the passed log content.
+    On exiting the decorated function, it registers the time for the response
+    and saves the generated response.
+
+    Use it to decorate server endpoints that generate an LLM response
+    as in the following example:
+
+    >>> @app.post("/analyze", response_model=Response)
+    >>> @track_request()
+    >>> async def analyze_log(build_log):
+    >>>     pass
+
+    Warning: the decorators' order is important!
+    The function returned by the *track_request* decorator is the
+    server API function we want to be called by FastAPI.
     """
 
     def decorator(f):
         @wraps(f)
         async def async_decorated_function(*args, **kwargs):
-            metrics_id = add_new_metrics(f.__name__, kwargs["build_log"])
+            log_url = kwargs["build_log"].url
+            metrics_id = await add_new_metrics(
+                api_name=EndpointType(name if name else f.__name__),
+                url=log_url, http_session=kwargs["http_session"]
+            )
             response = await f(*args, **kwargs)
-            update_metrics(metrics_id, response)
-            return response
-
-        @wraps(f)
-        def sync_decorated_function(*args, **kwargs):
-            metrics_id = add_new_metrics(f.__name__, kwargs["build_log"])
-            response = f(*args, **kwargs)
-            update_metrics(metrics_id, response)
+            await update_metrics(metrics_id, response)
             return response
 
         if inspect.iscoroutinefunction(f):
             return async_decorated_function
-        return sync_decorated_function
+        raise NotImplementedError("An async coroutine is needed")
 
     return decorator
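
For context, the reworked track_request decorator now assumes an async endpoint that receives the build log and an aiohttp session as keyword arguments named exactly build_log and http_session; it records the request before the call and the response after it. Below is a rough usage sketch under those assumptions. The endpoint body, the dependency that supplies the session, and the assumption that models.BuildLog and models.Response are the right request/response models are illustrative; they are not taken from the package's server.py.

import aiohttp
from fastapi import Depends, FastAPI

from logdetective.server import models
from logdetective.server.metric import track_request

app = FastAPI()


async def get_http_session() -> aiohttp.ClientSession:
    # Illustrative dependency; the real server manages its session lifecycle itself.
    return aiohttp.ClientSession()


@app.post("/analyze", response_model=models.Response)
@track_request()  # order matters: FastAPI must register the wrapper, not the raw function
async def analyze_log(
    build_log: models.BuildLog,
    http_session: aiohttp.ClientSession = Depends(get_http_session),
):
    # The decorator reads kwargs["build_log"].url and kwargs["http_session"],
    # so both must arrive as keyword arguments with these names, and the
    # function name (or the decorator's `name` argument) must map to a valid
    # EndpointType value. The actual analysis call is omitted here.
    ...

Because the decorator now raises NotImplementedError for plain functions, only coroutine endpoints can be tracked this way.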