
Commit

merge main
jp-agenta committed Nov 22, 2024
2 parents 8e1f13b + 1221f27 commit 216b963
Showing 35 changed files with 879 additions and 799 deletions.
154 changes: 66 additions & 88 deletions README.md
@@ -1,26 +1,25 @@
<div align="center" style="margin: 30px">
<a href="https://agenta.ai/">
<div align="center" >
<p align="center">
<a href="https://agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
<picture >
<source width="500" media="(prefers-color-scheme: dark)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/cdddf5ad-2352-4920-b1d9-ae7f8d9d7735" >
<source width="500" media="(prefers-color-scheme: light)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/ab75cbac-b807-496f-aab3-57463a33f726" >
<source width="275" media="(prefers-color-scheme: dark)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/cdddf5ad-2352-4920-b1d9-ae7f8d9d7735" >
<source width="275" media="(prefers-color-scheme: light)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/ab75cbac-b807-496f-aab3-57463a33f726" >
<img alt="Shows the logo of agenta" src="https://github.com/Agenta-AI/agenta/assets/4510758/68e055d4-d7b8-4943-992f-761558c64253" >
</picture>
</div>
</a>
<h4 align="center">
<a href="https://agenta.ai">Home Page</a> |
<a href="https://join.slack.com/t/agenta-hq/shared_invite/zt-1zsafop5i-Y7~ZySbhRZvKVPV5DO_7IA">Slack</a> |
<a href="https://docs.agenta.ai/">Documentation</a>
</h4>
</p>
<p align="center">
<a href="https://docs.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">Documentation</a> |
<a href="https://agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">Website</a> |
<a href="https://join.slack.com/t/agenta-hq/shared_invite/zt-1zsafop5i-Y7~ZySbhRZvKVPV5DO_7IA">Slack</a>
</p>
<div align="center">
<strong> <h2> Collaborate on prompts, evaluate, and deploy LLM applications with confidence </h2></strong>
The open-source LLM developer platform for prompt-engineering, evaluation, human feedback, and deployment of complex LLM apps.
<strong> <h2> The Open-Source LLMOps Platform </h2></strong>
Prompt playground, prompt management, evaluation, and observability
</div>
</br>
<p align="center">
<img src="https://img.shields.io/badge/license-MIT-blue.svg" alt="MIT license." />
<a href="https://docs.agenta.ai/">
<a href="https://docs.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
<img src="https://img.shields.io/badge/Doc-online-green" alt="Doc">
</a>

@@ -49,21 +48,25 @@
</a>
</p>

</br>

<a href="https://cloud.agenta.ai">
<picture>
<img src="https://github.com/Agenta-AI/agenta/assets/4510758/d622f268-c295-42d4-a43c-548b611ff6f2" />
</picture>
</a>

<br>
<br />
<br />
<div align="center" >
<p align="center">
<a href="https://cloud.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
<picture >
<img alt="Glamour Shot" src="https://github.com/user-attachments/assets/32e95ddb-e001-4462-b92e-72bf4cc78597" >
<source width="275" media="(prefers-color-scheme: dark)" srcset="https://github.com/user-attachments/assets/b8912ecb-c7a0-47bd-8507-29b12382fef6" >
<source width="275" media="(prefers-color-scheme: light)" srcset="https://github.com/user-attachments/assets/f133dd08-04a3-4b20-b047-22f8f841cfbb" >
<img alt="Try Agenta Live Demo" src="https://github.com/Agenta-AI/agenta/assets/4510758/68e055d4-d7b8-4943-992f-761558c64253" >
</picture>
</a>
</p>

<br/>
<br />
<div align="center" >
<a href="https://cloud.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
<picture >
<img width="800" alt="Screenshot Agenta" src="https://github.com/user-attachments/assets/32e95ddb-e001-4462-b92e-72bf4cc78597" >
</picture>
</a>
</div>
</div>
<br />
@@ -72,91 +75,66 @@
---

<h3 align="center">
<a href="#quick-start"><b>Quick Start</b></a> &bull;
<a href="#features"><b>Features</b></a> &bull;
<a href="https://docs.agenta.ai"><b>Documentation</b></a> &bull;
<a href="#enterprise-support"><b>Enterprise</b></a> &bull;
<a href="https://github.com/orgs/Agenta-AI/projects/13"><b>Roadmap</b></a> &bull;
<a href="https://join.slack.com/t/agenta-hq/shared_invite/zt-1zsafop5i-Y7~ZySbhRZvKVPV5DO_7IA"><b>Join Our Slack</b></a> &bull;
<a href="#contributing"><b>Contributing</b></a>
<a href="https://docs.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme"><b>Documentation</b></a> &bull;
<a href="https://docs.agenta.ai/changelog/main?utm_source=github&utm_medium=referral&utm_campaign=readme"><b>Changelog</b></a> &bull;
<a href="https://agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme"><b>Website</b></a> &bull;
<a href="https://cloud.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme"><b>Agenta Cloud</b></a>

</h3>

---

# ⭐️ Why Agenta?

Agenta is an end-to-end LLM developer platform. It provides the tools for **prompt engineering and management**, ⚖️ **evaluation**, **human annotation**, and :rocket: **deployment**, all without imposing any restrictions on your choice of framework, library, or model.

Agenta allows developers and product teams to collaborate in building production-grade LLM-powered applications in less time.

### With Agenta, you can:

- [🧪 **Experiment** and **compare** prompts](https://docs.agenta.ai/prompt_management/prompt_engineering) on [any LLM workflow](https://docs.agenta.ai/prompt_management/setting_up/custom_applications) (chain-of-prompts, Retrieval Augmented Generation (RAG), LLM agents...)
- ✍️ Collect and [**annotate golden test sets**](https://docs.agenta.ai/evaluation/test_sets) for evaluation
- 📈 [**Evaluate** your application](https://docs.agenta.ai/evaluation/automatic_evaluation) with pre-existing or [**custom evaluators**](https://docs.agenta.ai/evaluation/custom_evaluator)
- [🔍 **Annotate** and **A/B test**](https://docs.agenta.ai/evaluation/human_evaluation) your applications with **human feedback**
- [🤝 **Collaborate with product teams**](https://docs.agenta.ai/misc/team_management) for prompt engineering and evaluation
- [🚀 **Deploy your application**](https://docs.agenta.ai/prompt_management/deployment) in one click from the UI, through the CLI, or through GitHub workflows.
# What is Agenta?

### Works with any LLM app workflow
Agenta is a platform for building production-grade LLM applications. It helps **engineering and product teams** create reliable LLM apps faster.

Agenta enables prompt engineering and evaluation on any LLM app architecture:

- Chain of prompts
- RAG
- Agents

It works with any framework, such as [Langchain](https://www.langchain.com/) and [LlamaIndex](https://www.llamaindex.ai/), and any LLM provider (OpenAI, Cohere, Mistral).

# Quick Start

### [Get started for free](https://cloud.agenta.ai?utm_source=github&utm_medium=readme&utm_campaign=github)

### [Explore the Docs](https://docs.agenta.ai/)

### [Create your first application in one minute](https://docs.agenta.ai/getting_started/quick-start)

### [Create an application using Langchain](https://docs.agenta.ai/guides/tutorials/first-app-with-langchain)

### [Self-host agenta](https://docs.agenta.ai/self-host/host-locally)

### [Check the Cookbook](https://docs.agenta.ai/guides/cookbooks/evaluations_with_sdk)
Agenta provides end-to-end tools for the entire LLMOps workflow: building (**LLM playground**, **evaluation**), deploying (**prompt and configuration management**), and monitoring (**LLM observability and tracing**).

# Features

| Playground | Evaluation |
| ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
| Compare and version prompts for any LLM app, from single prompt to agents. <br/> <video src="https://github.com/Agenta-AI/agenta/assets/4510758/8b736d2b-7c61-414c-b534-d95efc69134c" controls="controls" style="max-width:100%;"> | Define test sets, then evaluate manually or programmatically your different variants.<br/> <video src="https://github.com/Agenta-AI/agenta/assets/4510758/8c6997c6-da87-46ad-a81f-e15e277263d2" controls="controls" style="max-width:100%;"> |
| Human annotation | Deployment |
| Use Human annotator to A/B test and score your LLM apps. <br/> <img width="750" alt="Screenshot 2024-01-28 at 12 57 46" src="https://github.com/Agenta-AI/agenta/assets/4510758/bf62a697-bf19-4ba9-850e-742fbfb75424"> | When you are ready, deploy your LLM applications as APIs in one click.<br/>![](https://github.com/Agenta-AI/agenta/blob/main/docs/images/endpoint.gif) |

# Enterprise Support

Contact us here for enterprise support and early access to agenta self-managed enterprise with Kubernetes support. <br/><br/>
<a href="https://cal.com/mahmoud-mabrouk-ogzgey/demo"><img src="https://cal.com/book-with-cal-dark.svg" alt="Book us"></a>
- **Prompt Playground**: Experiment, iterate on prompts, and compare outputs from over 50 LLM models side by side ([docs](https://docs.agenta.ai/prompt-management/using-the-playground?utm_source=github&utm_medium=referral&utm_campaign=readme))
- **Custom Workflows**: Build a playground for any custom LLM workflow, such as RAG or agents. Enable the whole team to iterate on its parameters and evaluate it from the web UI.
- **LLM Evaluation**: Run evaluation suites from the web UI using predefined evaluators such as LLM-as-a-judge, RAG evaluators, or custom code evaluators. ([docs](https://docs.agenta.ai/evaluation/overview?utm_source=github&utm_medium=referral&utm_campaign=readme))
- **Human Evaluation**: Collaborate with subject-matter experts on human evaluation, including A/B testing and annotating golden test sets.
- **Prompt Management**: Version your prompts and manage them across different environments ([docs](https://docs.agenta.ai/prompt-management/overview?utm_source=github&utm_medium=referral&utm_campaign=readme), [quick start](https://docs.agenta.ai/prompt-management/quick-start?utm_source=github&utm_medium=referral&utm_campaign=readme))
- **LLM Tracing**: Observe and debug your apps with integrations to most providers and frameworks ([docs](https://docs.agenta.ai/observability/overview?utm_source=github&utm_medium=referral&utm_campaign=readme), [quick start](https://docs.agenta.ai/observability/quickstart?utm_source=github&utm_medium=referral&utm_campaign=readme))
- **LLM Monitoring**: Track cost and latency and compare different deployments.


# Getting Started
## Agenta Cloud:
The easiest way to get started is through Agenta Cloud. It is free to sign up and comes with a generous free tier.

<a href="https://cloud.agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
<picture >
<source width="160" media="(prefers-color-scheme: dark)" srcset="https://github.com/user-attachments/assets/759422d8-01bc-4503-bf3c-b5871c99359a" >
<source width="160" media="(prefers-color-scheme: light)" srcset="https://github.com/user-attachments/assets/ffa9af5f-0981-4e95-9272-cb35eedb6780" >
<img alt="Get Started with Agenta Cloud" src="https://github.com/user-attachments/assets/ffa9af5f-0981-4e95-9272-cb35eedb6780" >
</picture>
</a>

## Self-host:
```
mkdir agenta && cd agenta
curl -L https://raw.githubusercontent.com/agenta-ai/agenta/main/docker-compose.gh.yml -o docker-compose.gh.yml
docker compose -f docker-compose.gh.yml up -d
```

# Disabling Anonymized Tracking

By default, Agenta automatically reports anonymized basic usage statistics. This helps us understand how Agenta is used and track its overall usage and growth. This data does not include any sensitive information.

To disable anonymized telemetry, follow these steps:
By default, Agenta automatically reports anonymized basic usage statistics. This helps us understand how Agenta is used and track its overall usage and growth. This data does not include any sensitive information. To disable anonymized telemetry, follow these steps:

- For web: Set `TELEMETRY_TRACKING_ENABLED` to `false` in your `agenta-web/.env` file.
- For CLI: Set `telemetry_tracking_enabled` to `false` in your `~/.agenta/config.toml` file.

After making this change, restart Agenta Compose.

# ⭐️ Join Our Team

- [Founding Product Engineer Frontend](https://agentaai.notion.site/Founding-Product-Engineer-Frontend-b6d26a3e9b254be6b6c2bfffbf0b53c5)

# Contributing

We warmly welcome contributions to Agenta. Feel free to submit issues, fork the repository, and send pull requests.

We usually hang out in our Slack. Feel free to [join our Slack and ask us anything](https://join.slack.com/t/agenta-hq/shared_invite/zt-1zsafop5i-Y7~ZySbhRZvKVPV5DO_7IA).

Check out our [Contributing Guide](https://docs.agenta.ai/misc/contributing/getting-started) for more information.
Check out our [Contributing Guide](https://docs.agenta.ai/misc/contributing/getting-started?utm_source=github&utm_medium=referral&utm_campaign=readme) for more information.

## Contributors ✨

5 changes: 3 additions & 2 deletions agenta-backend/agenta_backend/core/observability/utils.py
@@ -41,7 +41,7 @@ def _is_uuid_key(key: str) -> bool:
"root.id",
"tree.id",
"node.id",
"parend.id",
"parent.id",
)


@@ -152,6 +152,7 @@ def parse_ingest_value(
attributes[key] = to_type(attributes[key])
except ValueError:
print_exc()
print(f"key='{key}' attribute='{attributes[key]}' type='{to_type}'")

del attributes[key]

@@ -167,7 +168,7 @@ def parse_ingest(
}
for field, attributes in typecheck.items():
if attributes is not None:
for key in attributes.keys():
for key in list(attributes.keys()):
scoped_key = f"{field}.{key}"
if _is_uuid_key(scoped_key):
parse_ingest_value(attributes, UUID, key)
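
The switch from `attributes.keys()` to `list(attributes.keys())` matters because `parse_ingest_value` deletes keys from `attributes` when a value fails to parse, and deleting from a dict while iterating over its live keys view raises `RuntimeError`. A minimal, self-contained illustration of the difference (the values are made up, not from the codebase):

```python
attributes = {"id": "not-a-uuid", "name": "demo"}

try:
    for key in attributes.keys():  # live view over the dict
        del attributes[key]        # mutating while iterating
except RuntimeError as exc:
    print(exc)  # "dictionary changed size during iteration"

attributes = {"id": "not-a-uuid", "name": "demo"}
for key in list(attributes.keys()):  # snapshot of the keys
    del attributes[key]              # safe: iteration runs over the copy
print(attributes)  # {}
```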
4 changes: 2 additions & 2 deletions agenta-backend/agenta_backend/routers/permissions_router.py
@@ -29,8 +29,8 @@ def __init__(
class Deny(HTTPException):
def __init__(self) -> None:
super().__init__(
status_code=401,
detail="Unauthorized",
status_code=403,
detail="Forbidden",
)
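
The status-code change follows standard HTTP semantics: 401 means the request lacks valid credentials, while 403 means the caller is identified but not allowed, which is what a permission check should return. A small sketch of how a `Deny`-style exception is typically raised from a FastAPI route (illustrative only, not the actual permissions router):

```python
from fastapi import FastAPI, HTTPException

app = FastAPI()

class Deny(HTTPException):
    def __init__(self) -> None:
        super().__init__(status_code=403, detail="Forbidden")

@app.get("/resource")
async def read_resource(allowed: bool = False):
    if not allowed:
        raise Deny()  # caller is known, but lacks permission
    return {"ok": True}
```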


28 changes: 22 additions & 6 deletions agenta-backend/agenta_backend/services/llm_apps_service.py
@@ -3,7 +3,7 @@
import asyncio
import traceback
import aiohttp
from typing import Any, Dict, List
from typing import Any, Dict, List, Optional


from agenta_backend.models.shared_models import InvokationResult, Result, Error
@@ -362,7 +362,17 @@ async def batch_invoke(
list_of_app_outputs: List[
InvokationResult
] = [] # Outputs after running all batches
openapi_parameters = await get_parameters_from_openapi(uri + "/openapi.json")

headers = None
if isCloudEE():
secret_token = await sign_secret_token(user_id, project_id, None)

headers = {"Authorization": f"Secret {secret_token}"}

openapi_parameters = await get_parameters_from_openapi(
uri + "/openapi.json",
headers,
)

async def run_batch(start_idx: int):
tasks = []
@@ -402,7 +412,10 @@ async def run_batch(start_idx: int):
return list_of_app_outputs


async def get_parameters_from_openapi(uri: str) -> List[Dict]:
async def get_parameters_from_openapi(
uri: str,
headers: Optional[Dict[str, str]],
) -> List[Dict]:
"""
Parse the OpenAPI schema of an LLM app to return the list of parameters it takes, with their types as determined by the x-parameter
Args:
Expand All @@ -417,7 +430,7 @@ async def get_parameters_from_openapi(uri: str) -> List[Dict]:
"""

schema = await _get_openai_json_from_uri(uri)
schema = await _get_openai_json_from_uri(uri, headers)

try:
body_schema_name = (
@@ -447,9 +460,12 @@ async def get_parameters_from_openapi(
return parameters


async def _get_openai_json_from_uri(uri):
async def _get_openai_json_from_uri(
uri: str,
headers: Optional[Dict[str, str]],
):
async with aiohttp.ClientSession() as client:
resp = await client.get(uri, timeout=5)
resp = await client.get(uri, headers=headers, timeout=5)
resp_text = await resp.text()
json_data = json.loads(resp_text)
return json_data
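
For callers, the visible change is the extra `headers` argument: self-hosted deployments can pass `None` (aiohttp treats `headers=None` as "no extra headers"), while cloud/EE deployments pass the signed token, mirroring the `isCloudEE()` branch in `batch_invoke` above. A rough caller-side sketch (the URI and IDs are placeholders):

```python
import asyncio

from agenta_backend.services.llm_apps_service import get_parameters_from_openapi

async def main() -> None:
    uri = "http://localhost/my-app"  # placeholder app URI

    # OSS / self-hosted: no Authorization header is needed.
    params = await get_parameters_from_openapi(uri + "/openapi.json", None)

    # Cloud/EE (assumption, mirroring batch_invoke):
    # secret_token = await sign_secret_token(user_id, project_id, None)
    # params = await get_parameters_from_openapi(
    #     uri + "/openapi.json",
    #     {"Authorization": f"Secret {secret_token}"},
    # )

    print(params)

# asyncio.run(main())  # requires a running app that serves /openapi.json
```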
18 changes: 17 additions & 1 deletion agenta-backend/agenta_backend/tasks/evaluations.py
@@ -6,6 +6,10 @@
from celery import shared_task, states

from agenta_backend.utils.common import isCloudEE

if isCloudEE():
from agenta_backend.cloud.services.auth_helper import sign_secret_token

from agenta_backend.services import (
evaluators_service,
llm_apps_service,
@@ -143,8 +147,20 @@ def evaluate(
)

# 4. Evaluate the app outputs
secret_token = None
headers = None
if isCloudEE():
secret_token = loop.run_until_complete(
sign_secret_token(user_id, project_id, None)
)
if secret_token:
headers = {"Authorization": f"Secret {secret_token}"}

openapi_parameters = loop.run_until_complete(
llm_apps_service.get_parameters_from_openapi(uri + "/openapi.json")
llm_apps_service.get_parameters_from_openapi(
uri + "/openapi.json",
headers,
),
)

for data_point, app_output in zip(testset_db.csvdata, app_outputs): # type: ignore
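
Because the Celery task body is synchronous, the async `sign_secret_token` call has to be driven through the task's event loop with `loop.run_until_complete`, and the Authorization header is only built when a token is returned. A stripped-down illustration of that pattern (the coroutine below is a stand-in, not the real cloud/EE signer):

```python
import asyncio
from typing import Optional

async def sign_secret_token(user_id: str, project_id: str, _arg=None) -> str:
    # Stand-in for the real async signer, which only exists in cloud/EE builds.
    return f"signed-{user_id}-{project_id}"

def evaluate_like_task(user_id: str, project_id: str) -> Optional[dict]:
    loop = asyncio.new_event_loop()  # the real task also drives its own loop
    try:
        secret_token = loop.run_until_complete(
            sign_secret_token(user_id, project_id, None)
        )
        return {"Authorization": f"Secret {secret_token}"} if secret_token else None
    finally:
        loop.close()

print(evaluate_like_task("user-1", "project-1"))
```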
35 changes: 29 additions & 6 deletions agenta-cli/agenta/__init__.py
@@ -1,3 +1,5 @@
from typing import Any, Callable, Optional

from .sdk.utils.preinit import PreInitObject

import agenta.client.backend.types as client_types # pylint: disable=wrong-import-order
@@ -18,7 +20,7 @@
)

from .sdk.utils.logging import log as logging
from .sdk.tracing import Tracing
from .sdk.tracing import Tracing, get_tracer
from .sdk.decorators.tracing import instrument
from .sdk.tracing.conventions import Reference
from .sdk.decorators.routing import entrypoint, app, route
@@ -36,15 +38,36 @@
DEFAULT_AGENTA_SINGLETON_INSTANCE = AgentaSingleton()

types = client_types
tracing = None

api = None
async_api = None

tracing = DEFAULT_AGENTA_SINGLETON_INSTANCE.tracing # type: ignore
tracer = get_tracer(tracing)

def init(*args, **kwargs):
global api, async_api, tracing, config
_init(*args, **kwargs)

tracing = DEFAULT_AGENTA_SINGLETON_INSTANCE.tracing # type: ignore
def init(
host: Optional[str] = None,
api_key: Optional[str] = None,
config_fname: Optional[str] = None,
redact: Optional[Callable[..., Any]] = None,
redact_on_error: Optional[bool] = True,
# DEPRECATING
app_id: Optional[str] = None,
):
global api, async_api, tracing, tracer # pylint: disable=global-statement

_init(
host=host,
api_key=api_key,
config_fname=config_fname,
redact=redact,
redact_on_error=redact_on_error,
app_id=app_id,
)

api = DEFAULT_AGENTA_SINGLETON_INSTANCE.api # type: ignore
async_api = DEFAULT_AGENTA_SINGLETON_INSTANCE.async_api # type: ignore

tracing = DEFAULT_AGENTA_SINGLETON_INSTANCE.tracing # type: ignore
tracer = get_tracer(tracing)
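
With the explicit signature, callers get editor hints for the supported options instead of `*args, **kwargs`. A hedged usage sketch (the host and API key are placeholders, and the decorator-factory usage of `instrument` is assumed rather than shown in this diff):

```python
import agenta as ag

# Minimal sketch of the new explicit init() signature; values are placeholders.
ag.init(
    host="https://cloud.agenta.ai",  # assumption: your Agenta host
    api_key="YOUR_API_KEY",          # placeholder
    redact_on_error=True,            # default per the signature above
)

# instrument is re-exported by the package __init__; usage here is assumed.
@ag.instrument()
def summarize(text: str) -> str:
    return text[:100]

print(ag.tracer)  # module-level tracer created via get_tracer(tracing)
```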