Agenta-AI · jp-agenta · Nov 11, 2025
diff --git a/.claude/agents/changelog-editor.md b/.claude/agents/changelog-editor.md
diff --git a/README.md b/README.md
@@ -2,12 +2,11 @@
 <p align="center">
   <a href="https://agenta.ai?utm_source=github&utm_medium=referral&utm_campaign=readme">
       <picture >
-        <source width="275" media="(prefers-color-scheme: dark)" srcset="https://github.com/user-attachments/assets/97e31bfc-b1fc-4d19-b443-5aedf6029017"  >
-        <source width="275" media="(prefers-color-scheme: light)" srcset="https://github.com/user-attachments/assets/fdc5f23f-2095-4cfc-9511-14c6851c1262"  >
+        <source width="275" media="(prefers-color-scheme: dark)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/cdddf5ad-2352-4920-b1d9-ae7f8d9d7735"  >
+        <source width="275" media="(prefers-color-scheme: light)" srcset="https://github.com/Agenta-AI/agenta/assets/4510758/ab75cbac-b807-496f-aab3-57463a33f726"  >
         <img alt="Shows the logo of agenta" src="https://github.com/Agenta-AI/agenta/assets/4510758/68e055d4-d7b8-4943-992f-761558c64253" >
       </picture>
   </a>
-
 <div align="center">
   <strong> <h1> The Open-source LLMOps Platform </h1></strong>
   Build reliable LLM applications faster with integrated prompt management, evaluation, and observability.
@@ -84,15 +83,15 @@ Agenta is a platform for building production-grade LLM applications. It helps **
 Collaborate with Subject Matter Experts (SMEs) on prompt engineering and make sure nothing breaks in production.
 
 - **Interactive Playground**: Compare prompts side by side against your test cases
-- **Multi-Model Support**: Experiment with 50+ LLM models or [bring-your-own models](https://docs.agenta.ai/prompt-engineering/playground/custom-providers?utm_source=github&utm_medium=referral&utm_campaign=readme)
+- **Multi-Model Support**: Experiment with 50+ LLM models or [bring-your-own models](https://docs.agenta.ai/prompt-engineering/playground/adding-custom-providers?utm_source=github&utm_medium=referral&utm_campaign=readme)
 - **Version Control**: Version prompts and configurations with branching and environments
 - **Complex Configurations**: Enable SMEs to collaborate on [complex configuration schemas](https://docs.agenta.ai/custom-workflows/overview?utm_source=github&utm_medium=referral&utm_campaign=readme) beyond simple prompts
 
-[Explore prompt management →](https://docs.agenta.ai/prompt-engineering/concepts?utm_source=github&utm_medium=referral&utm_campaign=readme)
+[Explore prompt management →](https://docs.agenta.ai/prompt-engineering/overview?utm_source=github&utm_medium=referral&utm_campaign=readme)
 
 ### 📊 Evaluation & Testing
 Evaluate your LLM applications systematically with both human and automated feedback.
-- **Flexible Testsets**: Create testcases from production data, playground experiments, or upload CSVs
+- **Flexible Test Sets**: Create test cases from production data, playground experiments, or upload CSVs
 - **Pre-built and Custom Evaluators**: Use LLM-as-judge, one of our 20+ pre-built evaluators, or your custom evaluators
 - **UI and API Access**: Run evaluations via UI (for SMEs) or programmatically (for engineers)
 - **Human Feedback Integration**: Collect and incorporate expert annotations

diff --git a/api/ee/databases/postgres/migrations/core/data_migrations/projects.py b/api/ee/databases/postgres/migrations/core/data_migrations/projects.py
@@ -21,7 +21,7 @@
     EvaluatorConfigDB,
     HumanEvaluationDB,
     HumanEvaluationScenarioDB,
-    TestsetDB,
+    TestSetDB,
 )
 
 
@@ -38,7 +38,7 @@
     EvaluatorConfigDB,  # have workspace_id
     HumanEvaluationDB,  # have workspace_id
     HumanEvaluationScenarioDB,  # have workspace_id
-    TestsetDB,  # have workspace_id
+    TestSetDB,  # have workspace_id
 ]
 
 

diff --git a/api/ee/databases/postgres/migrations/core/data_migrations/testsets.py b/api/ee/databases/postgres/migrations/core/data_migrations/testsets.py
@@ -21,7 +21,7 @@
 )
 from oss.src.dbs.postgres.git.dao import GitDAO
 from oss.src.core.testcases.service import TestcasesService
-from oss.src.models.deprecated_models import DeprecatedTestsetDB
+from oss.src.models.deprecated_models import DeprecatedTestSetDB
 from oss.src.core.testsets.service import TestsetsService, SimpleTestsetsService
 
 
@@ -81,8 +81,8 @@ async def migration_old_testsets_to_new_testsets(
         # Count total rows with a non-null project_id
         total_query = (
             select(func.count())
-            .select_from(DeprecatedTestsetDB)
-            .filter(DeprecatedTestsetDB.project_id.isnot(None))
+            .select_from(DeprecatedTestSetDB)
+            .filter(DeprecatedTestSetDB.project_id.isnot(None))
         )
         result = await connection.execute(total_query)
         total_rows = result.scalar()
@@ -98,8 +98,8 @@ async def migration_old_testsets_to_new_testsets(
         while offset < total_testsets:
             # STEP 1: Fetch a batch of deprecated testsets with non-null project_id
             result = await connection.execute(
-                select(DeprecatedTestsetDB)
-                .filter(DeprecatedTestsetDB.project_id.isnot(None))
+                select(DeprecatedTestSetDB)
+                .filter(DeprecatedTestSetDB.project_id.isnot(None))
                 .offset(offset)
                 .limit(DEFAULT_BATCH_SIZE)
             )

diff --git a/api/ee/databases/postgres/migrations/core/versions/863f8ebc200f_extend_app_type_again.py b/api/ee/databases/postgres/migrations/core/versions/863f8ebc200f_extend_app_type_again.py
diff --git a/api/ee/databases/postgres/migrations/core/versions/baa02d66a365_migrate_code_evaluators.py b/api/ee/databases/postgres/migrations/core/versions/baa02d66a365_migrate_code_evaluators.py
diff --git a/api/ee/docker/Dockerfile.dev b/api/ee/docker/Dockerfile.dev
@@ -18,13 +18,12 @@ RUN pip install --upgrade pip \
 COPY ./ee /app/ee/
 COPY ./oss /app/oss/
 COPY ./entrypoint.py ./pyproject.toml /app/
-#
 
 RUN poetry config virtualenvs.create false \
     && poetry install --no-interaction --no-ansi
-#
+    # && pip install -e /sdk/
 
-ENV PYTHONPATH=/sdk:$PYTHONPATH
+# ENV PYTHONPATH=/sdk:$PYTHONPATH
 
 COPY ./ee/src/crons/meters.sh /meters.sh
 COPY ./ee/src/crons/meters.txt /etc/cron.d/meters-cron
@@ -34,8 +33,8 @@ RUN cat -A /etc/cron.d/meters-cron
 RUN chmod +x /meters.sh \
     && chmod 0644 /etc/cron.d/meters-cron
 
-COPY ./oss/src/crons/queries.sh /queries.sh
-COPY ./oss/src/crons/queries.txt /etc/cron.d/queries-cron
+COPY ./ee/src/crons/queries.sh /queries.sh
+COPY ./ee/src/crons/queries.txt /etc/cron.d/queries-cron
 RUN sed -i -e '$a\' /etc/cron.d/queries-cron
 RUN cat -A /etc/cron.d/queries-cron
 

diff --git a/api/ee/docker/Dockerfile.gh b/api/ee/docker/Dockerfile.gh
@@ -18,11 +18,10 @@ RUN pip install --upgrade pip \
 COPY ./ee /app/ee/
 COPY ./oss /app/oss/
 COPY ./entrypoint.py ./pyproject.toml /app/
-COPY ./sdk /sdk/
 
 RUN poetry config virtualenvs.create false \
-    && poetry install --no-interaction --no-ansi \
-    && pip install --force-reinstall --upgrade /sdk/
+    && poetry install --no-interaction --no-ansi
+#
 
 #
 
@@ -34,8 +33,8 @@ RUN cat -A /etc/cron.d/meters-cron
 RUN chmod +x /meters.sh \
     && chmod 0644 /etc/cron.d/meters-cron
 
-COPY ./oss/src/crons/queries.sh /queries.sh
-COPY ./oss/src/crons/queries.txt /etc/cron.d/queries-cron
+COPY ./ee/src/crons/queries.sh /queries.sh
+COPY ./ee/src/crons/queries.txt /etc/cron.d/queries-cron
 RUN sed -i -e '$a\' /etc/cron.d/queries-cron
 RUN cat -A /etc/cron.d/queries-cron