agentEvaluation.title
agentEvaluation.subtitle
agentEvaluation.displayTypes.title
agentEvaluation.displayTypes.subtitle
agentEvaluation.displayTypes.items.agentTrace.title
agentEvaluation.displayTypes.items.agentTrace.description
agentEvaluation.displayTypes.items.webAgent.title
agentEvaluation.displayTypes.items.webAgent.description
agentEvaluation.displayTypes.items.interactiveChat.title
agentEvaluation.displayTypes.items.interactiveChat.description
agentEvaluation.displayTypes.items.liveAgent.title
agentEvaluation.displayTypes.items.liveAgent.description
agentEvaluation.displayTypes.items.codingTrace.title
agentEvaluation.displayTypes.items.codingTrace.description
agentEvaluation.schemas.title
agentEvaluation.schemas.subtitle
agentEvaluation.schemas.items.trajectoryEval.title
agentEvaluation.schemas.items.trajectoryEval.description
agentEvaluation.schemas.items.rubricEval.title
agentEvaluation.schemas.items.rubricEval.description
agentEvaluation.schemas.items.pairwise.title
agentEvaluation.schemas.items.pairwise.description
agentEvaluation.schemas.items.perTurn.title
agentEvaluation.schemas.items.perTurn.description
agentEvaluation.schemas.items.processReward.title
agentEvaluation.schemas.items.processReward.description
agentEvaluation.schemas.items.codeReview.title
agentEvaluation.schemas.items.codeReview.description
agentEvaluation.traceFormats.title
agentEvaluation.traceFormats.subtitle
| agentEvaluation.traceFormats.headers.converter | agentEvaluation.traceFormats.headers.source | agentEvaluation.traceFormats.headers.features |
|---|---|---|
| agentEvaluation.traceFormats.items.langchain.name | agentEvaluation.traceFormats.items.langchain.source | agentEvaluation.traceFormats.items.langchain.features |
| agentEvaluation.traceFormats.items.langfuse.name | agentEvaluation.traceFormats.items.langfuse.source | agentEvaluation.traceFormats.items.langfuse.features |
| agentEvaluation.traceFormats.items.openai.name | agentEvaluation.traceFormats.items.openai.source | agentEvaluation.traceFormats.items.openai.features |
| agentEvaluation.traceFormats.items.anthropic.name | agentEvaluation.traceFormats.items.anthropic.source | agentEvaluation.traceFormats.items.anthropic.features |
| agentEvaluation.traceFormats.items.mcp.name | agentEvaluation.traceFormats.items.mcp.source | agentEvaluation.traceFormats.items.mcp.features |
| agentEvaluation.traceFormats.items.opentelemetry.name | agentEvaluation.traceFormats.items.opentelemetry.source | agentEvaluation.traceFormats.items.opentelemetry.features |
| agentEvaluation.traceFormats.items.atif.name | agentEvaluation.traceFormats.items.atif.source | agentEvaluation.traceFormats.items.atif.features |
| agentEvaluation.traceFormats.items.webarena.name | agentEvaluation.traceFormats.items.webarena.source | agentEvaluation.traceFormats.items.webarena.features |
| agentEvaluation.traceFormats.items.rawWeb.name | agentEvaluation.traceFormats.items.rawWeb.source | agentEvaluation.traceFormats.items.rawWeb.features |
| agentEvaluation.traceFormats.items.claudeCode.name | agentEvaluation.traceFormats.items.claudeCode.source | agentEvaluation.traceFormats.items.claudeCode.features |
| agentEvaluation.traceFormats.items.aider.name | agentEvaluation.traceFormats.items.aider.source | agentEvaluation.traceFormats.items.aider.features |
| agentEvaluation.traceFormats.items.sweAgent.name | agentEvaluation.traceFormats.items.sweAgent.source | agentEvaluation.traceFormats.items.sweAgent.features |
| agentEvaluation.traceFormats.items.react.name | agentEvaluation.traceFormats.items.react.source | agentEvaluation.traceFormats.items.react.features |
agentEvaluation.codingAgents.title
agentEvaluation.codingAgents.subtitle
agentEvaluation.liveAgent.title
agentEvaluation.liveAgent.subtitle
agentEvaluation.liveAgent.backends.ollama.title
agentEvaluation.liveAgent.backends.ollama.description
agentEvaluation.liveAgent.backends.anthropic.title
agentEvaluation.liveAgent.backends.anthropic.description
agentEvaluation.liveAgent.backends.claudeSdk.title
agentEvaluation.liveAgent.backends.claudeSdk.description
agentEvaluation.comparison.title
agentEvaluation.comparison.subtitle
| agentEvaluation.comparison.headers.feature | agentEvaluation.comparison.headers.potato | agentEvaluation.comparison.headers.langsmith | agentEvaluation.comparison.headers.langfuse | agentEvaluation.comparison.headers.labelStudio | agentEvaluation.comparison.headers.argilla | agentEvaluation.comparison.headers.scaleAI |
|---|---|---|---|---|---|---|
| agentEvaluation.comparison.rows.traceFormats.feature | agentEvaluation.comparison.rows.traceFormats.potato | agentEvaluation.comparison.rows.traceFormats.langsmith | agentEvaluation.comparison.rows.traceFormats.langfuse | agentEvaluation.comparison.rows.traceFormats.labelStudio | agentEvaluation.comparison.rows.traceFormats.argilla | agentEvaluation.comparison.rows.traceFormats.scaleAI |
| agentEvaluation.comparison.rows.perStepAnnotation.feature | agentEvaluation.comparison.rows.perStepAnnotation.potato | agentEvaluation.comparison.rows.perStepAnnotation.langsmith | agentEvaluation.comparison.rows.perStepAnnotation.langfuse | agentEvaluation.comparison.rows.perStepAnnotation.labelStudio | agentEvaluation.comparison.rows.perStepAnnotation.argilla | agentEvaluation.comparison.rows.perStepAnnotation.scaleAI |
| agentEvaluation.comparison.rows.liveObservation.feature | agentEvaluation.comparison.rows.liveObservation.potato | agentEvaluation.comparison.rows.liveObservation.langsmith | agentEvaluation.comparison.rows.liveObservation.langfuse | agentEvaluation.comparison.rows.liveObservation.labelStudio | agentEvaluation.comparison.rows.liveObservation.argilla | agentEvaluation.comparison.rows.liveObservation.scaleAI |
| agentEvaluation.comparison.rows.pauseResume.feature | agentEvaluation.comparison.rows.pauseResume.potato | agentEvaluation.comparison.rows.pauseResume.langsmith | agentEvaluation.comparison.rows.pauseResume.langfuse | agentEvaluation.comparison.rows.pauseResume.labelStudio | agentEvaluation.comparison.rows.pauseResume.argilla | agentEvaluation.comparison.rows.pauseResume.scaleAI |
| agentEvaluation.comparison.rows.codeDiffRendering.feature | agentEvaluation.comparison.rows.codeDiffRendering.potato | agentEvaluation.comparison.rows.codeDiffRendering.langsmith | agentEvaluation.comparison.rows.codeDiffRendering.langfuse | agentEvaluation.comparison.rows.codeDiffRendering.labelStudio | agentEvaluation.comparison.rows.codeDiffRendering.argilla | agentEvaluation.comparison.rows.codeDiffRendering.scaleAI |
| agentEvaluation.comparison.rows.terminalRendering.feature | agentEvaluation.comparison.rows.terminalRendering.potato | agentEvaluation.comparison.rows.terminalRendering.langsmith | agentEvaluation.comparison.rows.terminalRendering.langfuse | agentEvaluation.comparison.rows.terminalRendering.labelStudio | agentEvaluation.comparison.rows.terminalRendering.argilla | agentEvaluation.comparison.rows.terminalRendering.scaleAI |
| agentEvaluation.comparison.rows.prmCollection.feature | agentEvaluation.comparison.rows.prmCollection.potato | agentEvaluation.comparison.rows.prmCollection.langsmith | agentEvaluation.comparison.rows.prmCollection.langfuse | agentEvaluation.comparison.rows.prmCollection.labelStudio | agentEvaluation.comparison.rows.prmCollection.argilla | agentEvaluation.comparison.rows.prmCollection.scaleAI |
| agentEvaluation.comparison.rows.codeReview.feature | agentEvaluation.comparison.rows.codeReview.potato | agentEvaluation.comparison.rows.codeReview.langsmith | agentEvaluation.comparison.rows.codeReview.langfuse | agentEvaluation.comparison.rows.codeReview.labelStudio | agentEvaluation.comparison.rows.codeReview.argilla | agentEvaluation.comparison.rows.codeReview.scaleAI |
| agentEvaluation.comparison.rows.pairwiseComparison.feature | agentEvaluation.comparison.rows.pairwiseComparison.potato | agentEvaluation.comparison.rows.pairwiseComparison.langsmith | agentEvaluation.comparison.rows.pairwiseComparison.langfuse | agentEvaluation.comparison.rows.pairwiseComparison.labelStudio | agentEvaluation.comparison.rows.pairwiseComparison.argilla | agentEvaluation.comparison.rows.pairwiseComparison.scaleAI |
| agentEvaluation.comparison.rows.rubricEval.feature | agentEvaluation.comparison.rows.rubricEval.potato | agentEvaluation.comparison.rows.rubricEval.langsmith | agentEvaluation.comparison.rows.rubricEval.langfuse | agentEvaluation.comparison.rows.rubricEval.labelStudio | agentEvaluation.comparison.rows.rubricEval.argilla | agentEvaluation.comparison.rows.rubricEval.scaleAI |
| agentEvaluation.comparison.rows.selfHosted.feature | agentEvaluation.comparison.rows.selfHosted.potato | agentEvaluation.comparison.rows.selfHosted.langsmith | agentEvaluation.comparison.rows.selfHosted.langfuse | agentEvaluation.comparison.rows.selfHosted.labelStudio | agentEvaluation.comparison.rows.selfHosted.argilla | agentEvaluation.comparison.rows.selfHosted.scaleAI |
| agentEvaluation.comparison.rows.free.feature | agentEvaluation.comparison.rows.free.potato | agentEvaluation.comparison.rows.free.langsmith | agentEvaluation.comparison.rows.free.langfuse | agentEvaluation.comparison.rows.free.labelStudio | agentEvaluation.comparison.rows.free.argilla | agentEvaluation.comparison.rows.free.scaleAI |
agentEvaluation.examples.title
agentEvaluation.examples.subtitle
agentEvaluation.examples.items.agentTraceEval.title
agentEvaluation.examples.items.agentTraceEval.description
agentEvaluation.examples.items.webAgentReview.title
agentEvaluation.examples.items.webAgentReview.description
agentEvaluation.examples.items.webAgentCreation.title
agentEvaluation.examples.items.webAgentCreation.description
agentEvaluation.examples.items.liveAgentEval.title
agentEvaluation.examples.items.liveAgentEval.description
agentEvaluation.examples.items.interactiveVlm.title
agentEvaluation.examples.items.interactiveVlm.description
agentEvaluation.examples.items.swebenchEval.title
agentEvaluation.examples.items.swebenchEval.description
agentEvaluation.examples.items.anthropicEval.title
agentEvaluation.examples.items.anthropicEval.description
agentEvaluation.examples.items.openaiEval.title
agentEvaluation.examples.items.openaiEval.description
agentEvaluation.examples.items.langchainIntegration.title
agentEvaluation.examples.items.langchainIntegration.description
agentEvaluation.examples.items.multiAgentEval.title
agentEvaluation.examples.items.multiAgentEval.description
agentEvaluation.examples.items.agentComparison.title
agentEvaluation.examples.items.agentComparison.description
agentEvaluation.examples.items.multiDimComparison.title
agentEvaluation.examples.items.multiDimComparison.description
agentEvaluation.examples.items.ragEvaluation.title
agentEvaluation.examples.items.ragEvaluation.description
agentEvaluation.examples.items.visualAgentEval.title
agentEvaluation.examples.items.visualAgentEval.description
agentEvaluation.cta.title
agentEvaluation.cta.subtitle