diff --git a/.speakeasy/in.openapi.yaml b/.speakeasy/in.openapi.yaml
index a56ecc47..72dc7d24 100644
--- a/.speakeasy/in.openapi.yaml
+++ b/.speakeasy/in.openapi.yaml
@@ -3649,6 +3649,125 @@ components:
         - prompt
         - completion
       type: object
+    BenchmarksAAItem:
+      example:
+        aa_name: GPT-4o
+        agentic_index: 58.3
+        coding_index: 65.8
+        intelligence_index: 71.2
+        model_permaslug: openai/gpt-4o
+        pricing:
+          completion: '0.00001'
+          prompt: '0.0000025'
+      properties:
+        aa_name:
+          description: Model name as listed on Artificial Analysis.
+          example: GPT-4o
+          type: string
+        agentic_index:
+          description: Artificial Analysis Agentic Index composite score. Higher is better.
+          example: 58.3
+          format: double
+          nullable: true
+          type: number
+        coding_index:
+          description: Artificial Analysis Coding Index composite score. Higher is better.
+          example: 65.8
+          format: double
+          nullable: true
+          type: number
+        intelligence_index:
+          description: Artificial Analysis Intelligence Index composite score. Higher is better.
+          example: 71.2
+          format: double
+          nullable: true
+          type: number
+        model_permaslug:
+          description: Stable OpenRouter model identifier.
+          example: openai/gpt-4o
+          type: string
+        pricing:
+          $ref: '#/components/schemas/BenchmarkPricing'
+      required:
+        - model_permaslug
+        - aa_name
+        - intelligence_index
+        - coding_index
+        - agentic_index
+        - pricing
+      type: object
+    BenchmarksAAMeta:
+      example:
+        as_of: '2026-06-03T12:00:00Z'
+        citation: 'Source: Artificial Analysis (artificialanalysis.ai) via OpenRouter (openrouter.ai/rankings).'
+        model_count: 50
+        source: artificial-analysis
+        source_url: https://artificialanalysis.ai
+        version: v1
+      properties:
+        as_of:
+          description: ISO-8601 timestamp of when this data was last updated.
+          example: '2026-06-03T12:00:00Z'
+          type: string
+        citation:
+          description: Required attribution when republishing this data.
+          example: 'Source: Artificial Analysis (artificialanalysis.ai) via OpenRouter (openrouter.ai/rankings).'
+          type: string
+        model_count:
+          description: Number of unique models in the response.
+          type: integer
+        source:
+          description: Data source identifier.
+          enum:
+            - artificial-analysis
+          type: string
+        source_url:
+          description: URL of the upstream data source.
+          enum:
+            - https://artificialanalysis.ai
+          type: string
+        version:
+          description: Dataset version.
+          enum:
+            - v1
+          type: string
+      required:
+        - as_of
+        - version
+        - source
+        - source_url
+        - citation
+        - model_count
+      type: object
+    BenchmarksAAResponse:
+      example:
+        data:
+          - aa_name: GPT-4o
+            agentic_index: 58.3
+            coding_index: 65.8
+            intelligence_index: 71.2
+            model_permaslug: openai/gpt-4o
+            pricing:
+              completion: '0.00001'
+              prompt: '0.0000025'
+        meta:
+          as_of: '2026-06-03T12:00:00Z'
+          citation: 'Source: Artificial Analysis (artificialanalysis.ai) via OpenRouter (openrouter.ai/rankings).'
+          model_count: 1
+          source: artificial-analysis
+          source_url: https://artificialanalysis.ai
+          version: v1
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/BenchmarksAAItem'
+          type: array
+        meta:
+          $ref: '#/components/schemas/BenchmarksAAMeta'
+      required:
+        - data
+        - meta
+      type: object
     BenchmarksDAItem:
       example:
         arena: models
@@ -23646,6 +23765,92 @@ paths:
         outputs:
           results: $.data
         type: offsetLimit
+  /datasets/benchmarks/artificial-analysis:
+    get:
+      description: >-
+        Returns composite index scores (Intelligence, Coding, Agentic) from Artificial Analysis for LLM models. Includes
+        OpenRouter pricing per model. Authenticate with any valid OpenRouter API key. Rate-limited to 30 requests/minute
+        per key and 500 requests/day per account.
+      operationId: getBenchmarksArtificialAnalysis
+      parameters:
+        - description: Max results to return (1–100, default 50).
+          in: query
+          name: max_results
+          required: false
+          schema:
+            default: 50
+            description: Max results to return (1–100, default 50).
+            example: 20
+            maximum: 100
+            minimum: 1
+            type: integer
+      responses:
+        '200':
+          content:
+            application/json:
+              example:
+                data:
+                  - aa_name: GPT-4o
+                    agentic_index: 58.3
+                    coding_index: 65.8
+                    intelligence_index: 71.2
+                    model_permaslug: openai/gpt-4o
+                    pricing:
+                      completion: '0.00001'
+                      prompt: '0.0000025'
+                meta:
+                  as_of: '2026-06-03T12:00:00Z'
+                  citation: 'Source: Artificial Analysis (artificialanalysis.ai) via OpenRouter (openrouter.ai/rankings).'
+                  model_count: 1
+                  source: artificial-analysis
+                  source_url: https://artificialanalysis.ai
+                  version: v1
+              schema:
+                $ref: '#/components/schemas/BenchmarksAAResponse'
+          description: Artificial Analysis composite index scores with pricing and attribution metadata.
+        '400':
+          content:
+            application/json:
+              example:
+                error:
+                  code: 400
+                  message: Invalid request parameters
+              schema:
+                $ref: '#/components/schemas/BadRequestResponse'
+          description: Bad Request - Invalid request parameters or malformed input
+        '401':
+          content:
+            application/json:
+              example:
+                error:
+                  code: 401
+                  message: Missing Authentication header
+              schema:
+                $ref: '#/components/schemas/UnauthorizedResponse'
+          description: Unauthorized - Authentication required or invalid credentials
+        '429':
+          content:
+            application/json:
+              example:
+                error:
+                  code: 429
+                  message: Rate limit exceeded
+              schema:
+                $ref: '#/components/schemas/TooManyRequestsResponse'
+          description: Too Many Requests - Rate limit exceeded
+        '500':
+          content:
+            application/json:
+              example:
+                error:
+                  code: 500
+                  message: Internal Server Error
+              schema:
+                $ref: '#/components/schemas/InternalServerResponse'
+          description: Internal Server Error - Unexpected server error
+      summary: Artificial Analysis Benchmark Indices
+      tags:
+        - Datasets
   /datasets/benchmarks/design-arena:
     get:
       description: >-