diff --git a/.all-contributorsrc b/.all-contributorsrc new file mode 100644 index 00000000..1a505349 --- /dev/null +++ b/.all-contributorsrc @@ -0,0 +1,20 @@ +{ + "files": ["README.md"], + "imageSize": 100, + "contributorsPerLine": 7, + "contributorsSortAlphabetically": true, + "badgeTemplate": "[![All Contributors](https://img.shields.io/badge/all_contributors-<%= contributors.length %>-orange.svg?style=flat-square)](#contributors-)", + "contributorTemplate": "\">\" width=\"<%= options.imageSize %>px;\" alt=\"<%= contributor.name %>\"/>
<%= contributor.name %>
", + "types": { + "code": { "symbol": "💻", "description": "Code" }, + "data": { "symbol": "🔣", "description": "Data" }, + "doc": { "symbol": "📖", "description": "Documentation" }, + "ideas": { "symbol": "🤔", "description": "Ideas, Planning, & Feedback" }, + "maintenance": { "symbol": "🚧", "description": "Maintenance" }, + "review": { "symbol": "👀", "description": "Reviewed Pull Requests" }, + "test": { "symbol": "⚠️", "description": "Tests" }, + "infra": { "symbol": "🔧", "description": "Infrastructure" } + }, + "skipCi": true, + "contributors": [] +} diff --git a/.editorconfig b/.editorconfig new file mode 100644 index 00000000..44ce5230 --- /dev/null +++ b/.editorconfig @@ -0,0 +1,21 @@ +root = true + +[*] +charset = utf-8 +end_of_line = lf +insert_final_newline = true +trim_trailing_whitespace = true +indent_style = space +indent_size = 2 + +[*.md] +trim_trailing_whitespace = false + +[*.yaml] +indent_size = 2 + +[*.yml] +indent_size = 2 + +[Makefile] +indent_style = tab diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS new file mode 100644 index 00000000..ff8d40a2 --- /dev/null +++ b/.github/CODEOWNERS @@ -0,0 +1,14 @@ +# Default reviewers for all changes +* @liushuai + +# Provider data changes +providers/ @liushuai + +# Type definitions +types/ @liushuai + +# CI/CD workflows +.github/workflows/ @liushuai + +# Documentation +docs/ @liushuai diff --git a/.github/FUNDING.yml b/.github/FUNDING.yml new file mode 100644 index 00000000..ff862f3b --- /dev/null +++ b/.github/FUNDING.yml @@ -0,0 +1,3 @@ +# These supported funding platforms will be linked from the repository sidebar + +github: i-need-token diff --git a/.github/ISSUE_TEMPLATE/bug_report.md b/.github/ISSUE_TEMPLATE/bug_report.md new file mode 100644 index 00000000..b7b37e2e --- /dev/null +++ b/.github/ISSUE_TEMPLATE/bug_report.md @@ -0,0 +1,30 @@ +--- +name: Bug Report +about: Report incorrect model data or a bug in a scrape script +title: "[Bug] " +labels: bug +--- + +## 
Description + + + +## Provider + + + +## Model ID + + + +## Expected Data + + + +## Current Data + + + +## Source + + diff --git a/.github/ISSUE_TEMPLATE/config.yml b/.github/ISSUE_TEMPLATE/config.yml new file mode 100644 index 00000000..ee50c7bf --- /dev/null +++ b/.github/ISSUE_TEMPLATE/config.yml @@ -0,0 +1,5 @@ +blank_issues_enabled: false +contact_links: + - name: ๐Ÿ’ฌ Ask a Question + url: https://github.com/i-need-token/ai-models/discussions + about: Ask questions and discuss the catalog with the community diff --git a/.github/ISSUE_TEMPLATE/data_update.md b/.github/ISSUE_TEMPLATE/data_update.md new file mode 100644 index 00000000..45fece32 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/data_update.md @@ -0,0 +1,22 @@ +--- +name: Data Update +about: Report outdated model data that needs updating +title: "[Data] " +labels: data, good first issue +--- + +## Provider + + + +## Model ID + + + +## What Changed + + + +## Source + + diff --git a/.github/ISSUE_TEMPLATE/feature_request.md b/.github/ISSUE_TEMPLATE/feature_request.md new file mode 100644 index 00000000..162dcb55 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/feature_request.md @@ -0,0 +1,27 @@ +--- +name: Feature request +about: Suggest a new feature, documentation page, or capability +title: "[Feature] " +labels: ["enhancement"] +assignees: "" +--- + +## Problem + + + +## Proposed Solution + + + +## Alternatives Considered + + + +## Additional Context + + + +## Would you be willing to submit a PR? 
+ +- [ ] Yes, I'd like to contribute this feature diff --git a/.github/ISSUE_TEMPLATE/provider_request.md b/.github/ISSUE_TEMPLATE/provider_request.md new file mode 100644 index 00000000..2fc50ed8 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/provider_request.md @@ -0,0 +1,40 @@ +--- +name: Provider Request +about: Request adding a new AI model provider to the catalog +title: "[Provider] " +labels: enhancement +--- + +## Provider Name + + + +## Provider URL + + + +## API Documentation + + + +## Data Source + +How can we obtain model data from this provider? + +- [ ] Public API (no auth required) +- [ ] Public API (auth required) +- [ ] Website (server-side rendered) +- [ ] Website (client-side rendered) +- [ ] Other: \***\*\_\_\_\*\*** + +## Pricing Model + +- [ ] Per-token pricing (USD/CNY/EUR) +- [ ] Per-second pricing +- [ ] Credit-based pricing +- [ ] No public pricing +- [ ] Other: \***\*\_\_\_\*\*** + +## Additional Context + + diff --git a/.github/ISSUE_TEMPLATE/stargazer.md b/.github/ISSUE_TEMPLATE/stargazer.md new file mode 100644 index 00000000..ee805856 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/stargazer.md @@ -0,0 +1,16 @@ +--- +name: ๐ŸŒŸ Stargazer +about: Leave a star and say hi! +title: "๐ŸŒŸ I starred this repo!" +labels: stargazer +--- + +Thanks for checking out the AI Models Catalog! ๐ŸŽ‰ + +If you find this project useful, please consider: + +- โญ **Starring** this repository โ€” it helps others discover it +- ๐Ÿฆ **Sharing** it on social media +- ๐Ÿ“ **Contributing** a new provider or fixing data + +Feel free to leave a comment below telling us how you use the catalog! diff --git a/.github/PULL_REQUEST_TEMPLATE.md b/.github/PULL_REQUEST_TEMPLATE.md new file mode 100644 index 00000000..4b6cad30 --- /dev/null +++ b/.github/PULL_REQUEST_TEMPLATE.md @@ -0,0 +1,25 @@ +## Description + + + +## Type of Change + +- [ ] New provider +- [ ] Data update (pricing, capabilities, etc.) 
+- [ ] Bug fix +- [ ] Documentation +- [ ] Refactor + +## Provider Affected + + + +## Validation + +- [ ] `npx tsx scripts/validate.ts` passes +- [ ] Data comes from first-party sources only +- [ ] No hardcoded model ID lists in scrape functions + +## Additional Notes + + diff --git a/.github/badges/models.json b/.github/badges/models.json new file mode 100644 index 00000000..4f27c22a --- /dev/null +++ b/.github/badges/models.json @@ -0,0 +1 @@ +{ "schemaVersion": 1, "label": "models", "message": "4587", "color": "green" } diff --git a/.github/badges/providers.json b/.github/badges/providers.json new file mode 100644 index 00000000..89c832bf --- /dev/null +++ b/.github/badges/providers.json @@ -0,0 +1 @@ +{ "schemaVersion": 1, "label": "providers", "message": "87", "color": "blue" } diff --git a/.github/dependabot.yml b/.github/dependabot.yml new file mode 100644 index 00000000..9d3e3db6 --- /dev/null +++ b/.github/dependabot.yml @@ -0,0 +1,19 @@ +version: 2 + +updates: + - package-ecosystem: npm + directory: / + schedule: + interval: weekly + open-pull-requests-limit: 5 + labels: + - dependencies + + - package-ecosystem: github-actions + directory: / + schedule: + interval: weekly + open-pull-requests-limit: 5 + labels: + - dependencies + - ci diff --git a/.github/discussions-setup.md b/.github/discussions-setup.md new file mode 100644 index 00000000..2da1cdb8 --- /dev/null +++ b/.github/discussions-setup.md @@ -0,0 +1,42 @@ +# GitHub Discussions Setup Guide + +Enable GitHub Discussions to create a community hub around the AI Models Catalog. + +## Steps + +1. Go to **Settings โ†’ Features** in the repository +2. Check โœ… **Discussions** +3. 
Create the following discussion categories: + +### Recommended Categories + +| Category | Format | Description | +| ---------------- | ------------ | --------------------------------------------- | +| 📢 Announcements | Announcement | New providers, data updates, breaking changes | +| 💬 General | Open-ended | Questions, ideas, show-and-tell | +| 🙏 Q&A | Q&A | How to use the catalog, data questions | +| 💡 Ideas | Open-ended | Feature requests, new docs suggestions | +| 🏷️ Show and Tell | Open-ended | Projects built with the catalog | + +### First Discussion Posts + +Create these seed discussions to set the tone: + +1. **Welcome to AI Models Catalog** (Announcement) + - Introduce the project, link to quick-start, invite contributions + +2. **What are you building with the catalog?** (Show and Tell) + - Encourage users to share their projects + +3. **Which provider should we add next?** (Ideas) + - Crowdsource new provider requests + +4. **Data quality report — how to report issues** (Q&A) + - Explain how to report stale or incorrect data + +## Benefits + +- **Reduces issue noise** — questions move to Discussions instead of Issues +- **Builds community** — users help each other, share projects +- **SEO boost** — public discussions are indexed by search engines +- **Feedback loop** — learn what users need most diff --git a/.github/labeler.yml b/.github/labeler.yml new file mode 100644 index 00000000..fa424d43 --- /dev/null +++ b/.github/labeler.yml @@ -0,0 +1,27 @@ +documentation: + - changed-files: + - any-glob-to-any-file: ["docs/**", "*.md", "README.md", "CONTRIBUTING.md"] + +data-update: + - changed-files: + - any-glob-to-any-file: ["providers/**/*.yaml", "providers/**/*.yml"] + +new-provider: + - changed-files: + - any-glob-to-any-file: ["providers/*/provider.yaml", "providers/*/scrape.ts"] + +ci: + - changed-files: + - any-glob-to-any-file: [".github/workflows/**", "action.yml"] + +dependencies: + - changed-files: + - 
any-glob-to-any-file: ["package.json", "package-lock.json"] + +types: + - changed-files: + - any-glob-to-any-file: ["types/**"] + +scripts: + - changed-files: + - any-glob-to-any-file: ["scripts/**"] diff --git a/.github/repo-settings.md b/.github/repo-settings.md new file mode 100644 index 00000000..79430127 --- /dev/null +++ b/.github/repo-settings.md @@ -0,0 +1,48 @@ +# GitHub Repository Settings + +This file documents the recommended GitHub repository settings for discoverability. + +## Repository Description + +``` +Structured YAML catalog of 4,587 AI models across 95 providers โ€” pricing, context windows, modalities, capabilities. First-party data with TypeScript types and Zod validation. +``` + +## Topics + +Add these topics to the repository (Settings โ†’ General โ†’ Topics): + +- ai-models +- llm +- large-language-model +- ai-catalog +- model-pricing +- ai-pricing +- openai +- anthropic +- gemini +- deepseek +- llama +- qwen +- mistral +- groq +- cerebras +- inference-api +- model-comparison +- ai-provider +- yaml +- machine-readable +- zod +- open-weights +- context-window +- tool-calling +- function-calling +- ai-agents +- reasoning-models +- vision-models +- free-ai-models +- ai-model-catalog +- structured-data +- npm-package +- huggingface +- github-action diff --git a/.github/stale.yml b/.github/stale.yml new file mode 100644 index 00000000..b020f753 --- /dev/null +++ b/.github/stale.yml @@ -0,0 +1,32 @@ +# Configuration for probot/stale - https://github.com/probot/stale + +# Number of days of inactivity before an issue becomes stale +daysUntilStale: 60 + +# Number of days of inactivity before a stale issue is closed +daysUntilClose: 7 + +# Issues with these labels will never be considered stale +exemptLabels: + - pinned + - security + - good first issue + - help wanted + +# Label to use when marking an issue as stale +staleLabel: wontfix + +# Comment to post when marking an issue as stale +markComment: > + This issue has been automatically marked as 
stale because it has not had + recent activity. It will be closed if no further activity occurs in 7 days. + Thank you for your contributions! + +# Comment to post when closing a stale issue +closeComment: > + This issue has been automatically closed due to inactivity. + If you believe this was closed in error, please reopen the issue + or leave a comment explaining why it should remain open. + +# Limit to only issues (not PRs) +only: issues diff --git a/.github/workflows/auto-merge.yml b/.github/workflows/auto-merge.yml new file mode 100644 index 00000000..ed468ab6 --- /dev/null +++ b/.github/workflows/auto-merge.yml @@ -0,0 +1,38 @@ +name: Auto-merge Dependabot + +on: + pull_request_target: + types: [opened, synchronize] + +permissions: + contents: write + pull-requests: write + +jobs: + auto-merge: + runs-on: ubuntu-latest + if: github.actor == 'dependabot[bot]' + steps: + - name: Dependabot metadata + id: metadata + uses: dependabot/fetch-metadata@v2 + with: + github-token: "${{ secrets.GITHUB_TOKEN }}" + + - name: Auto-approve minor and patch updates + if: > + steps.metadata.outputs.update-type == 'version-update:semver-patch' || + steps.metadata.outputs.update-type == 'version-update:semver-minor' + run: gh pr review --approve "$PR_URL" + env: + PR_URL: ${{ github.event.pull_request.html_url }} + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} + + - name: Auto-merge approved updates + if: > + steps.metadata.outputs.update-type == 'version-update:semver-patch' || + steps.metadata.outputs.update-type == 'version-update:semver-minor' + run: gh pr merge --auto --squash "$PR_URL" + env: + PR_URL: ${{ github.event.pull_request.html_url }} + GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} diff --git a/.github/workflows/demo.yml b/.github/workflows/demo.yml new file mode 100644 index 00000000..2f62c814 --- /dev/null +++ b/.github/workflows/demo.yml @@ -0,0 +1,50 @@ +name: AI Models Demo +on: + workflow_dispatch: + schedule: + - cron: "0 6 * * 1" # Every Monday 6:00 UTC + +jobs: + demo: 
+ runs-on: ubuntu-latest + steps: + - name: Get AI Model Data + id: models + uses: i-need-token/ai-models@v0.2.2 + with: + format: json + output-dir: model-data + + - name: Show Stats + run: | + echo "๐Ÿ“Š ${{ steps.models.outputs.model-count }} models from ${{ steps.models.outputs.provider-count }} providers" + echo "๐Ÿ“ Data saved to ${{ steps.models.outputs.file-path }}" + + - name: Find Cheapest Tool-Calling Model + run: | + python3 -c " + import json + with open('model-data/models.json') as f: + data = json.load(f) + models = data['models'] + AGG = {'openrouter','requesty','auriko','llmgateway','cortecs','aihubmix','orcarouter','fastrouter','302ai','martian','nanogpt','jiekou','venice','meganova'} + tc = [m for m in models if m.get('tool_call') and m.get('provider') not in AGG and m.get('pricing',{}).get('unit') != 'free' and m.get('pricing',{}).get('input',999) > 0] + tc.sort(key=lambda m: (m['pricing']['input'], m['pricing']['output'])) + print('๐Ÿ’ฐ Cheapest tool-calling models:') + for m in tc[:5]: + print(f' {m[\"id\"]}: \${m[\"pricing\"][\"input\"]}/\${m[\"pricing\"][\"output\"]}/M tokens') + " + + - name: Find Free Reasoning Models + run: | + python3 -c " + import json + with open('model-data/models.json') as f: + data = json.load(f) + models = data['models'] + free_reason = [m for m in models if m.get('reasoning') and m.get('pricing',{}).get('unit') == 'free'] + print('๐Ÿ†“ Free reasoning models:') + for m in free_reason[:5]: + ctx = m.get('limit',{}).get('context',0) + print(f' {m[\"id\"]}: {ctx//1000 if ctx >= 1000 else ctx}K context') + " diff --git a/.github/workflows/digest.yml b/.github/workflows/digest.yml new file mode 100644 index 00000000..d441e1f7 --- /dev/null +++ b/.github/workflows/digest.yml @@ -0,0 +1,99 @@ +name: Weekly Digest + +on: + workflow_dispatch: + schedule: + - cron: "0 6 * * 1" # Monday 6:00 UTC + +permissions: + contents: read + discussions: write + +jobs: + digest: + runs-on: ubuntu-latest + steps: + - uses: 
actions/checkout@v6 + + - uses: actions/setup-node@v4 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Compute stats + run: npx tsx scripts/stats.ts json > stats.json + + - name: Generate digest + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + STATS=$(cat stats.json) + + # Extract key numbers + TOTAL=$(echo "$STATS" | jq '.model_files') + PROVIDERS=$(echo "$STATS" | jq '.providers') + FREE=$(echo "$STATS" | jq '.free') + TOOL_CALL=$(echo "$STATS" | jq '.tool_call') + REASONING=$(echo "$STATS" | jq '.reasoning') + VISION=$(echo "$STATS" | jq '.vision') + OPEN_WEIGHTS=$(echo "$STATS" | jq '.open_weights') + DEPRECATED=$(echo "$STATS" | jq '.deprecated') + FAMILIES=$(echo "$STATS" | jq '.families') + + # Get date range + WEEK_START=$(date -d "last monday" +%Y-%m-%d 2>/dev/null || date -v-7d +%Y-%m-%d) + TODAY=$(date +%Y-%m-%d) + + # Build the discussion body + cat > /tmp/digest.md << 'HEADER' + ## ๐Ÿ“Š Weekly AI Models Digest + HEADER + + echo "" >> /tmp/digest.md + echo "**Week of ${WEEK_START} โ€” ${TODAY}**" >> /tmp/digest.md + echo "" >> /tmp/digest.md + + echo "| Metric | Count |" >> /tmp/digest.md + echo "|--------|-------|" >> /tmp/digest.md + echo "| Total Models | ${TOTAL} |" >> /tmp/digest.md + echo "| Providers | ${PROVIDERS} |" >> /tmp/digest.md + echo "| Free Models | ${FREE} |" >> /tmp/digest.md + echo "| Tool Calling | ${TOOL_CALL} |" >> /tmp/digest.md + echo "| Reasoning | ${REASONING} |" >> /tmp/digest.md + echo "| Vision | ${VISION} |" >> /tmp/digest.md + echo "| Open Weights | ${OPEN_WEIGHTS} |" >> /tmp/digest.md + echo "| Families | ${FAMILIES} |" >> /tmp/digest.md + echo "| Deprecated | ${DEPRECATED} |" >> /tmp/digest.md + + echo "" >> /tmp/digest.md + echo "### ๐Ÿ”— Quick Links" >> /tmp/digest.md + echo "- [Interactive Catalog](https://i-need-token.github.io/ai-models/) โ€” search, filter, compare" >> /tmp/digest.md + echo "- [Download 
Data](https://github.com/i-need-token/ai-models/releases/latest) — JSON, CSV, schema" >> /tmp/digest.md + echo "- [Free Models Guide](https://github.com/i-need-token/ai-models/blob/main/docs/free-models.md)" >> /tmp/digest.md + echo "- [Pricing Comparison](https://github.com/i-need-token/ai-models/blob/main/docs/pricing-comparison.md)" >> /tmp/digest.md + echo "" >> /tmp/digest.md + echo "---" >> /tmp/digest.md + echo "*Auto-generated by the [Weekly Digest workflow](https://github.com/i-need-token/ai-models/actions/workflows/digest.yml).*" >> /tmp/digest.md + + # Create or update the discussion + # Discussion category: Announcements (id from repo) + TITLE="📊 Weekly Digest — ${TODAY}" + BODY=$(cat /tmp/digest.md) + + # Create the discussion; title/body are passed as GraphQL variables so newlines and quotes in the digest cannot break the query + REPO_ID=$(gh api repos/i-need-token/ai-models --jq '.node_id') + CATEGORY_ID=$(gh api graphql -f query='{ repository(owner:"i-need-token", name:"ai-models") { discussionCategories(first:10) { nodes { id name } } } }' --jq '.data.repository.discussionCategories.nodes[] | select(.name == "Announcements") | .id') + gh api graphql \ + -f repositoryId="$REPO_ID" \ + -f categoryId="$CATEGORY_ID" \ + -f title="$TITLE" \ + -f body="$BODY" \ + -f query=' + mutation($repositoryId: ID!, $categoryId: ID!, $title: String!, $body: String!) { + createDiscussion(input: { repositoryId: $repositoryId, categoryId: $categoryId, title: $title, body: $body }) { + discussion { url } + } + } + ' || echo "Note: Discussion creation requires proper category setup" diff --git a/.github/workflows/labeler.yml b/.github/workflows/labeler.yml new file mode 100644 index 00000000..b756dc12 --- /dev/null +++ b/.github/workflows/labeler.yml @@ -0,0 +1,17 @@ +name: PR Labeler + +on: + pull_request_target: + types: [opened] + +permissions: + contents: read + pull-requests: write + +jobs: + label: + runs-on: ubuntu-latest + steps: + - uses: actions/labeler@v5 + with: + repo-token: "${{ secrets.GITHUB_TOKEN }}" diff --git a/.github/workflows/pages.yml b/.github/workflows/pages.yml new file mode 100644 index 00000000..156b4401 --- /dev/null +++ b/.github/workflows/pages.yml @@ -0,0 +1,47 @@ +name: Deploy Pages + +on: + push: 
+ branches: [main] + paths: + - "site/**" + - "providers/**" + - "scripts/compile.ts" + - ".github/workflows/pages.yml" + workflow_dispatch: + +permissions: + contents: read + pages: write + id-token: write + +concurrency: + group: pages + cancel-in-progress: true + +jobs: + deploy: + runs-on: ubuntu-latest + environment: + name: github-pages + url: ${{ steps.deployment.outputs.page_url }} + steps: + - uses: actions/checkout@v6 + + - name: Setup Pages + uses: actions/configure-pages@v5 + + - name: Install dependencies + run: npm install + - name: Compile models.json + run: npx tsx scripts/compile.ts + - name: Copy data to site + run: cp dist/models.json site/models.json + - name: Upload artifact + uses: actions/upload-pages-artifact@v3 + with: + path: site + + - name: Deploy to GitHub Pages + id: deployment + uses: actions/deploy-pages@v4 diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml new file mode 100644 index 00000000..3bf9cc3f --- /dev/null +++ b/.github/workflows/publish.yml @@ -0,0 +1,27 @@ +name: Publish to npm + +on: + release: + types: [published] + +permissions: + contents: read + +jobs: + publish: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + registry-url: https://registry.npmjs.org/ + + - run: npm ci + + - run: npm run build + + - run: npm publish --access public + env: + NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }} diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml new file mode 100644 index 00000000..d597af4f --- /dev/null +++ b/.github/workflows/release.yml @@ -0,0 +1,67 @@ +name: Release + +on: + push: + tags: + - "v*" + workflow_dispatch: + +permissions: + contents: write + +jobs: + release: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Validate + run: npx tsx scripts/validate.ts + + - 
name: Compile models.json + run: npx tsx scripts/compile.ts + + - name: Export models.csv + run: npx tsx scripts/export-csv.ts + + - name: Compute stats + run: npx tsx scripts/stats.ts json > stats.json + + - name: Create release + uses: softprops/action-gh-release@v3 + with: + files: | + dist/models.json + models.csv + stats.json + body: | + ## AI Models Catalog Release + + **Compiled data files:** + + | File | Format | Size | Description | + | ---- | ------ | ---- | ----------- | + | `models.json` | JSON | ~2.3 MB | All 4,587 models with full metadata | + | `models.csv` | CSV | ~560 KB | Flat table โ€” open in Excel, Google Sheets, Python | + | `stats.json` | JSON | ~1 KB | Catalog statistics summary | + + **Usage:** + ```bash + # Download the compiled JSON + curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + + # Download the CSV (for Excel/Sheets) + curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv + + # Use in JavaScript + const catalog = require("./models.json"); + console.log(catalog.stats); + ``` + generate-release-notes: true diff --git a/.github/workflows/stats.yml b/.github/workflows/stats.yml new file mode 100644 index 00000000..d37890ea --- /dev/null +++ b/.github/workflows/stats.yml @@ -0,0 +1,60 @@ +name: Stats + +on: + workflow_dispatch: + schedule: + - cron: "0 0 * * 0" # weekly on Sunday + +permissions: + contents: write + +jobs: + stats: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Compute stats + run: npx tsx scripts/stats.ts json > stats.json + + - name: Export CSV + run: npx tsx scripts/export-csv.ts + + - name: Update dynamic badges + run: | + STATS=$(cat stats.json) + MODELS=$(echo "$STATS" | jq '.model_files') + PROVIDERS=$(echo "$STATS" | jq '.providers') + cat > .github/badges/models.json << EOF + 
{"schemaVersion":1,"label":"models","message":"$MODELS","color":"green"} + EOF + cat > .github/badges/providers.json << EOF + {"schemaVersion":1,"label":"providers","message":"$PROVIDERS","color":"blue"} + EOF + + - name: Format badges + run: npx oxfmt --write .github/badges/*.json + + - name: Commit badges + run: | + git config user.name "github-actions[bot]" + git config user.email "github-actions[bot]@users.noreply.github.com" + git add .github/badges/*.json + git diff --cached --quiet || git commit -m "chore: update dynamic badges [skip ci]" + git push + + - name: Upload artifacts + uses: actions/upload-artifact@v7 + with: + name: catalog-data + path: | + stats.json + models.csv + retention-days: 30 diff --git a/.github/workflows/sync-hf.yml b/.github/workflows/sync-hf.yml new file mode 100644 index 00000000..c974da28 --- /dev/null +++ b/.github/workflows/sync-hf.yml @@ -0,0 +1,62 @@ +name: Sync to Hugging Face + +on: + release: + types: [published] + workflow_dispatch: + +jobs: + sync: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Compile JSON + run: npx tsx scripts/compile.ts + + - name: Export CSV + run: npx tsx scripts/export-csv.ts + + - name: Push to Hugging Face + env: + HF_TOKEN: ${{ secrets.HF_TOKEN }} + run: | + if [ -z "$HF_TOKEN" ]; then + echo "HF_TOKEN not set — skipping Hugging Face sync" + exit 0 + fi + + pip install huggingface-hub + + python3 -c " + from huggingface_hub import HfApi + import os + + api = HfApi(token=os.environ['HF_TOKEN']) + repo_id = os.environ.get('HF_REPO_ID', 'i-need-token/ai-models') + + api.upload_file( + path_or_fileobj='dist/models.json', + path_in_repo='models.json', + repo_id=repo_id, + repo_type='dataset', + commit_message='Sync models.json from GitHub release', + ) + + api.upload_file( + path_or_fileobj='models.csv', + path_in_repo='models.csv', + repo_id=repo_id, + repo_type='dataset', + commit_message='Sync models.csv 
from GitHub release', + ) + + print(f'Synced to https://huggingface.co/datasets/{repo_id}') + " diff --git a/.github/workflows/sync.yml b/.github/workflows/sync.yml new file mode 100644 index 00000000..5977a609 --- /dev/null +++ b/.github/workflows/sync.yml @@ -0,0 +1,64 @@ +name: Weekly Sync + +on: + schedule: + - cron: "0 2 * * 1" # Every Monday at 02:00 UTC + workflow_dispatch: + +permissions: + contents: write + pull-requests: write + +jobs: + sync: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: "22" + + - name: Install dependencies + run: npm ci + + - name: Run scrape + run: npx tsx scripts/scrape-all.ts + continue-on-error: true + + - name: Check for changes + id: changes + run: | + # git status also reports untracked files (newly added model YAMLs); git diff alone does not. + if [ -z "$(git status --porcelain providers/)" ]; then + echo "changed=false" >> "$GITHUB_OUTPUT" + else + echo "changed=true" >> "$GITHUB_OUTPUT" + # Publish the stat as a multiline step output: the pull request body + # reads the diff_stat output of this step, which was previously never set. + { + echo "diff_stat<<DIFF_STAT_EOF" + git diff --stat providers/ + echo "DIFF_STAT_EOF" + } >> "$GITHUB_OUTPUT" + fi + + - name: Create pull request + if: steps.changes.outputs.changed == 'true' + uses: peter-evans/create-pull-request@v8 + with: + title: "🔄 Weekly model data sync" + body: | + Automated data sync from provider APIs. + + ## Changes + + ```diff + ${{ steps.changes.outputs.diff_stat }} + ``` + + Generated by the [Weekly Sync](/.github/workflows/sync.yml) workflow. 
+ branch: sync/weekly + commit-message: "chore: weekly model data sync" + labels: data-update, automated + delete-branch: true diff --git a/.github/workflows/validate.yml b/.github/workflows/validate.yml new file mode 100644 index 00000000..16e649bb --- /dev/null +++ b/.github/workflows/validate.yml @@ -0,0 +1,73 @@ +name: Validate + +on: + push: + branches: [main] + paths: + - "providers/**/*.yaml" + - "providers/**/*.yml" + - "types/**" + - "scripts/**" + pull_request: + branches: [main] + paths: + - "providers/**/*.yaml" + - "providers/**/*.yml" + - "types/**" + - "scripts/**" + +jobs: + validate: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Validate YAML data + run: npx tsx scripts/validate.ts + + - name: Type check + run: npx tsc --noEmit + + - name: Lint + run: npm run lint + + format: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - uses: actions/setup-node@v6 + with: + node-version: 22 + + - name: Install dependencies + run: npm ci + + - name: Check formatting + run: npm run fmt:check + + stats: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v6 + + - name: Count providers + id: count + run: | + providers=$(ls providers/ | wc -l | tr -d ' ') + models=$(find providers -name "*.yaml" -o -name "*.yml" | wc -l | tr -d ' ') + echo "providers=$providers" >> "$GITHUB_OUTPUT" + echo "models=$models" >> "$GITHUB_OUTPUT" + + - name: Report stats + run: | + echo "๐Ÿ“Š Catalog Stats" + echo "Providers: ${{ steps.count.outputs.providers }}" + echo "Model files: ${{ steps.count.outputs.models }}" diff --git a/.github/workflows/welcome.yml b/.github/workflows/welcome.yml new file mode 100644 index 00000000..78a63728 --- /dev/null +++ b/.github/workflows/welcome.yml @@ -0,0 +1,57 @@ +name: Welcome New Contributor + +on: + issues: + types: [opened] + pull_request_target: + types: [opened] + +permissions: 
+ issues: write + pull-requests: write + +jobs: + welcome: + runs-on: ubuntu-latest + steps: + - name: Welcome first-time contributors + uses: actions/github-script@v7 + with: + script: | + const isIssue = context.eventName === 'issues'; + const author = isIssue + ? context.payload.issue.user.login + : context.payload.pull_request.user.login; + + // Check if this is a first-time contributor + const { data: issues } = await github.rest.search.issuesAndPullRequests({ + q: `author:${author} repo:${context.repo.owner}/${context.repo.repo} is:issue`, + per_page: 1, + }); + const { data: prs } = await github.rest.search.issuesAndPullRequests({ + q: `author:${author} repo:${context.repo.owner}/${context.repo.repo} is:pr`, + per_page: 1, + }); + + const totalContributions = issues.total_count + prs.total_count; + if (totalContributions > 1) return; + + const message = isIssue + ? `๐Ÿ‘‹ Welcome @${author}! Thanks for opening your first issue. We'll take a look soon.\n\n๐Ÿ’ก Tip: Check out our [contributing guide](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) for ways to get involved.` + : `๐Ÿ‘‹ Welcome @${author}! Thanks for your first pull request! We appreciate your contribution.\n\n๐Ÿ” A maintainer will review your PR shortly. 
In the meantime, make sure the CI checks pass.`; + + // A pull request's conversation thread is served by the Issues API, + // so issues and PRs share one call. pulls.createReviewComment is for + // inline diff comments and needs a commit, path and position, so the + // previous call, which passed only a body, could not post the + // welcome message on pull requests. + const number = isIssue + ? context.payload.issue.number + : context.payload.pull_request.number; + + await github.rest.issues.createComment({ + owner: context.repo.owner, + repo: context.repo.repo, + issue_number: number, + body: message, + }); diff --git a/.gitignore b/.gitignore index 0b655613..c8346f5b 100644 --- a/.gitignore +++ b/.gitignore @@ -3,3 +3,9 @@ dist/ .claude/ .pi/ *.local +*.tsbuildinfo +dist/ +models.csv +stats.json +social-preview.png +site/models.json diff --git a/.npmignore b/.npmignore new file mode 100644 index 00000000..14ab81cf --- /dev/null +++ b/.npmignore @@ -0,0 +1,36 @@ +# Source files (not needed in npm package) +scripts/ +.github/ +site/ +docs/ +*.ts +!types/**/*.ts + +# Config files +tsconfig.json +tsconfig.build.json +.husky/ +.claude/ +.pi/ + +# Generated / temp files +*.tsbuildinfo +models.csv +stats.json +social-preview.svg + +# Dev dependencies +node_modules/ + +# Misc +.gitignore +AGENTS.md +CHANGELOG.md +CODE_OF_CONDUCT.md +CONTRIBUTING.md +SECURITY.md +CITATION.cff +schema.json +llms.txt +llms-full.txt +action.yml \ No newline at end of file diff --git a/AGENTS.md b/AGENTS.md index 11c1c000..6d222558 100644 --- a/AGENTS.md +++ b/AGENTS.md @@ -10,6 +10,63 @@ A structured catalog of AI model providers and their models, stored as YAML file - [`types/schemas.ts`](types/schemas.ts) — Zod runtime validation schemas - [`docs/data-acquisition.md`](docs/data-acquisition.md) — How we acquire and update model data ([中文](docs/zh/data-acquisition.md)) - [`docs/lessons-learned.md`](docs/lessons-learned.md) — Design principles and pitfalls ([中文](docs/zh/lessons-learned.md)) +- [`docs/context-windows.md`](docs/context-windows.md) — Context window comparison by size and pricing ([中文](docs/zh/context-windows.md)) +- 
[`docs/large-context-models.md`](docs/large-context-models.md) โ€” 2,195 models with 128K+ context, 397 with 1M+ ([ไธญๆ–‡](docs/zh/large-context-models.md)) +- [`docs/small-models.md`](docs/small-models.md) โ€” 1,153 small/edge models under 10B params ([ไธญๆ–‡](docs/zh/small-models.md)) +- [`docs/provider-comparison.md`](docs/provider-comparison.md) โ€” Top 30 providers by model count and capabilities ([ไธญๆ–‡](docs/zh/provider-comparison.md)) +- [`docs/free-models.md`](docs/free-models.md) โ€” 81 free AI models by capability ([ไธญๆ–‡](docs/zh/free-models.md)) +- [`docs/open-weights.md`](docs/open-weights.md) โ€” 513 open-weight models ([ไธญๆ–‡](docs/zh/open-weights.md)) +- [`docs/reasoning-models.md`](docs/reasoning-models.md) โ€” 1,306 reasoning models ([ไธญๆ–‡](docs/zh/reasoning-models.md)) +- [`docs/tool-calling.md`](docs/tool-calling.md) โ€” 2,350 tool-calling models ([ไธญๆ–‡](docs/zh/tool-calling.md)) +- [`docs/vision-models.md`](docs/vision-models.md) โ€” 1,487 vision models ([ไธญๆ–‡](docs/zh/vision-models.md)) +- [`docs/video-models.md`](docs/video-models.md) โ€” 167 video models ([ไธญๆ–‡](docs/zh/video-models.md)) +- [`docs/image-generation.md`](docs/image-generation.md) โ€” 28 image generation models ([ไธญๆ–‡](docs/zh/image-generation.md)) +- [`docs/audio-models.md`](docs/audio-models.md) โ€” 118 audio input + 34 audio output models ([ไธญๆ–‡](docs/zh/audio-models.md)) +- [`docs/code-models.md`](docs/code-models.md) โ€” 189 code-focused models across 41 providers ([ไธญๆ–‡](docs/zh/code-models.md)) +- [`docs/agentic-models.md`](docs/agentic-models.md) โ€” Models with tool calling + reasoning for AI agents ([ไธญๆ–‡](docs/zh/agentic-models.md)) +- [`docs/openai-alternatives.md`](docs/openai-alternatives.md) โ€” GPT-4/GPT-3.5 alternatives with pricing, free options, OpenAI-compatible providers ([ไธญๆ–‡](docs/zh/openai-alternatives.md)) +- [`docs/chat-models.md`](docs/chat-models.md) โ€” 2,350 models with tool calling for chat applications 
([ไธญๆ–‡](docs/zh/chat-models.md)) +- [`docs/multimodal-models.md`](docs/multimodal-models.md) โ€” 1,519 models with image/audio/video input ([ไธญๆ–‡](docs/zh/multimodal-models.md)) +- [`docs/embedding-models.md`](docs/embedding-models.md) โ€” 5 embedding models for search, RAG, similarity ([ไธญๆ–‡](docs/zh/embedding-models.md)) +- [`docs/structured-output.md`](docs/structured-output.md) โ€” 829 structured output models ([ไธญๆ–‡](docs/zh/structured-output.md)) +- [`docs/modality-matrix.md`](docs/modality-matrix.md) โ€” Model capabilities matrix ([ไธญๆ–‡](docs/zh/modality-matrix.md)) +- [`docs/providers.md`](docs/providers.md) โ€” Provider overview by type and market ([ไธญๆ–‡](docs/zh/providers.md)) +- [`docs/model-comparison.md`](docs/model-comparison.md) โ€” Model comparison tables ([ไธญๆ–‡](docs/zh/model-comparison.md)) +- [`docs/pricing-comparison.md`](docs/pricing-comparison.md) โ€” Pricing comparison across providers ([ไธญๆ–‡](docs/zh/pricing-comparison.md)) +- [`docs/cached-pricing.md`](docs/cached-pricing.md) โ€” Models with prompt caching, 50-90% input cost savings ([ไธญๆ–‡](docs/zh/cached-pricing.md)) +- [`docs/data-schema.md`](docs/data-schema.md) โ€” Data schema reference ([ไธญๆ–‡](docs/zh/data-schema.md)) +- [`docs/quick-start.md`](docs/quick-start.md) โ€” Quick start guide ([ไธญๆ–‡](docs/zh/quick-start.md)) +- [`docs/model-selection.md`](docs/model-selection.md) โ€” Model selection guide: free, best value, large context ([ไธญๆ–‡](docs/zh/model-selection.md)) +- [`docs/model-selection-cheatsheet.md`](docs/model-selection-cheatsheet.md) โ€” Model selection cheatsheet: best model by budget and use case ([ไธญๆ–‡](docs/zh/model-selection-cheatsheet.md)) +- [`docs/small-language-models.md`](docs/small-language-models.md) โ€” Small language models guide: 2,002 SLMs for edge and mobile ([ไธญๆ–‡](docs/zh/small-language-models.md)) +- [`docs/benchmarks.md`](docs/benchmarks.md) โ€” AI Model Benchmarks & Leaderboards: key benchmarks, leaderboard landscape, 
interpretation guide ([ไธญๆ–‡](docs/zh/benchmarks.md)) +- [`docs/migration-guide.md`](docs/migration-guide.md) โ€” Switch providers: pricing, API compatibility, checklist ([ไธญๆ–‡](docs/zh/migration-guide.md)) +- [`docs/api.md`](docs/api.md) โ€” API & programmatic access ([ไธญๆ–‡](docs/zh/api.md)) +- [`docs/code-examples.md`](docs/code-examples.md) โ€” code examples in multiple languages ([ไธญๆ–‡](docs/zh/code-examples.md)) +- [`docs/faq.md`](docs/faq.md) โ€” frequently asked questions ([ไธญๆ–‡](docs/zh/faq.md)) +- [`docs/glossary.md`](docs/glossary.md) โ€” key terms and definitions ([ไธญๆ–‡](docs/zh/glossary.md)) + +## SEO Comparison Pages + +Curated standalone pages targeting high-volume search queries. All cross-linked with JSON-LD Article schema and OpenGraph/Twitter meta tags. + +- [`site/best-ai-models.html`](site/best-ai-models.html) โ€” Best AI Models in 2025 (curated picks, quick compare) +- [`site/free-ai-models.html`](site/free-ai-models.html) โ€” Free AI Models (81 models, zero cost) +- [`site/llm-pricing.html`](site/llm-pricing.html) โ€” LLM Pricing Comparison (95 providers, cheapest per tier) +- [`site/openai-alternatives.html`](site/openai-alternatives.html) โ€” OpenAI Alternatives (95 providers, flagship comparison) +- [`site/ai-models-by-provider.html`](site/ai-models-by-provider.html) โ€” AI Models by Provider (95 providers, 20 detailed sections) +- [`site/context-window-comparison.html`](site/context-window-comparison.html) โ€” Context Window Comparison (7 context tiers, cheapest per tier) +- [`site/best-ai-models-for-coding.html`](site/best-ai-models-for-coding.html) โ€” Best AI Models for Coding (flagship, value, free, open-weight, large context, agentic) +- [`site/best-ai-models-for-agents.html`](site/best-ai-models-for-agents.html) โ€” Best AI Models for Agents (full-stack agentic, TC+reasoning, cheapest TC, free TC) +- [`site/reasoning-models-comparison.html`](site/reasoning-models-comparison.html) โ€” Reasoning Models Comparison (flagship 
head-to-head, cheapest, free, open weights, reasoning+TC) +- [`site/cheapest-ai-models.html`](site/cheapest-ai-models.html) โ€” Cheapest AI Models (cheapest overall, TC, reasoning, vision, 128K+, per provider) +- [`site/tool-calling-models-comparison.html`](site/tool-calling-models-comparison.html) โ€” Tool Calling Models Comparison (flagship, cheapest, free, open weights, TC+reasoning, TC+vision, TC+large context) +- [`site/ai-model-pricing-calculator.html`](site/ai-model-pricing-calculator.html) โ€” AI Model Pricing Calculator (interactive cost calculator, quick comparison, cheapest tables) +- [`site/best-ai-models-for-image-generation.html`](site/best-ai-models-for-image-generation.html) โ€” Best AI Models for Image Generation (DALLยทE, Imagen, GPT-5 Image, Midjourney, cheapest, free, open-weight) +- [`site/best-ai-models-for-vision.html`](site/best-ai-models-for-vision.html) โ€” Best AI Models for Vision (GPT-4o, Claude, Gemini, 1,487 vision models, cheapest, free, vision+tool_call, vision+large context) +- [`site/structured-output-models-comparison.html`](site/structured-output-models-comparison.html) โ€” Structured Output Models Comparison (829 structured output models, JSON mode, SO+tool_call, SO+reasoning, cheapest, free) +- [`site/open-source-ai-models.html`](site/open-source-ai-models.html) โ€” Open Source AI Models (527 open-weight models, free, tool calling, reasoning, vision, large context) +- [`site/multimodal-ai-models.html`](site/multimodal-ai-models.html) โ€” Multimodal AI Models (1,548 vision/audio/image models, modality breakdown, flagship, free) ## Key Design Decisions diff --git a/CHANGELOG.md b/CHANGELOG.md new file mode 100644 index 00000000..2612d240 --- /dev/null +++ b/CHANGELOG.md @@ -0,0 +1,85 @@ +# Changelog + +All notable changes to the AI Models Catalog. 
+ +## v0.1.0 (2026-05) + +### Core Data + +- **95 providers** with structured YAML model data +- **4,587 model files** covering 2,712 unique model IDs across 441 families +- TypeScript type definitions (`types/model.ts`, `types/pricing.ts`, `types/provider.ts`) +- Zod runtime validation schemas (`types/schemas.ts`) +- JSON Schema for YAML validation (`schema.json`) +- Automated scrape scripts for each provider (`providers//scrape.ts`) +- CLI tools: `scripts/sync.ts`, `scripts/validate.ts`, `scripts/stats.ts`, `scripts/compile.ts`, `scripts/export-csv.ts` + +### Programmatic Access + +- npm package (`ai-models`) with TypeScript types and JSON data +- jsDelivr CDN access (`cdn.jsdelivr.net/npm/ai-models@latest/models.json`) +- CSV export (`models.csv`) available from GitHub Releases +- Reusable GitHub Action (`action.yml`) for CI/CD pipelines +- Hugging Face dataset sync (`huggingface.co/datasets/i-need-token/ai-models`) +- Interactive model catalog on GitHub Pages (`i-need-token.github.io/ai-models/`) + +### Documentation (22 EN + 22 ZH = 44 pages) + +- [Quick Start](docs/quick-start.md) โ€” find the right model in 30 seconds +- [API & Programmatic Access](docs/api.md) โ€” npm, CDN, CSV, GitHub Action, Hugging Face +- [FAQ](docs/faq.md) โ€” common questions about the catalog, data, and contributing +- [Glossary](docs/glossary.md) โ€” key terms and definitions for AI model terminology +- [Code Examples](docs/code-examples.md) โ€” TypeScript, Python, Go, Rust, jq, Excel +- [Model Comparison](docs/model-comparison.md) โ€” flagship, cost-effective, free, open-weight +- [Pricing Comparison](docs/pricing-comparison.md) โ€” side-by-side pricing across providers +- [Context Window Comparison](docs/context-windows.md) โ€” largest context windows by tier +- [Modality Matrix](docs/modality-matrix.md) โ€” which models support what modalities +- [Tool Calling Models](docs/tool-calling.md) โ€” 2,350 tool-calling models +- [Reasoning Models](docs/reasoning-models.md) โ€” 1,306 
reasoning models +- [Structured Output](docs/structured-output.md) โ€” 829 JSON-mode models +- [Vision Models](docs/vision-models.md) โ€” 1,487 vision models +- [Video Models](docs/video-models.md) โ€” 167 video input models +- [Audio Models](docs/audio-models.md) โ€” 118 audio input + 34 audio output models +- [Image Generation](docs/image-generation.md) โ€” 28 image generation models +- [Free AI Models](docs/free-models.md) โ€” 81 free models +- [Open-Weight Models](docs/open-weights.md) โ€” 527 open-weight models +- [Provider Overview](docs/providers.md) โ€” all 95 providers by type and market +- [Data Schema Reference](docs/data-schema.md) โ€” complete YAML schema +- [Data Acquisition](docs/data-acquisition.md) โ€” how we acquire and update model data +- [Design Principles](docs/lessons-learned.md) โ€” lessons learned from building the catalog +- All docs available in Chinese (`docs/zh/`) with cross-language links + +### Community & Infrastructure + +- CONTRIBUTING.md with Good First Issues table +- CODE_OF_CONDUCT.md, SECURITY.md, CHANGELOG.md +- CITATION.cff for academic discoverability (18 keywords) +- 6 GitHub issue templates + PR template + config.yml +- 10 CI workflows (validate, stats, release, publish, sync, sync-hf, pages, labeler, auto-merge, welcome) +- PR auto-labeler, Dependabot auto-merge, Renovate config +- Welcome workflow for first-time contributors +- CODEOWNERS, .editorconfig, .npmignore, Makefile +- llms.txt + llms-full.txt for AI discoverability +- Social preview SVG, robots.txt, sitemap.xml for SEO + +### Provider Coverage + +- **Model producers**: OpenAI, Anthropic, Google, Meta, DeepSeek, Alibaba Cloud, Mistral, xAI, Cohere, NVIDIA, IBM, Microsoft, and 18 more +- **Inference platforms**: OpenRouter, Together AI, Fireworks AI, Groq, Cerebras, DeepInfra, and 40+ more +- **Cloud provider hosted**: Amazon Bedrock, Azure OpenAI, Google Vertex AI +- **Chinese market**: 20 providers with CNY pricing +- **European market**: 7 providers with EUR 
pricing + +### Data Highlights + +- 1,306 reasoning models +- 2,350 tool-calling models +- 829 structured output models +- 527 open-weight models +- 81 free models +- 1,487 vision (image input) models +- 28 image output models +- 118 audio input models +- 34 audio output models +- 167 video input models +- Context windows up to 10M tokens (Llama 4 Scout) diff --git a/CITATION.cff b/CITATION.cff new file mode 100644 index 00000000..2ddb6e4d --- /dev/null +++ b/CITATION.cff @@ -0,0 +1,49 @@ +cff-version: 1.2.0 +message: "If you use this catalog in your research, please cite it as below." +title: "AI Models Catalog" +type: dataset +authors: + - given-names: "i-need-token" +repository-code: "https://github.com/i-need-token/ai-models" +url: "https://github.com/i-need-token/ai-models" +abstract: > + A structured YAML catalog of 4,587 AI models across 95 providers, + including pricing, context windows, modalities, and capabilities. + All data sourced from first-party APIs and official documentation. 
+keywords: + - ai-models + - llm + - pricing + - model-catalog + - yaml + - structured-data + - open-data + - tool-calling + - reasoning-models + - vision-models + - open-weights + - context-window + - structured-output + - image-generation + - free-models + - github-action + - cdn + - huggingface + - model-selection + - prompt-caching + - cached-pricing + - audio-models + - video-models + - code-models + - agentic-models + - modality-matrix + - chat-models + - multimodal-models + - embedding-models + - migration-guide + - provider-comparison + - large-context-models + - small-models +license: MIT +version: 0.2.2 +date-released: "2026-05-21" diff --git a/CODE_OF_CONDUCT.md b/CODE_OF_CONDUCT.md new file mode 100644 index 00000000..2be142d8 --- /dev/null +++ b/CODE_OF_CONDUCT.md @@ -0,0 +1,77 @@ +# Contributor Covenant Code of Conduct + +## Our Pledge + +We as members, contributors, and leaders pledge to make participation in our community a harassment-free experience for everyone, regardless of age, body size, visible or invisible disability, ethnicity, sex characteristics, gender identity and expression, level of experience, education or socio-economic status, nationality, personal appearance, race, caste, color, religion, or sexual identity and orientation. + +We pledge to act and interact in ways that contribute to an open, welcoming, diverse, inclusive, and healthy community. 
+ +## Our Standards + +Examples of behavior that contributes to a positive environment for our community include: + +- Demonstrating empathy and kindness toward other people +- Being respectful of differing opinions, viewpoints, and experiences +- Giving and gracefully accepting constructive feedback +- Accepting responsibility and apologizing to those affected by our mistakes, and learning from the experience +- Focusing on what is best not just for us as individuals, but for the overall community + +Examples of unacceptable behavior include: + +- The use of sexualized language or imagery, and sexual attention or advances of any kind +- Trolling, insulting or derogatory comments, and personal or political attacks +- Public or private harassment +- Publishing others' private information, such as a physical or email address, without their explicit permission +- Other conduct which could reasonably be considered inappropriate in a professional setting + +## Enforcement Responsibilities + +Community leaders are responsible for clarifying and enforcing our standards of acceptable behavior and will take appropriate and fair corrective action in response to any behavior that they deem inappropriate, threatening, offensive, or harmful. + +Community leaders have the right and responsibility to remove, edit, or reject comments, commits, code, wiki edits, issues, and other contributions that are not aligned to this Code of Conduct, and will communicate reasons for moderation decisions when appropriate. + +## Scope + +This Code of Conduct applies within all community spaces, and also applies when an individual is officially representing the community in public spaces. Examples of representing our community include using an official e-mail address, posting via an official social media account, or acting as an appointed representative at an online or offline event. 
+ +## Enforcement + +Instances of abusive, harassing, or otherwise unacceptable behavior may be reported to the community leaders responsible for enforcement through [GitHub Issues](https://github.com/i-need-token/ai-models/issues) or directly via email. All complaints will be reviewed and investigated promptly and fairly. + +All community leaders are obligated to respect the privacy and security of the reporter of any incident. + +## Enforcement Guidelines + +Community leaders will follow these Community Impact Guidelines in determining the consequences for any action they deem in violation of this Code of Conduct: + +### 1. Correction + +**Community Impact**: Use of inappropriate language or other behavior deemed unprofessional or unwelcome in the community. + +**Consequence**: A private, written warning from community leaders, providing clarity around the nature of the violation and an explanation of why the behavior was inappropriate. A public apology may be requested. + +### 2. Warning + +**Community Impact**: A violation through a single incident or series of actions. + +**Consequence**: A warning with consequences for continued behavior. No interaction with the people involved, including unsolicited interaction with those enforcing the Code of Conduct, for a specified period of time. This includes avoiding interactions in community spaces as well as external channels like social media. Violating these terms may lead to a temporary or permanent ban. + +### 3. Temporary Ban + +**Community Impact**: A serious violation of community standards, including sustained inappropriate behavior. + +**Consequence**: A temporary ban from any sort of interaction or public communication with the community for a specified period of time. No public or private interaction with the people involved, including unsolicited interaction with those enforcing the Code of Conduct, is allowed during this period. Violating these terms may lead to a permanent ban. + +### 4. 
Permanent Ban + +**Community Impact**: Demonstrating a pattern of violation of community standards, including sustained inappropriate behavior, harassment of an individual, or aggression toward or disparagement of classes of individuals. + +**Consequence**: A permanent ban from any sort of public interaction within the community. + +## Attribution + +This Code of Conduct is adapted from the [Contributor Covenant](https://www.contributor-covenant.org/), version 2.1, available at [https://www.contributor-covenant.org/version/2/1/code_of_conduct.html](https://www.contributor-covenant.org/version/2/1/code_of_conduct.html). + +Community Impact Guidelines were inspired by [Mozilla's code of conduct enforcement ladder](https://github.com/divmain/pull-mozilla-coc). + +For answers to common questions about this code of conduct, see the FAQ at [https://www.contributor-covenant.org/faq](https://www.contributor-covenant.org/faq). Translations are available at [https://www.contributor-covenant.org/translations](https://www.contributor-covenant.org/translations). diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md new file mode 100644 index 00000000..9f10e1b7 --- /dev/null +++ b/CONTRIBUTING.md @@ -0,0 +1,163 @@ +# Contributing to AI Models Catalog + +Thank you for your interest in contributing! This guide covers everything you need to add a new provider, fix data, or improve the catalog. + +## Quick Start + +> ๐Ÿ’ก **Try the [Interactive Catalog](https://i-need-token.github.io/ai-models/)** โ€” search, sort, and filter all 4,587 models in your browser. + +1. Fork the repository +2. Create your feature branch: `git checkout -b feature/my-provider` +3. Make your changes +4. Validate: `npx tsx scripts/validate.ts` +5. Submit a pull request + +## Adding a New Provider + +### 1. Create the Provider Directory + +``` +providers// +โ”œโ”€โ”€ provider.yaml # Provider metadata +โ”œโ”€โ”€ scrape.ts # Data acquisition script +โ””โ”€โ”€ models/ # Generated YAML model files +``` + +### 2. 
Create `provider.yaml` + +```yaml +id: my-provider +name: My Provider +url: https://my-provider.com +api_docs: https://my-provider.com/docs +apis: + openai: https://api.my-provider.com/v1 +``` + +### 3. Create `scrape.ts` + +Your scrape function must: + +- **Return structured data** โ€” never write files directly +- **Use first-party sources only** โ€” the provider's own API or website +- **Include a discovery step** โ€” fetch the model list dynamically, never hardcode model IDs +- **Skip models with missing data** โ€” don't fabricate values + +```typescript +import type { Model, Provider } from "../types"; +import { defineProvider } from "../scripts/lib/define-provider"; +import { defineModel } from "../scripts/lib/define-model"; + +const provider = defineProvider({ + id: "my-provider", + name: "My Provider", + url: "https://my-provider.com", + api_docs: "https://my-provider.com/docs", + apis: { openai: "https://api.my-provider.com/v1" }, +}); + +export async function scrape(): Promise<{ provider: Provider; models: Model[] }> { + // Discover models from the provider's API + const resp = await fetch("https://api.my-provider.com/v1/models"); + const data = await resp.json(); + + const models = data.data + .filter((m: any) => shouldInclude(m)) + .map((m: any) => + defineModel({ + id: m.id, + name: deriveName(m.id), + family: deriveFamily(m.id), + // ... other fields from the API + }), + ); + + return { provider, models }; +} +``` + +### 4. Run and Validate + +```bash +# Generate YAML files +npx tsx scripts/sync.ts my-provider + +# Validate all data +npx tsx scripts/validate.ts +``` + +## Provider Acceptance Criteria + +### Model Producers + +Providers that develop their own AI models. We welcome all model producers with public APIs or documentation. 
+ +### Inference Platforms + +Inference platforms must meet **all** of these criteria: + +- โœ… Per-token pricing (not per-second, per-credit, or other units) +- โœ… Pricing in USD, CNY, or EUR +- โœ… First-party data source (public API or website) + +**Not accepted:** + +| Category | Examples | Reason | +| ------------------- | ---------------------------------------- | ---------------------------------- | +| Auth-required API | Hyperbolic, Nebius | Can't scrape without credentials | +| Non-token pricing | Replicate (per-second), Databricks (DBU) | Incompatible pricing model | +| GPU cloud | SubModel, GMI Cloud | Rent GPUs, not per-token inference | +| Enterprise/research | Abacus AI, Liquid AI | No public pricing/API | +| Model hub | ModelScope, HuggingFace | Duplicate data from producers | + +## Data Quality Rules + +- **First-party data only** โ€” no copying from third-party aggregators +- **Never fabricate data** โ€” if a field is missing, omit it rather than guessing +- **Include deprecated models** โ€” mark with `deprecated: true` +- **Exclude retired models** โ€” models no longer accessible via API +- **Dynamic discovery** โ€” scrape functions must discover models from the source + +## Code Style + +```bash +# Format +npm run fmt + +# Lint +npm run lint + +# Type check +npm run typecheck + +# All checks +npm run check +``` + +## Good First Issues + +New contributors welcome! 
These tasks are beginner-friendly and don't require deep knowledge of the codebase: + +| Task | How | Difficulty | +| -------------------------- | ------------------------------------------------------------------------------------------------------------------- | ---------- | +| Fix incorrect model data | Find the model YAML in `providers//models/`, correct it, run `npx tsx scripts/validate.ts` | Easy | +| Add a provider README | Create `providers//README.md` describing the data source and scraping strategy (see existing examples) | Easy | +| Update outdated pricing | Re-run `npx tsx providers//scrape.ts` and review the diff | Easy | +| Add missing model features | Add `tool_call`, `structured_output`, `reasoning`, etc. to model YAML files where the provider docs confirm support | Easy | +| Translate a doc to Chinese | Copy an English doc from `docs/` to `docs/zh/` and translate | Medium | + +Look for issues labeled [`good first issue`](https://github.com/i-need-token/ai-models/labels/good%20first%20issue) or [`help wanted`](https://github.com/i-need-token/ai-models/labels/help%20wanted). + +## Reporting Issues + +- **Incorrect model data** โ€” open an issue with the provider name, model ID, and what's wrong +- **Missing provider** โ€” open an issue with the provider name and a link to their API/docs +- **Bug in scrape script** โ€” open an issue with the error output and steps to reproduce + +## Questions? 
+ +Check the documentation first: + +- [Data Acquisition Guide](docs/data-acquisition.md) — detailed scraping guidelines +- [Design Principles & Pitfalls](docs/lessons-learned.md) — lessons learned from building the catalog +- [数据采集（中文）](docs/zh/data-acquisition.md) — 中文版数据采集指南 diff --git a/LICENSE b/LICENSE index aab0cadd..5eff32d0 100644 --- a/LICENSE +++ b/LICENSE @@ -1,6 +1,6 @@ MIT License -Copyright (c) 2025 ai-models contributors +Copyright (c) 2025-2026 ai-models contributors Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal diff --git a/Makefile b/Makefile new file mode 100644 index 00000000..9684e368 --- /dev/null +++ b/Makefile @@ -0,0 +1,38 @@ +# Every target below runs a command rather than building a file of that name, so all are phony. +.PHONY: install validate scrape build stats csv clean lint fmt fmt-check typecheck check + +install: + npm install + +validate: + npm run validate + +scrape: + npm run scrape-all + +build: + npm run build + +stats: + npm run stats + +csv: + npm run export-csv + +clean: + rm -rf dist/ *.tsbuildinfo models.csv stats.json + +lint: + npm run lint + +fmt: + npx oxfmt --write . + +fmt-check: + npx oxfmt --check . + +typecheck: + npx tsc --noEmit + +check: fmt-check lint typecheck validate + @echo "All checks passed!" diff --git a/README.md b/README.md index 63d122fa..6551bc95 100644 --- a/README.md +++ b/README.md @@ -1,41 +1,225 @@ -# AI Models Catalog +
-A structured, machine-readable catalog of AI model providers and their models. All data is sourced from first-party APIs and official documentation โ€” no third-party aggregators. +# ๐Ÿค– AI Models Catalog [![Awesome](https://awesome.re/badge-flat2.svg)](https://github.com/sindresorhus/awesome) -## Data Format +**The most comprehensive structured catalog of AI models on GitHub** -Model data is stored as YAML files under `providers//models/`. Each file represents one model with its snapshots: +95 providers ยท 4,587 model files ยท 2,712 unique model IDs ยท First-party data only + +[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE) +[![npm version](https://img.shields.io/npm/v/ai-models.svg)](https://www.npmjs.com/package/ai-models) +[![Hugging Face](https://img.shields.io/badge/%F0%9F%A4%97-Dataset-blue)](https://huggingface.co/datasets/i-need-token/ai-models) +[![Models](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/i-need-token/ai-models/main/.github/badges/models.json)](providers/) +[![Providers](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/i-need-token/ai-models/main/.github/badges/providers.json)](providers/) +[![CI](https://github.com/i-need-token/ai-models/actions/workflows/validate.yml/badge.svg)](https://github.com/i-need-token/ai-models/actions/workflows/validate.yml) [![GitHub stars](https://img.shields.io/github/stars/i-need-token/ai-models?style=social)](https://github.com/i-need-token/ai-models/stargazers) [![Last Updated](https://img.shields.io/github/last-commit/i-need-token/ai-models?label=updated)](https://github.com/i-need-token/ai-models/commits/main) [![Star History](https://api.star-history.com/svg?repos=i-need-token/ai-models&type=Date)](https://star-history.com/#i-need-token/ai-models&Date) + +
+ +> ⭐ **If this catalog helps you choose the right model, please star this repo — it helps others discover it!** + +--- + +Machine-readable YAML catalog of every major AI model provider and their models — pricing, context windows, modalities, capabilities, and more. All data sourced from first-party APIs and official documentation, never third-party aggregators. + +**[Quick start →](docs/quick-start.md)** · **[Choose a model →](docs/model-selection.md)** · **[Compare pricing →](docs/pricing-comparison.md)** · **[🔍 Search →](https://i-need-token.github.io/ai-models/)** · **[Download CSV →](https://github.com/i-need-token/ai-models/releases/latest/download/models.csv)** · **[JSON →](https://github.com/i-need-token/ai-models/releases/latest/download/models.json)** + +> 🆓 **81 free models** with tool calling, reasoning, and vision — [see the list →](docs/free-models.md) · 💰 **Cheapest models from $0.01/M tokens** — [compare pricing →](docs/pricing-comparison.md) · 🤖 **1,080 agentic models** for AI agents — [find yours →](docs/agentic-models.md) + +> 💡 **Try it now** — fetch model data in one command: +> +> ```bash +> curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | python3 -c 'import sys,json; d=json.load(sys.stdin); print(len(d["models"]), "models across", len(set(m["provider"] for m in d["models"])), "providers")' +> ``` + +## 💡 Quick Value Demo + +> **What's the cheapest model with tool calling?** → ling-2.6-flash at **$0.01/$0.03** per M tokens ([see all 2,350 →](docs/tool-calling.md)) +> **What's the best free reasoning model?** → DeepSeek R1 — **92% MATH-500** ([see all 81 free →](docs/free-models.md)) +> **Which model has the largest context window?** → Gemini 2.5 Pro — **1,048,576 tokens** ([see all context windows →](docs/context-windows.md)) + +## 🖥️ Interactive Catalog + +[![AI Models Catalog — Interactive model comparison 
tool](docs/images/catalog-screenshot.png)](https://i-need-token.github.io/ai-models/) + +
+🎬 Watch demo (filter, sort, dark mode, calculator) + +![Demo: filter by free models, sort by price, toggle dark mode, use price calculator](docs/images/catalog-demo.gif) + +
+ +**[Try it live →](https://i-need-token.github.io/ai-models/)** — Search, filter, compare 4,587+ models with 25+ features including dark/light theme, keyboard shortcuts, price calculator, and model picker wizard. + +
+📊 AI Models Landscape — providers, capabilities, pricing, context windows at a glance + +![AI Models Landscape 2025 — 4,587 models across 95 providers](docs/images/ai-models-landscape.png) + +
+ +## Why This Catalog? + +| | | +| --------------------------------------- | ------------------------------------------------------------------------- | +| 🔍 **Compare models at a glance** | Pricing, context windows, capabilities — all in one place, all structured | +| 📊 **4,587 models across 95 providers** | From OpenAI to Zhipu, from cloud APIs to open-weights | +| ✅ **First-party data only** | Every data point comes from the provider's own API or docs | +| 🤖 **Machine-readable YAML** | TypeScript types + Zod validation = programmatic access with confidence | +| 🔄 **Automated sync** | Scrape scripts pull fresh data from provider APIs | + +## Contents + +- [Quick Compare](#quick-compare) +- [🏆 Model Picks](#-model-picks) +- [Use Cases](#use-cases) +- [Quick Numbers](#quick-numbers) +- [Example Model](#data-at-a-glance) +- [Programmatic Usage](#use-programmatically) +- [GitHub Action](#use-as-github-action) +- [Documentation](#documentation) +- [Provider Showcase](#provider-showcase) +- [Contributing](#contributing) +- [Who's Using This](#whos-using-this) +- [License](#license) + +## Quick Compare + +> Popular models at a glance — full data for [4,587 models](docs/model-comparison.md) + +| Model | Provider | Context | Input $/M | Output $/M | Tools | Reason | Vision | +| ---------------- | --------- | ------- | --------- | ---------- | ----- | ------ | ------ | +| gpt-4.1 | openai | 1M | $2 | $8 | ✓ | | ✓ | +| gpt-4.1-mini | openai | 1M | $0.40 | $1.60 | ✓ | | ✓ | +| gpt-4.1-nano | openai | 1M | $0.10 | $0.40 | ✓ | | ✓ | +| o3 | openai | 200K | $10 | $40 | ✓ | ✓ | ✓ | +| o4-mini | openai | 200K | $1.10 | $4.40 | ✓ | ✓ | ✓ | +| claude-opus-4 | anthropic | 200K | $15 | $75 | ✓ | ✓ | ✓ | +| claude-sonnet-4 | anthropic | 200K | $3 | $15 | ✓ | ✓ | ✓ | +| claude-haiku-4 | anthropic | 200K | $1 | $5 | ✓ | ✓ | ✓ | +| gemini-2.5-pro | google | 1M | $1.25 | $10 | ✓ | ✓ | ✓ | +| gemini-2.5-flash | google | 1M | 
$0.15 | $0.60 | โœ“ | โœ“ | โœ“ | +| deepseek-r1 | deepseek | 128K | $0.55 | $2.19 | | โœ“ | | +| deepseek-chat | deepseek | 128K | $0.14 | $0.28 | โœ“ | | | +| llama-4-maverick | meta | 1M | $0.20 | $0.20 | โœ“ | | โœ“ | +| llama-4-scout | meta | 10M | $0.03 | $0.03 | โœ“ | | โœ“ | +| grok-3 | xai | 131K | $3 | $15 | โœ“ | | โœ“ | +| grok-3-mini | xai | 131K | $0.30 | $0.50 | โœ“ | โœ“ | โœ“ | +| mistral-large | mistral | 128K | $2 | $6 | โœ“ | | โœ“ | +| qwen3-235b-a22b | alibaba | 128K | $0.14 | $0.42 | โœ“ | โœ“ | โœ“ | +| qwen3-30b-a3b | alibaba | 128K | $0.03 | $0.05 | โœ“ | โœ“ | โœ“ | + +
📖 How to read this table + +- **Context**: Maximum context window (input + output tokens) +- **Input/Output $/M**: Price per million tokens +- **Tools**: Supports function/tool calling +- **Reason**: Uses chain-of-thought reasoning +- **Vision**: Accepts image input +- Prices shown are for standard (non-cached) API calls. Many providers offer 50-90% discounts for cached inputs. + +
+ +## ๐Ÿ† Model Picks + +> Curated recommendations for common use cases โ€” from [4,587 models](docs/model-comparison.md) across 95 providers + +| Use Case | Model | Why | Input $/M | Context | +| --------------------- | ---------------- | --------------------------------------- | --------- | ------- | +| **Coding** | gpt-4.1 | Best code generation + 1M context | $2 | 1M | +| **Coding (cheap)** | gpt-4.1-nano | 20x cheaper, great for autocomplete | $0.10 | 1M | +| **Reasoning** | o4-mini | Best cost-effective reasoning | $1.10 | 200K | +| **Reasoning (power)** | claude-opus-4 | Deepest reasoning for hard problems | $15 | 200K | +| **Agents** | claude-sonnet-4 | Best tool use + reasoning balance | $3 | 200K | +| **Agents (cheap)** | gemini-2.5-flash | Fastest agent loop under $1 | $0.15 | 1M | +| **Vision** | gemini-2.5-pro | Best multimodal understanding | $1.25 | 1M | +| **Free** | llama-4-scout | 10M context, open weights, free on Groq | $0 | 10M | +| **Open weights** | deepseek-r1 | Best open reasoning model | $0.55 | 128K | +| **Large context** | gemini-2.5-flash | 1M context at lowest price | $0.15 | 1M | + +## Use Cases + +| Use Case | How This Catalog Helps | +| ------------------------------ | -------------------------------------------------------------------------------------------------------------------------------------------------- | +| ๐Ÿ’ฐ **Find the cheapest model** | [Pricing comparison](docs/pricing-comparison.md) across 95 providers | +| ๐Ÿ”Ž **Pick the right model** | [Model comparison](docs/model-comparison.md) by capability, context, cost | +| ๐Ÿ” **Search & compare models** | [Interactive catalog](https://i-need-token.github.io/ai-models/) โ€” search, filter, compare, price calc, model picker, copy-as-code, share, j/k nav | +| ๐Ÿ”Œ **Build an API gateway** | Structured pricing + modality data for routing decisions | +| ๐Ÿ“Š **Track the AI landscape** | 2,712 models with release dates, deprecation status | +| ๐Ÿค– **Power an AI tool** | 
TypeScript types + Zod validation = type-safe access | +| ๐ŸŒ **Find local/EU providers** | [Provider overview](docs/providers.md) with market segmentation | +| ๐ŸŽฏ **Choose the right model** | [Model selection guide](docs/model-selection.md) โ€” decision framework | +| ๐Ÿ’ธ **Optimize API costs** | [Cached pricing](docs/cached-pricing.md) โ€” 1,374 models with 50-90% savings | +| ๐Ÿงช **Prototype for free** | [Free models](docs/free-models.md) โ€” 81 models at zero cost | +| ๐Ÿ’ฌ **Build chat apps** | [Chat models](docs/chat-models.md) โ€” 2,350 models with tool calling | +| ๐Ÿ–ผ๏ธ **Process images/audio** | [Multimodal models](docs/multimodal-models.md) โ€” 1,519 models with vision/audio/video | +| ๐Ÿ”Ž **Power semantic search** | [Embedding models](docs/embedding-models.md) โ€” vector search & RAG | +| ๐Ÿค– **Build AI agents** | [Agentic models](docs/agentic-models.md) โ€” 1,080 models with tool_call + reasoning | +| ๐Ÿ’ป **Generate & review code** | [Code models](docs/code-models.md) โ€” 189 code-focused models | +| ๐ŸŽ™๏ธ **Add voice/speech** | [Audio models](docs/audio-models.md) โ€” 118 audio input + 34 audio output | +| ๐Ÿ”„ **Switch from OpenAI** | [OpenAI alternatives](docs/openai-alternatives.md) โ€” pricing, free options, compat | + +## Quick Numbers + +| Metric | Count | +| --------------------------- | ----: | +| Providers | 95 | +| Model files | 4,587 | +| Unique model IDs | 2,712 | +| Model families | 441 | +| Reasoning models | 1,306 | +| Tool-calling models | 2,350 | +| Open-weight models | 527 | +| Free models | 81 | +| Vision (image input) models | 1,487 | +| Image output models | 28 | +| Audio input models | 118 | +| Audio output models | 34 | +| Video input models | 167 | + +## Data at a Glance + +Each model is a single YAML file with structured metadata: ```yaml -id: gpt-4o -name: GPT-4o -family: gpt-4o -reasoning: true +id: gpt-4.1 +name: GPT-4.1 +family: gpt-4.1 tool_call: true -attachment: true structured_output: true pricing: - input: 
2.5 - output: 10 - cache_read: 1.25 + input: 2.0 # USD per million tokens + output: 8.0 + cache_read: 0.5 limit: - context: 128000 - output: 16384 + context: 1047576 # tokens (~1M) + output: 32768 modalities: - input: - - text - - image - output: - - text -knowledge: "2023-10" -release_date: "2024-05-13" -last_updated: "2024-08-06" -snapshots: - - id: gpt-4o-2024-08-06 - - id: gpt-4o-2024-05-13 - deprecated: true + input: [text, image] + output: [text] +release_date: "2026-05-18" +last_updated: "2026-05-18" +``` + +
+Same model as JSON (from models.json) + +```json +{ + "id": "gpt-4.1", + "name": "GPT-4.1", + "family": "gpt-4.1", + "tool_call": true, + "structured_output": true, + "pricing": { "input": 2.0, "output": 8.0, "cache_read": 0.5 }, + "limit": { "context": 1047576, "output": 32768 }, + "modalities": { "input": ["text", "image"], "output": ["text"] }, + "release_date": "2026-05-18", + "last_updated": "2026-05-18" +} ``` +
+ ### Pricing Types | Type | When | Example | @@ -45,60 +229,252 @@ snapshots: | `UnitPricing` | Per-image or per-request | `unit: per_image, price: 0.04` | | `FreePricing` | No cost | `unit: free` | -See [`types/pricing.ts`](types/pricing.ts) for the full type definitions. +## Covered Providers + +
+Model Producers (develop their own models) + +- **Anthropic** โ€” Claude series +- **Google** โ€” Gemini series +- **Meta** โ€” Llama series +- **OpenAI** โ€” GPT series +- **DeepSeek** โ€” DeepSeek-V/R series +- **Alibaba Cloud** โ€” Qwen series +- **Mistral AI** โ€” Mistral series +- **Cohere** โ€” Command series +- **xAI** โ€” Grok series +- **Reka AI** โ€” Reka series +- **AI21 Labs** โ€” Jamba series +- **01.AI** โ€” Yi series +- **ByteDance** โ€” Doubao series +- **MiniMax** โ€” MiniMax series +- **Moonshot AI** โ€” Kimi series +- **Zhipu AI** โ€” GLM series +- **NVIDIA** โ€” Nemotron series +- **IBM** โ€” Granite series +- **Microsoft** โ€” Phi series +- **StepFun** โ€” Step series +- **iFlytek** โ€” SparkDesk series +- **Baidu** โ€” ERNIE series +- **Baichuan AI** โ€” Baichuan series +- **Tencent** โ€” Hunyuan series +- **Xiaomi** โ€” MiMo series +- **Sarvam AI** โ€” Sarvam series +- **InclusionAI** โ€” Book series +- **Writer** โ€” Palmyra series +- **Upstage** โ€” Solar series +- **Voyage AI** โ€” Voyage series + +
+ +
+Inference Platforms (host and serve models) + +- **Amazon Bedrock** โ€” Multi-provider inference on AWS +- **Azure OpenAI Service** โ€” OpenAI models on Azure +- **Google Vertex AI** โ€” Multi-provider inference on GCP +- **OpenRouter** โ€” 300+ models with unified API +- **Together AI** โ€” Open-source model hosting +- **Fireworks AI** โ€” Fast inference for open models +- **Groq** โ€” LPU-accelerated inference +- **Cerebras** โ€” CS-3 wafer-scale inference +- **DeepInfra** โ€” Cost-effective model hosting +- **SiliconFlow** โ€” GPU cloud inference +- **Novita AI** โ€” Multi-model API +- **SambaNova** โ€” SN40L accelerated inference +- **Cohere** โ€” Command models + hosted models +- **Databricks** โ€” MosaicML inference +- **Cloudflare Workers AI** โ€” Edge inference +- **DigitalOcean** โ€” GPU Droplets inference +- **Nebius** โ€” AI cloud inference +- **OVHcloud** โ€” AI Endpoints +- **Scaleway** โ€” GPU inference +- **Vultr** โ€” Cloud inference +- **Chutes** โ€” Community inference +- **Kluster AI** โ€” Distributed inference +- **NanoGPT** โ€” Simple API, 500+ models +- **And 40+ more platformsโ€ฆ** + +
+ +
+Full Provider List (95) -## Usage +01.AI ยท 302.AI ยท AI21 Labs ยท AIHubMix ยท AI/ML API ยท Aion Labs ยท Alibaba Cloud ยท Amazon Bedrock ยท Amazon Nova ยท Anthropic ยท Arcee AI ยท Auriko ยท Azure OpenAI ยท Baichuan AI ยท Baidu ยท Baseten ยท Berget ยท ByteDance ยท Cerebras ยท Chutes ยท Clarifai ยท CloudFerro Sherlock ยท Cloudflare Workers AI ยท Cohere ยท Cortecs ยท DInference ยท Databricks ยท DeepInfra ยท DeepSeek ยท DigitalOcean ยท evroc ยท FastRouter ยท Fireworks AI ยท FriendliAI ยท GMI Cloud ยท Google ยท Google Vertex AI ยท Groq ยท HPC-AI Cloud ยท Hyperbolic ยท IBM Granite ยท iFlytek SparkDesk ยท Inception Labs ยท InclusionAI ยท Inference.net ยท Kluster AI ยท LLM Gateway ยท Martian ยท MegaNova ยท Meta Llama ยท Microsoft Phi ยท MiniMax ยท Mistral AI ยท Mixlayer ยท MoArk AI ยท Moonshot AI ยท Morph ยท NanoGPT ยท Nebius ยท NeuralWatt ยท Nous Research ยท Novita AI ยท NVIDIA ยท OpenAI ยท OpenRouter ยท OrcaRouter ยท OVHcloud ยท PPIO ยท Perplexity ยท Privatemode AI ยท Qiniu AI ยท Regolo ยท Reka AI ยท Requesty ยท SambaNova ยท Sarvam AI ยท Scaleway ยท SiliconFlow ยท SiliconFlow CN ยท StepFun ยท SubModel ยท Tencent Cloud TokenHub ยท Tencent Hunyuan ยท TextSynth ยท Together AI ยท Upstage ยท Venice AI ยท Voyage AI ยท Vultr ยท Wafer ยท Writer ยท xAI Grok ยท Xiaomi ยท Zhipu AI ยท ๆŽฅๅฃ AI -### Install Dependencies +
+ +## Quick Start + +### Browse the Data + +No installation needed — just browse `providers/<provider>/models/` for YAML files. Every file is human-readable. + +### Install from npm + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types +``` + +### Install & Sync ```bash -# Sync a specific provider +# Install dependencies +npm install + +# Fetch latest data from a specific provider npx tsx scripts/sync.ts openai npx tsx scripts/sync.ts anthropic -# Sync all providers +# Fetch all providers npx tsx scripts/sync.ts + +# Validate all YAML files +npx tsx scripts/validate.ts + +# Compute catalog statistics +npx tsx scripts/stats.ts + +# Compile to a single models.json +npx tsx scripts/compile.ts +``` + +Or use the Makefile shortcuts: + +```bash +make install # npm install +make validate # validate all YAML +make scrape # sync all providers +make build # compile models.json +make stats # compute statistics +make check # run all checks (fmt + lint + typecheck + validate) ``` -### Validate Model Data +### Use Programmatically -Validate all YAML files against the Zod schemas: +```typescript +import { ModelSchema } from "./types/schemas"; +import { parse } from "yaml"; +import { readFileSync } from "fs"; + +// Load and validate a model +const raw = readFileSync("providers/openai/models/gpt-4.1.yaml", "utf-8"); +const model = ModelSchema.parse(parse(raw)); + +console.log(model.pricing); // { input: 2, output: 8, cache_read: 0.5 } +console.log(model.limit); // { context: 1047576, output: 32768 } +console.log(model.modalities); // { input: ["text", "image"], output: ["text"] } +``` + +### Download Data + +Available in JSON and CSV formats from [GitHub Releases](https://github.com/i-need-token/ai-models/releases/latest): ```bash -npx tsx scripts/validate.ts +# JSON — full 
metadata (2.3 MB) +curl -sLO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +```html + + +``` + +```python +# Python โ€” no pip install needed +import urllib.request, json +catalog = json.loads(urllib.request.urlopen("https://github.com/i-need-token/ai-models/releases/latest/download/models.json").read()) +print(len(catalog['models'])) # 4587 +``` + +```bash +# Quick stats with jq +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +``` + +See [API & Programmatic Access](docs/api.md) for full usage examples in JavaScript and Python. + +### Use as GitHub Action + +```yaml +- uses: i-need-token/ai-models@main + id: catalog + +- name: Use catalog data + run: | + echo "Models: ${{ steps.catalog.outputs.model-count }}" + echo "Providers: ${{ steps.catalog.outputs.provider-count }}" + echo "File: ${{ steps.catalog.outputs.file-path }}" +``` + +Download a specific version or format: + +```yaml +- uses: i-need-token/ai-models@main + with: + version: v0.1.0 # specific release tag + format: csv # csv or json + output-dir: data # directory to save files ``` +See [`action.yml`](action.yml) for all inputs and outputs. + +
+๐ŸŽฌ Live demo output (from our CI) + +``` +๐Ÿ“Š 4587 models from 87 providers +๐Ÿ“ Data saved to model-data/models.json + +๐Ÿ’ฐ Cheapest tool-calling models: + bdc-coder: $0.01/$0.01/M tokens + ling-2.6-flash: $0.01/$0.03/M tokens + klusterai--Meta-Llama-3.1-8B-Instruct-Turbo: $0.015/$0.02/M tokens + granite-4.0-h-micro: $0.017/$0.112/M tokens + +๐Ÿ†“ Free reasoning models: + gemma-4-26b-a4b-it: 262K context + gemma-4-31b-it: 262K context +``` + +_[View the live workflow โ†’](https://github.com/i-need-token/ai-models/actions/workflows/demo.yml)_ + +
+ ## Project Structure ``` -├── providers/ -│ ├── openai/ -│ │ ├── scrape.ts # Data acquisition from OpenAI's website -│ │ └── models/ # YAML model data files -│ └── anthropic/ -│ ├── scrape.ts # Data acquisition from Anthropic's website -│ └── models/ # YAML model data files -├── types/ -│ ├── model.ts # Model and Snapshot type definitions -│ ├── pricing.ts # Pricing type definitions -│ ├── provider.ts # Provider type definitions -│ ├── schemas.ts # Zod runtime validation schemas -│ └── index.ts # Re-exports -├── scripts/ -│ ├── sync.ts # Orchestration: scrape → write YAML -│ ├── validate.ts # Validate all YAML against schemas -│ └── lib/ # Shared utilities (defineModel, defineProvider, writer) -└── docs/ - ├── data-acquisition.md # How we acquire and update model data - └── lessons-learned.md # Design principles and pitfalls +├── providers/ # 95 provider directories +│ └── <provider>/ +│ ├── provider.yaml # Provider metadata (name, URL, API endpoints) +│ ├── scrape.ts # Data acquisition script +│ ├── models/ # YAML model data files +│ └── README.md # Provider-specific notes +├── types/ # TypeScript type definitions + Zod schemas +│ ├── model.ts # Model, Snapshot, ModelModality +│ ├── pricing.ts # TokenPricing, VideoPricing, UnitPricing, FreePricing +│ ├── provider.ts # Provider, ProviderGroup +│ └── schemas.ts # Zod runtime validation +├── scripts/ # CLI tools +│ ├── sync.ts # Orchestration: scrape → write YAML +│ ├── validate.ts # Validate all YAML against schemas +│ ├── stats.ts # Compute catalog statistics +│ ├── compile.ts # Compile to dist/models.json +│ └── lib/ # Shared utilities +└── docs/ # Documentation (English + 中文) ``` ## Adding a New Provider @@ -111,17 +487,217 @@ npx 
tsx scripts/validate.ts See [`docs/data-acquisition.md`](docs/data-acquisition.md) for detailed guidelines. +## Documentation + +| Document | Description | +| ------------------------------------------------------------------- | --------------------------------------------------------------- | +| [Tool Calling Models](docs/tool-calling.md) | 2,350 tool-calling models โ€” cheapest, largest context, free | +| [Vision Models](docs/vision-models.md) | 1,487 vision models โ€” cheapest, largest context, open-weight | +| [Image Generation](docs/image-generation.md) | 28 image generation models โ€” DALLยทE, Imagen, GPT-5 Image | +| [Audio Models](docs/audio-models.md) | 118 audio input + 34 audio output models | +| [Code Models](docs/code-models.md) | 189 code-focused models across 41 providers | +| [Agentic Models](docs/agentic-models.md) | 1,080 models with tool calling + reasoning for AI agents | +| [Chat Models](docs/chat-models.md) | 2,350 models with tool calling for chat applications | +| [Multimodal Models](docs/multimodal-models.md) | 1,519 models with image/audio/video input | +| [Embedding Models](docs/embedding-models.md) | 5 embedding models for search, RAG, similarity | +| [Video Models](docs/video-models.md) | 167 video input + 4 video output models | +| [Structured Output](docs/structured-output.md) | 829 JSON-mode models โ€” cheapest, free, with tool calling | +| [๐Ÿ” Interactive Catalog](https://i-need-token.github.io/ai-models/) | Search, sort, and filter all 4,587 models in your browser | +| [Quick Start Guide](docs/quick-start.md) | Find the right model in 30 seconds | +| [Model Selection Guide](docs/model-selection.md) | Decision framework: free, best value, large context models | +| [Model Selection Cheatsheet](docs/model-selection-cheatsheet.md) | Quick-reference: best model by budget and use case | +| [AI Model Picker](docs/ai-model-picker.md) | 4-question wizard: find the best model for your use case | +| [Benchmarks & 
Leaderboards](docs/benchmarks.md) | MMLU, MATH, HumanEval, SWE-bench, Chatbot Arena guide | +| [Migration Guide](docs/migration-guide.md) | Switch providers โ€” pricing, API compatibility, checklist | +| [API & Programmatic Access](docs/api.md) | Download models.json, code examples in JS/Python | +| [Code Examples](docs/code-examples.md) | Practical examples in TypeScript, Python, Go, Rust, jq | +| [FAQ](docs/faq.md) | Common questions about the catalog, data, and contributing | +| [Glossary](docs/glossary.md) | Key terms and definitions for AI model terminology | +| [Model Comparison](docs/model-comparison.md) | Compare flagship, cost-effective, free, and open-weight models | +| [Pricing Comparison](docs/pricing-comparison.md) | Side-by-side pricing across providers and platforms | +| [Cached Pricing](docs/cached-pricing.md) | 1,374 models with prompt caching โ€” 50-90% input cost savings | +| [Modality Matrix](docs/modality-matrix.md) | Vision, image gen, audio, video โ€” which models support what | +| [Context Window Comparison](docs/context-windows.md) | Largest context windows, best value per tier | +| [Large Context Models](docs/large-context-models.md) | 2,195 models with 128K+ context โ€” 397 with 1M+ | +| [Small & Edge Models](docs/small-models.md) | 1,153 models under 10B params for on-device use | +| [Provider Comparison](docs/provider-comparison.md) | Top 30 providers by model count, capabilities, pricing | +| [Free AI Models](docs/free-models.md) | 81 free models โ€” tool calling, reasoning, vision at no cost | +| [Open-Weight Models](docs/open-weights.md) | 513 open-weight models โ€” run on your own infrastructure | +| [Reasoning Models](docs/reasoning-models.md) | 1,306 reasoning models โ€” chain-of-thought and extended thinking | +| [OpenAI Alternatives](docs/openai-alternatives.md) | GPT-4/GPT-3.5 alternatives โ€” pricing, free options, compat | +| [Provider Overview](docs/providers.md) | All 95 providers organized by type and market | +| [Data 
Schema Reference](docs/data-schema.md) | Complete YAML schema โ€” model, pricing, snapshot, provider | +| [Data Acquisition](docs/data-acquisition.md) | How we acquire and update model data | +| [Design Principles & Pitfalls](docs/lessons-learned.md) | Lessons learned from building the catalog | + +**ไธญๆ–‡ๆ–‡ๆกฃ๏ผš** + +| ๆ–‡ๆกฃ | ๆ่ฟฐ | +| ------------------------------------------------------- | ------------------------------------------------ | +| [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](docs/zh/tool-calling.md) | 2,350 ไธชๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ โ€” ๆœ€ไพฟๅฎœใ€ๆœ€ๅคงไธŠไธ‹ๆ–‡ใ€ๅ…่ดน | +| [่ง†่ง‰ๆจกๅž‹](docs/zh/vision-models.md) | 1,487 ไธช่ง†่ง‰ๆจกๅž‹ โ€” ๆœ€ไพฟๅฎœใ€ๆœ€ๅคงไธŠไธ‹ๆ–‡ใ€ๅผ€ๆบๆƒ้‡ | +| [ๅฟซ้€Ÿๅ…ฅ้—จ](docs/zh/quick-start.md) | 30 ็ง’ๅ†…ๆ‰พๅˆฐ้€‚ๅˆ็š„ๆจกๅž‹ | +| [ๅ›พๅƒ็”Ÿๆˆ](docs/zh/image-generation.md) | 28 ไธชๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ โ€” DALLยทEใ€Imagenใ€GPT-5 Image | +| [้Ÿณ้ข‘ๆจกๅž‹](docs/zh/audio-models.md) | 118 ไธช้Ÿณ้ข‘่พ“ๅ…ฅ + 34 ไธช้Ÿณ้ข‘่พ“ๅ‡บๆจกๅž‹ | +| [่ง†้ข‘ๆจกๅž‹](docs/zh/video-models.md) | 167 ไธช่ง†้ข‘่พ“ๅ…ฅ + 4 ไธช่ง†้ข‘่พ“ๅ‡บๆจกๅž‹ | +| [API ไธŽ็ผ–็จ‹่ฎฟ้—ฎ](docs/zh/api.md) | ไธ‹่ฝฝ models.json๏ผŒJS/Python ไปฃ็ ็คบไพ‹ | +| [ไปฃ็ ็คบไพ‹](docs/zh/code-examples.md) | TypeScriptใ€Pythonใ€Goใ€Rustใ€jq ๅฎž็”จ็คบไพ‹ | +| [ๅธธ่ง้—ฎ้ข˜](docs/zh/faq.md) | ๅ…ณไบŽ็›ฎๅฝ•ใ€ๆ•ฐๆฎๅ’Œ่ดก็Œฎ็š„ๅธธ่ง้—ฎ้ข˜ | +| [็ป“ๆž„ๅŒ–่พ“ๅ‡บ](docs/zh/structured-output.md) | 829 ไธช JSON ๆจกๅผๆจกๅž‹ โ€” ๆœ€ไพฟๅฎœใ€ๅ…่ดนใ€ๅธฆๅทฅๅ…ท่ฐƒ็”จ | +| [ๆจกๅž‹ๅฏนๆฏ”](docs/zh/model-comparison.md) | ๆ——่ˆฐใ€้ซ˜ๆ€งไปทๆฏ”ใ€ๅ…่ดนๅ’Œๅผ€ๆบๆจกๅž‹ๅฏนๆฏ” | +| [ๅฎšไปทๅฏนๆฏ”](docs/zh/pricing-comparison.md) | ๅ„ๆไพ›ๅ•†ๅ’ŒๅนณๅฐๅฎšไปทๅนถๆŽ’ๅฏนๆฏ” | +| [็ผ“ๅญ˜ๅฎšไปท](docs/zh/cached-pricing.md) | 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ โ€” ่พ“ๅ…ฅๆˆๆœฌ่Š‚็œ 50-90% | +| [ๆจกๆ€็Ÿฉ้˜ต](docs/zh/modality-matrix.md) | ่ง†่ง‰ใ€ๅ›พๅƒ็”Ÿๆˆใ€้Ÿณ้ข‘ใ€่ง†้ข‘ โ€” ๅ„ๆจกๅž‹ๆ”ฏๆŒไป€ไนˆ | +| [ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ”](docs/zh/context-windows.md) | ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผŒๅ„ๅฑ‚็บงๆœ€ไฝณๆ€งไปทๆฏ” | 
+| [ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹](docs/zh/large-context-models.md) | 2,195 ไธช 128K+ ไธŠไธ‹ๆ–‡ๆจกๅž‹ โ€” 397 ไธช 1M+ | +| [ๅฐๅž‹/่พน็ผ˜ๆจกๅž‹](docs/zh/small-models.md) | 1,153 ไธช 10B ๅ‚ๆ•ฐไปฅไธ‹ๆจกๅž‹๏ผŒ้€‚ๅˆ็ซฏไพง้ƒจ็ฝฒ | +| [ๆไพ›ๅ•†ๅฏนๆฏ”](docs/zh/provider-comparison.md) | ๆŒ‰ๆจกๅž‹ๆ•ฐ้‡ใ€่ƒฝๅŠ›ใ€ๅฎšไปทๅฏนๆฏ”ๅ‰ 30 ไธชๆไพ›ๅ•† | +| [ๅ…่ดน AI ๆจกๅž‹](docs/zh/free-models.md) | 81 ไธชๅ…่ดนๆจกๅž‹ โ€” ๅทฅๅ…ท่ฐƒ็”จใ€ๆŽจ็†ใ€่ง†่ง‰้›ถๆˆๆœฌ | +| [ๅผ€ๆบๆƒ้‡ๆจกๅž‹](docs/zh/open-weights.md) | 513 ไธชๅผ€ๆบๆƒ้‡ๆจกๅž‹ โ€” ่‡ชๆœ‰ๅŸบ็ก€่ฎพๆ–ฝ่ฟ่กŒ | +| [ๆไพ›ๅ•†ๆฆ‚่งˆ](docs/zh/providers.md) | 95 ไธชๆไพ›ๅ•†ๆŒ‰็ฑปๅž‹ๅ’Œๅธ‚ๅœบๅˆ†็ฑป | +| [ๆŽจ็†ๆจกๅž‹](docs/zh/reasoning-models.md) | 1,306 ไธชๆŽจ็†ๆจกๅž‹ โ€” ้“พๅผๆ€็ปดๅ’Œๆ‰ฉๅฑ•ๆ€่€ƒ | +| [ๆ•ฐๆฎ Schema ๅ‚่€ƒ](docs/zh/data-schema.md) | ๅฎŒๆ•ด YAML Schema โ€” ๆจกๅž‹ใ€ๅฎšไปทใ€ๅฟซ็…งใ€ๆไพ›ๅ•† | +| [ๆ•ฐๆฎ้‡‡้›†](docs/zh/data-acquisition.md) | ๆ•ฐๆฎ้‡‡้›†ๆŒ‡ๅ— | +| [่ฎพ่ฎกๅŽŸๅˆ™ไธŽ้™ท้˜ฑ](docs/zh/lessons-learned.md) | ็ป้ชŒๆ•™่ฎญ | +| [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](docs/zh/agentic-models.md) | 1,080 ไธชๅทฅๅ…ท่ฐƒ็”จ+ๆŽจ็†ๆจกๅž‹๏ผŒ็”จไบŽ AI ๆ™บ่ƒฝไฝ“ | +| [ไปฃ็ ๆจกๅž‹](docs/zh/code-models.md) | 189 ไธชไปฃ็ ๆจกๅž‹๏ผš็”Ÿๆˆใ€ๅฎกๆŸฅใ€่ฐƒ่ฏ• | +| [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](docs/zh/openai-alternatives.md) | GPT-4/GPT-3.5 ๆ›ฟไปฃๆ–นๆกˆ๏ผšๅฎšไปทใ€ๅ…่ดน้€‰้กนใ€ๅ…ผๅฎนๆ€ง | +| [่Šๅคฉๆจกๅž‹](docs/zh/chat-models.md) | 2,350 ไธชๅธฆๅทฅๅ…ท่ฐƒ็”จ็š„่Šๅคฉๆจกๅž‹ | +| [ๅคšๆจกๆ€ๆจกๅž‹](docs/zh/multimodal-models.md) | 1,519 ไธชๆ”ฏๆŒๅ›พๅƒ/้Ÿณ้ข‘/่ง†้ข‘่พ“ๅ…ฅ็š„ๆจกๅž‹ | +| [ๅตŒๅ…ฅๆจกๅž‹](docs/zh/embedding-models.md) | 5 ไธชๅตŒๅ…ฅๆจกๅž‹็”จไบŽๆœ็ดขใ€RAGใ€็›ธไผผๅบฆ | +| [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](docs/zh/model-selection.md) | ๅ†ณ็ญ–ๆก†ๆžถ๏ผšๅ…่ดนใ€ๆœ€ไฝณๆ€งไปทๆฏ”ใ€ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ | +| [ๆจกๅž‹้€‰ๆ‹ฉ้€ŸๆŸฅ่กจ](docs/zh/model-selection-cheatsheet.md) | ๆŒ‰้ข„็ฎ—ๅ’Œไฝฟ็”จๅœบๆ™ฏๅฟซ้€Ÿ้€‰ๆ‹ฉๆจกๅž‹ | +| [่ฟ็งปๆŒ‡ๅ—](docs/zh/migration-guide.md) | ๅˆ‡ๆขๆไพ›ๅ•†๏ผšๅฎšไปทใ€API ๅ…ผๅฎนๆ€งใ€ๆฃ€ๆŸฅๆธ…ๅ• | +| [ๆœฏ่ฏญ่กจ](docs/zh/glossary.md) | AI 
ๆจกๅž‹ๆœฏ่ฏญ็š„ๅ…ณ้”ฎ่ฏๅ’Œๅฎšไน‰ | + ## Design Principles - **First-party data only** โ€” all model data comes from the provider's own API or website - **Dynamic discovery** โ€” scrape functions discover models from the source, not from hardcoded lists -- **Include deprecated, exclude retired** โ€” deprecated models are included with a `deprecated: true` flag; retired (inaccessible) models are excluded +- **Include deprecated, exclude retired** โ€” deprecated models are included with `deprecated: true`; retired (inaccessible) models are excluded - **Never fabricate data** โ€” if required data is missing, skip the model with a warning rather than filling in guessed values - **YAML source format** โ€” human-readable, supports comments, machine-parseable - **Snapshot inheritance** โ€” dated model versions are nested within the parent model, inheriting all fields -See [`docs/lessons-learned.md`](docs/lessons-learned.md) for the full set of design principles and pitfalls. +## Contributing + +Contributions are welcome! Whether it's adding a new provider, fixing data, or improving documentation: + +1. Fork the repository +2. Create your feature branch (`git checkout -b feature/my-provider`) +3. Follow the [data acquisition guidelines](docs/data-acquisition.md) +4. Validate your changes (`npx tsx scripts/validate.ts`) +5. Submit a pull request + +Please read [CONTRIBUTING.md](CONTRIBUTING.md) for detailed guidelines. 
+ +## Alternatives + +| Project | Scope | Data Source | Format | Auto-Update | Free | +| ------------------------------------------------------------------------- | --------------------------- | ---------------- | ----------------- | ----------- | ------- | +| **This catalog** | 95 providers, 4,587+ models | First-party APIs | YAML + JSON + CSV | Weekly CI | โœ… | +| [Artificial Analysis](https://artificialanalysis.ai/) | ~30 providers | Mixed | Web UI | โœ… | Partial | +| [LLM Price](https://llmprice.com/) | ~25 providers | Mixed | Web UI | โœ… | โœ… | +| [OpenRouter models](https://openrouter.ai/models) | OpenRouter only | OpenRouter API | Web UI | โœ… | โœ… | +| [Helicone models](https://helicone.ai/models) | ~20 providers | Mixed | Web UI | โœ… | Partial | +| [BerriAI/litellm](https://github.com/BerriAI/litellm) | 100+ providers | Community | Python config | โœ… | โœ… | +| [dariubs/awesome-ai-models](https://github.com/dariubs/awesome-ai-models) | ~20 providers | Manual | Markdown list | โŒ | โœ… | +| [Vellum AI](https://www.vellum.ai/) | ~15 providers | Mixed | Web UI + API | โœ… | Partial | +| [openai/models](https://github.com/openai/openai-python) | OpenAI only | OpenAI API | Python SDK | โœ… | โœ… | + +**Key differentiators of this catalog:** + +- **First-party data only** โ€” scraped directly from provider APIs, not aggregated from third parties +- **Machine-readable YAML** โ€” structured data with Zod validation, not just a web UI +- **Multiple access formats** โ€” npm, CDN, CSV, GitHub Action, Hugging Face dataset +- **Comprehensive metadata** โ€” pricing, context windows, modalities, capabilities, snapshots +- **Bilingual docs** โ€” 34 English + 34 Chinese documentation pages +- **Open data** โ€” all model data is open and programmatically accessible + +## Ecosystem & Integrations + +| Integration | Description | Link | +| ------------------------ | ------------------------------------------------------- | 
---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| **npm package** | Install models.json via npm | [`npm install ai-models`](https://www.npmjs.com/package/ai-models) | +| **jsDelivr CDN** | Fetch models.json from CDN | 
[cdn.jsdelivr.net/npm/ai-models](https://cdn.jsdelivr.net/npm/ai-models@latest/models.json) | +| **GitHub Action** | Use in CI/CD workflows | [action.yml](action.yml) | +| **Hugging Face** | Dataset on HF Hub | [huggingface.co/datasets/i-need-token/ai-models](https://huggingface.co/datasets/i-need-token/ai-models) | +| **CSV download** | Import into Excel/Sheets | [GitHub Releases](https://github.com/i-need-token/ai-models/releases) | +| **Interactive catalog** | Search, filter, compare, price calculator, model picker | [i-need-token.github.io/ai-models](https://i-need-token.github.io/ai-models/) | +| **SEO comparison pages** | 21 curated comparison pages for discoverability | [Best Models](https://i-need-token.github.io/ai-models/best-ai-models.html), [Free Models](https://i-need-token.github.io/ai-models/free-ai-models.html), [Pricing](https://i-need-token.github.io/ai-models/llm-pricing.html), [OpenAI Alt](https://i-need-token.github.io/ai-models/openai-alternatives.html), [By Provider](https://i-need-token.github.io/ai-models/ai-models-by-provider.html), [Context](https://i-need-token.github.io/ai-models/context-window-comparison.html), [Coding](https://i-need-token.github.io/ai-models/best-ai-models-for-coding.html), [Agents](https://i-need-token.github.io/ai-models/best-ai-models-for-agents.html), [Reasoning](https://i-need-token.github.io/ai-models/reasoning-models-comparison.html), [Cheapest](https://i-need-token.github.io/ai-models/cheapest-ai-models.html), [Tool Calling](https://i-need-token.github.io/ai-models/tool-calling-models-comparison.html), [Pricing Calc](https://i-need-token.github.io/ai-models/ai-model-pricing-calculator.html), [Image Gen](https://i-need-token.github.io/ai-models/best-ai-models-for-image-generation.html), [Vision](https://i-need-token.github.io/ai-models/best-ai-models-for-vision.html), [Structured Output](https://i-need-token.github.io/ai-models/structured-output-models-comparison.html), [Open 
Source](https://i-need-token.github.io/ai-models/open-source-ai-models.html), [Multimodal](https://i-need-token.github.io/ai-models/multimodal-ai-models.html), [State of AI](https://i-need-token.github.io/ai-models/state-of-ai-models.html), [Benchmarks](https://i-need-token.github.io/ai-models/ai-model-benchmarks.html), [ChatGPT vs Claude vs Gemini](https://i-need-token.github.io/ai-models/chatgpt-vs-claude-vs-gemini.html), [Comparison Chart](https://i-need-token.github.io/ai-models/ai-model-comparison-chart.html) | + +## What's New + +### v0.2.0 (May 2025) + +- **21 SEO comparison pages** โ€” Best Models, Free Models, LLM Pricing, OpenAI Alternatives, By Provider, Context Windows, Coding, Agents, Reasoning, Cheapest, Tool Calling, Pricing Calculator, Image Generation, Open Source, Multimodal, State of AI Models 2025 +- **Interactive catalog** โ€” 25+ features including dark/light theme, keyboard shortcuts, model detail modal, price calculator, model picker wizard, copy as code, share button, j/k vim navigation +- **95 providers** โ€” comprehensive coverage of all major AI providers +- **4,587+ models** โ€” with pricing, context windows, modalities, and capabilities +- **GitHub Action v2** โ€” version, format, and output-dir inputs +- **npm package** โ€” `npm install ai-models` +- **70 docs** โ€” 35 EN + 35 ZH, all bilingual, all cross-linked + +## Roadmap + +- [x] ~~Embedding models documentation~~ โ†’ [docs/embedding-models.md](docs/embedding-models.md) +- [x] ~~Provider comparison~~ โ†’ [docs/provider-comparison.md](docs/provider-comparison.md) +- [x] ~~Large context models~~ โ†’ [docs/large-context-models.md](docs/large-context-models.md) +- [x] ~~Small/edge models~~ โ†’ [docs/small-models.md](docs/small-models.md) +- [x] ~~Migration guide~~ โ†’ [docs/migration-guide.md](docs/migration-guide.md) +- [ ] Model benchmarking data integration +- [ ] Streaming support metadata +- [ ] Fine-tuning availability tracking +- [ ] Regional availability data +- [ ] 
Community-contributed model reviews +- ๐Ÿ”œ **REST API** โ€” hosted API for querying the catalog +- ๐Ÿ”œ **Historical pricing** โ€” track pricing changes over time +- ๐Ÿ”œ **Community scrapers** โ€” enable community-contributed scrape scripts with automated validation + +## Who's Using This? + +Built something with this catalog? [Open a PR](https://github.com/i-need-token/ai-models/edit/main/README.md) to add your project! + +| Use Case | How the Catalog Is Used | +| -------------------------- | ------------------------------------------------------------------------ | +| **AI API gateways** | Route requests to the cheapest provider with real-time pricing data | +| **Model comparison tools** | Compare capabilities, context windows, and costs across providers | +| **Cost optimization** | Find the cheapest model for each task (reasoning, vision, tool calling) | +| **AI agent frameworks** | Select models with tool calling + structured output for agent workflows | +| **Research & analysis** | Track the AI landscape โ€” 2,712 models with release dates and deprecation | +| **CI/CD pipelines** | Use the [GitHub Action](action.yml) to fetch model data in workflows | +| **Data dashboards** | Import CSV into Excel/Google Sheets for visual pricing analysis | +| **Chatbot builders** | Pick the right model by context window, modality, and budget | + +## Contributors + +Thanks to everyone who has contributed to this catalog! + + + + +Want to contribute? Check out [CONTRIBUTING.md](CONTRIBUTING.md) for guidelines. 
+ +- ๐Ÿ“‹ [Changelog](CHANGELOG.md) โ€” what's new in each release +- ๐Ÿ”’ [Security Policy](SECURITY.md) โ€” reporting vulnerabilities + +## Project Timeline + +| Date | Milestone | +| ------- | ----------------------------------------------------------- | +| 2026-05 | ๐Ÿš€ Public launch โ€” 4,587 models, 95 providers, 68 docs | +| 2026-05 | ๐Ÿ“Š Interactive catalog live at GitHub Pages | +| 2026-05 | ๐Ÿ“ฆ npm package, CSV export, GitHub Action | +| 2026-05 | ๐ŸŒ Bilingual docs โ€” 34 EN + 34 ZH pages | +| 2026-05 | ๐Ÿค– 1,080 agentic models, 2,350 tool-calling models | +| Future | ๐Ÿ“ˆ More providers, REST API, historical pricing, benchmarks | + +[![Star History Chart](https://api.star-history.com/svg?repos=i-need-token/ai-models&type=Date)](https://star-history.com/#i-need-token/ai-models&Date) + +## Sponsors + +Support this project by [sponsoring us on GitHub](https://github.com/sponsors/i-need-token). Your sponsorship helps maintain and expand the catalog. ## License -MIT +[MIT](LICENSE) diff --git a/SECURITY.md b/SECURITY.md new file mode 100644 index 00000000..79af03c5 --- /dev/null +++ b/SECURITY.md @@ -0,0 +1,24 @@ +# Security Policy + +## Reporting a Vulnerability + +If you discover a security vulnerability in this project, please report it by opening a [GitHub Security Advisory](https://github.com/i-need-token/ai-models/security/advisories/new). + +Please do not report security vulnerabilities through public GitHub issues. + +## Scope + +This project is a data catalog โ€” it contains YAML model data files, TypeScript type definitions, and scrape scripts. 
Security vulnerabilities in this context would include: + +- Malicious code in scrape scripts that could compromise the build environment +- Supply chain vulnerabilities in dependencies +- Data integrity issues where model data is intentionally corrupted + +Out of scope: + +- Incorrect model pricing or capability data (report as a [bug](https://github.com/i-need-token/ai-models/issues/new?labels=bug&template=bug_report.md)) +- Missing providers or models (report as a [provider request](https://github.com/i-need-token/ai-models/issues/new?labels=enhancement&template=provider_request.md)) + +## Response Time + +We aim to acknowledge security reports within 48 hours and provide a fix within 7 days. diff --git a/action.yml b/action.yml new file mode 100644 index 00000000..af4a71c7 --- /dev/null +++ b/action.yml @@ -0,0 +1,71 @@ +name: "AI Models Catalog" +description: "Download AI model metadata (pricing, context windows, capabilities) from the AI Models Catalog" +author: "i-need-token" +branding: + icon: "database" + color: "blue" + +inputs: + version: + description: "Release version to download (latest, or a specific tag like v0.1.0)" + required: false + default: "latest" + format: + description: "Output format: json or csv" + required: false + default: "json" + output-dir: + description: "Directory to save the downloaded file" + required: false + default: "ai-models" + +outputs: + model-count: + description: "Number of models in the catalog" + value: ${{ steps.download.outputs.model-count }} + provider-count: + description: "Number of providers in the catalog" + value: ${{ steps.download.outputs.provider-count }} + file-path: + description: "Path to the downloaded file" + value: ${{ steps.download.outputs.file-path }} + +runs: + using: "composite" + steps: + - id: download + shell: bash + run: | + VERSION="${{ inputs.version }}" + FORMAT="${{ inputs.format }}" + OUTPUT_DIR="${{ inputs.output-dir }}" + BASE_URL="https://github.com/i-need-token/ai-models/releases" + + 
mkdir -p "$OUTPUT_DIR" + + if [ "$VERSION" = "latest" ]; then + DOWNLOAD_URL="$BASE_URL/latest/download/models.$FORMAT" + else + DOWNLOAD_URL="$BASE_URL/download/$VERSION/models.$FORMAT" + fi + + echo "๐Ÿ“ฅ Downloading models.$FORMAT from $DOWNLOAD_URL" + HTTP_CODE=$(curl -sL -w "%{http_code}" -o "$OUTPUT_DIR/models.$FORMAT" "$DOWNLOAD_URL") + + if [ "$HTTP_CODE" -ne 200 ]; then + echo "โŒ Failed to download (HTTP $HTTP_CODE)" + exit 1 + fi + + FILE_SIZE=$(wc -c < "$OUTPUT_DIR/models.$FORMAT" | tr -d ' ') + echo "โœ… Downloaded models.$FORMAT ($FILE_SIZE bytes)" + + if [ "$FORMAT" = "json" ]; then + MODEL_COUNT=$(python3 -c "import json; d=json.load(open('$OUTPUT_DIR/models.json')); print(len(d.get('models', d)))" 2>/dev/null || echo "0") + PROVIDER_COUNT=$(python3 -c "import json; d=json.load(open('$OUTPUT_DIR/models.json')); print(len(d.get('providers', [])))" 2>/dev/null || echo "0") + echo "๐Ÿ“Š $MODEL_COUNT models from $PROVIDER_COUNT providers" + echo "model-count=$MODEL_COUNT" >> "$GITHUB_OUTPUT" + echo "provider-count=$PROVIDER_COUNT" >> "$GITHUB_OUTPUT" + fi + + echo "file-path=$OUTPUT_DIR/models.$FORMAT" >> "$GITHUB_OUTPUT" diff --git a/docs/agentic-models.md b/docs/agentic-models.md new file mode 100644 index 00000000..e2ef293f --- /dev/null +++ b/docs/agentic-models.md @@ -0,0 +1,97 @@ +**English** | [ไธญๆ–‡](./zh/agentic-models.md) + +# Agentic AI Models โ€” 1,080 Models for AI Agents + +Models with **tool calling + reasoning** capabilities โ€” the essential building blocks for AI agents, autonomous workflows, and multi-step task execution. All data sourced from first-party APIs via the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## What Makes a Model "Agentic"? 
+ +An agentic model can: + +- **Call tools/functions** โ€” interact with APIs, databases, and external systems +- **Reason step-by-step** โ€” plan, decompose tasks, and verify results +- **Act autonomously** โ€” make decisions and take actions without human intervention + +These capabilities are what separate chatbots from AI agents. + +## Stats + +| Metric | Count | +| ---------------------- | ----- | +| Agentic models | 1076 | +| Providers | 51 | +| With vision | 617 | +| With structured output | 453 | +| Free | 30 | +| Open weights | 64 | + +## Cheapest Agentic Models (Direct Providers) + +| Model | Provider | Context | Input $/1M | Output $/1M | Vision | +| ------------------------------ | ------------ | ------- | ---------- | ----------- | ------ | +| qwen--qwen3-4b-fp8 | novitaai | 125K | $0.03 | $0.03 | | +| openai--gpt-oss-20b | neuralwatt | 0 | $0.03 | $0.16 | | +| openai--gpt-oss-120b | novitaai | 128K | $0.05 | $0.25 | โœ… | +| gpt-oss-120b | inferencenet | 128K | $0.05 | $0.45 | | +| Qwen--Qwen3.6-35B-A3B | neuralwatt | 0 | $0.05 | $0.1 | โœ… | +| qwen3-30b-a3b-fp8 | cloudflare | 40K | $0.051 | $0.335 | | +| glm-4.7-flash | cloudflare | 128K | $0.06 | $0.4 | | +| Nemotron-3-Nano-Omni | nebius | 125K | $0.06 | $0.24 | โœ… | +| hermes-4-llama-3.1-8b | nousresearch | 128K | $0.06 | $0.12 | | +| zai-org--glm-4.7-flash | novitaai | 195K | $0.07 | $0.4 | | +| ring-2.6-1t | inclusionai | 256K | $0.07 | $0.62 | | +| seed-1.6-flash | bytedance | 256K | $0.07 | $0.3 | โœ… | +| microsoft-phi-4-mini-reasoning | microsoft | 125K | $0.075 | $0.3 | | +| Qwen--Qwen3-32B-TEE | chutes | 40K | $0.08 | $0.24 | | +| qwen--qwen3-30b-a3b-fp8 | novitaai | 40K | $0.09 | $0.45 | | + +## Free Agentic Models + +| Model | Provider | Context | Vision | Structured Output | +| --------------------------------- | -------- | ------- | ------ | ----------------- | +| glm-4.1v-thinking-flash | zhipuai | 62K | โœ… | โœ… | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | 64K | โœ… | โœ… | 
+| qwen--qwen3.5-4b-free | mixlayer | 128K | | | + +## Largest Context Agentic Models + +| Model | Provider | Context | Input $/1M | Output $/1M | +| --------------------------- | ----------- | ------- | ---------- | ----------- | +| deepseek-v4-flash | baidu | 1024K | $0.126 | $0.252 | +| deepseek-v4-pro | siliconflow | 1024K | $1.74 | $3.48 | +| deepseek-v4-flash | siliconflow | 1024K | $0.14 | $0.28 | +| deepseek--deepseek-v4-pro | novitaai | 1024K | $1.67 | $3.38 | +| xiaomimimo--mimo-v2.5-pro | novitaai | 1024K | $2 | $6 | +| deepseek--deepseek-v4-flash | novitaai | 1024K | $0.14 | $0.28 | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | +| gemini-2.5-pro | google | 1024K | $1.25 | $10 | +| deepseek-v4-pro | fireworks | 1024K | $1.74 | $3.48 | +| xiaomi--mimo-v2.5-pro | hpc-ai | 1024K | $1 | $3 | +| xiaomi--mimo-v2.5 | hpc-ai | 1024K | $0.4 | $2 | +| mimo-v2.5-pro | xiaomi | 1024K | $1 | $3 | +| mimo-v2-pro | xiaomi | 1024K | $1 | $3 | +| minimaxai--minimax-m1-80k | novitaai | 976K | $0.55 | $2.2 | +| qwen3.6-flash | alibaba | 976K | $1.2 | $7.2 | + +## Building AI Agents + +| Agent Type | Recommended Models | Key Capabilities | +| ---------------- | --------------------------- | ------------------------------ | +| Code agents | Claude Sonnet 4, GPT-4.1 | Tool call + reasoning + code | +| Research agents | Gemini 2.5 Pro, DeepSeek R1 | Large context + reasoning | +| Data agents | Claude Sonnet 4, Qwen3 | Structured output + tool call | +| Vision agents | GPT-4o, Gemini 2.5 Flash | Vision + tool call + reasoning | +| Customer support | Llama 4 Scout, Qwen3 | Free/cheap + tool call | + +## Related Documentation + +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [Structured Output](structured-output.md) โ€” 829 models with JSON mode +- [OpenAI Alternatives](openai-alternatives.md) โ€” GPT-4 alternatives with agent capabilities +- [Vision 
Models](vision-models.md) โ€” 1,487 models with image understanding +- [Free AI Models](free-models.md) โ€” 81 models at zero cost + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/ai-model-picker.md b/docs/ai-model-picker.md new file mode 100644 index 00000000..e30d73e8 --- /dev/null +++ b/docs/ai-model-picker.md @@ -0,0 +1,64 @@ +# AI Model Picker + +Answer 4 simple questions to find the best AI model for your use case. + +**[Try the interactive picker โ†’](https://i-need-token.github.io/ai-models/ai-model-picker.html)** + +## How It Works + +The AI Model Picker asks you four questions: + +1. **What are you building?** โ€” AI Agents, Code Generation, Chat/RAG, Math & Reasoning, Vision/Multimodal, or High-Volume Production +2. **What's your budget?** โ€” Free, Under $0.10/M tokens, Under $1/M, or Premium +3. **How much context do you need?** โ€” Under 32K, 32Kโ€“128K, 128Kโ€“512K, or 512K+ +4. **What matters most?** โ€” Lowest Cost, Best Quality, Lowest Latency, or Privacy/On-Device + +Based on your answers, the picker scores and ranks all 4,587+ models across 95 providers, filtering by budget and context requirements, then weighting by use case and priority. 
+ +## Scoring Logic + +| Use Case | Key Capabilities | Weight | +| ---------------------- | --------------------------------------------------------- | --------------------------------- | +| AI Agents | Tool Calling (+10), Reasoning (+5) | Cost penalty for expensive models | +| Code Generation | Tool Calling (+8), Reasoning (+5), Structured Output (+3) | โ€” | +| Chat / RAG | Large Context (+5), Tool Calling (+3) | โ€” | +| Math & Reasoning | Reasoning (+10), Tool Calling (+3) | โ€” | +| Vision / Multimodal | Image Input (+10), Tool Calling (+3) | โ€” | +| High-Volume Production | Tool Calling (+5) | Cost penalty scaled 5ร— | + +Aggregator providers (OpenRouter, Requesty, etc.) are excluded to avoid duplicate model entries. + +## Quick Recommendations + +### Best Free Models by Use Case + +| Use Case | Top Pick | Why | +| --------------- | ------------------------ | --------------------------- | +| AI Agents | DeepSeek V4 Flash (Free) | Tool calling + 1M context | +| Code Generation | Qwen3 Coder (Free) | Tool calling + 1M context | +| Chat / RAG | DeepSeek V4 Flash (Free) | 1M context window | +| Reasoning | DeepSeek R1 (Free) | 92% MATH-500, reasoning | +| Vision | โ€” | Limited free vision options | + +### Best Budget Models (Under $0.10/M) + +| Use Case | Top Pick | Price | +| --------------- | -------------- | --------------- | +| AI Agents | ling-2.6-flash | $0.01/$0.03/M | +| Code Generation | bdc-coder | $0.01/$0.01/M | +| Reasoning | qwen3.5-0.8b | $0.01/$0.05/M | +| General | Mistral Nemo | $0.008/$0.001/M | + +## Related Documentation + +- [Free Models](free-models.md) โ€” Complete list of 81 free models +- [Pricing Comparison](pricing-comparison.md) โ€” Compare costs across all providers +- [Tool Calling](tool-calling.md) โ€” 2,350 models with tool calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 reasoning models +- [Context Windows](context-windows.md) โ€” Compare context window sizes +- [Model Selection 
Cheatsheet](model-selection-cheatsheet.md) — Decision tree and budget table +- [Quick Start](quick-start.md) — Get started with the catalog + +## Data Source + +All data is sourced from first-party APIs and official documentation. See [Data Acquisition](data-acquisition.md) for details. diff --git a/docs/api.md b/docs/api.md new file mode 100644 index 00000000..0ba83ea7 --- /dev/null +++ b/docs/api.md @@ -0,0 +1,222 @@ +**English** | [中文](./zh/api.md) + +# API & Programmatic Access + +Use the catalog data in your applications. + +## npm Package + +Install the catalog as an npm dependency: + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types + +// Find models with tool calling under $1/1M input (models without pricing are skipped) +const affordable = catalog.models.filter((m) => m.tool_call && (m.pricing?.input ?? Infinity) < 1); +``` + +The package includes: + +- `dist/models.json` — full catalog as JSON +- `dist/index.d.ts` — TypeScript type definitions +- `types/` — source type definitions (Model, Snapshot, Provider, Pricing) + +## CDN Access (No Install) + +The compiled JSON is available via [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models) — no download or install needed. 
The CDN automatically serves the latest npm release: + +```html + + +``` + +```bash +# Direct curl (always up-to-date; -L follows the GitHub release redirect) +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' + +# Pin to a specific version +curl -sL https://github.com/i-need-token/ai-models/releases/download/v0.1.0/models.json | jq '.stats' +``` + +```python +# Python — no pip install needed +import urllib.request, json +catalog = json.loads(urllib.request.urlopen("https://github.com/i-need-token/ai-models/releases/latest/download/models.json").read()) +print(len(catalog["models"])) # 4587 +``` + +```go +// Go — no dependencies needed +resp, err := http.Get("https://github.com/i-need-token/ai-models/releases/latest/download/models.json") +``` + +### CDN vs GitHub Releases + +| Feature | jsDelivr CDN | GitHub Releases | +| ------------- | -------------------------------------------- | --------------------------------------------- | +| URL stability | `cdn.jsdelivr.net/npm/ai-models@latest/...` | `github.com/.../releases/latest/download/...` | +| CORS | ✅ Yes — works in browsers | ❌ No — download only | +| Caching | 7 days (versioned), 5 min (`@latest`) | No caching | +| Speed | Global CDN, 300+ edge locations | GitHub CDN | +| Best for | Web apps, browser scripts, quick prototyping | CLI tools, CI/CD, batch processing | + +## Compiled JSON + +All model data is available from [GitHub Releases](https://github.com/i-need-token/ai-models/releases/latest) in two formats: + +| File | Format | Size | Best For | +| ------------- | ------ | ------- | ----------------------------------------- | +| `models.json` | JSON | ~2.3 MB | Programmatic access, web apps, TypeScript | +| `models.csv` | CSV | ~560 KB | Excel, Google Sheets, data analysis | +| `stats.json` | JSON | ~1 KB | Catalog statistics summary | + +Also available on [Hugging Face Datasets](https://huggingface.co/datasets/i-need-token/ai-models) for the ML community. 
+ +```bash +# Download JSON (full metadata) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# Download CSV (flat table for spreadsheets) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv + +# Specific version +curl -LO https://github.com/i-need-token/ai-models/releases/download/v0.1.0/models.json +``` + +### Compile Locally + +```bash +npm install +npx tsx scripts/compile.ts +# Output: dist/models.json (2.3 MB) +``` + +### JSON Structure + +```json +{ + "generated_at": "2026-05-21T02:13:04.076Z", + "stats": { + "providers": 95, + "models": 4587, + "unique_model_ids": 2712, + "families": 441 + }, + "providers": { + "openai": { "name": "OpenAI", "model_count": 28 }, + "anthropic": { "name": "Anthropic", "model_count": 11 } + }, + "models": [ + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "family": "gpt-4.1", + "provider": "openai", + "tool_call": true, + "structured_output": true, + "pricing": { "currency": "USD", "input": 2, "output": 8, "cache_read": 0.5 }, + "limit": { "context": 1047576, "output": 32768 }, + "modalities": { "input": ["text", "image"], "output": ["text"] } + } + ] +} +``` + +### Usage Examples + +**JavaScript/TypeScript:** + +```javascript +const catalog = require("./models.json"); + +// Find all models with tool calling under $1/1M input tokens +const cheap = catalog.models.filter( + (m) => m.tool_call && m.pricing?.input < 1 && m.pricing?.currency === "USD", +); + +// Find the cheapest model per provider +const byProvider = {}; +for (const m of catalog.models) { + if (!m.pricing?.input) continue; + if (!byProvider[m.provider] || m.pricing.input < byProvider[m.provider].pricing.input) { + byProvider[m.provider] = m; + } +} + +// Get all vision models +const vision = catalog.models.filter((m) => m.modalities?.input?.includes("image")); +``` + +**Python:** + +```python +import json + +with open("models.json") as f: + catalog = json.load(f) + +# Find all reasoning 
models +reasoning = [m for m in catalog["models"] if m.get("reasoning")] + +# Find models with largest context windows +by_context = sorted( + catalog["models"], + key=lambda m: (m.get("limit", {}) or {}).get("context", 0), + reverse=True, +)[:10] +``` + +## Individual YAML Files + +For type-safe access to individual models, use the YAML files directly with Zod validation: + +```typescript +import { ModelSchema } from "./types/schemas"; +import { parse } from "yaml"; +import { readFileSync } from "fs"; + +const raw = readFileSync("providers/openai/models/gpt-4.1.yaml", "utf-8"); +const model = ModelSchema.parse(parse(raw)); // Runtime-validated + +console.log(model.pricing); // { input: 2, output: 8, cache_read: 0.5 } +``` + +## CLI Tools + +```bash +# Validate all YAML data +npx tsx scripts/validate.ts + +# Compute catalog statistics +npx tsx scripts/stats.ts # table format +npx tsx scripts/stats.ts json # JSON format + +# Compile to models.json +npx tsx scripts/compile.ts + +# Sync data from providers +npx tsx scripts/sync.ts openai # single provider +npx tsx scripts/sync.ts # all providers +``` + +## Related Documentation + +- [Quick Start](quick-start.md) โ€” find the right model in 30 seconds +- [Code Examples](code-examples.md) โ€” TypeScript, Python, Go, Rust, jq +- [Data Schema](data-schema.md) โ€” complete YAML schema reference +- [FAQ](faq.md) โ€” common questions +- [Model Selection Guide](model-selection.md) โ€” decision framework + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/audio-models.md b/docs/audio-models.md new file mode 100644 index 00000000..733db149 --- /dev/null +++ b/docs/audio-models.md @@ -0,0 +1,83 @@ +**English** | [ไธญๆ–‡](./zh/audio-models.md) + +# Audio AI Models โ€” Speech, Voice, and Audio Understanding + +Models with **audio input** (speech recognition, voice understanding) and **audio output** (text-to-speech, voice generation) capabilities. All data sourced from first-party APIs via the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Stats + +| Metric | Count | +| ------------------- | ----- | +| Audio input models | 115 | +| Audio output models | 34 | +| Total audio models | 133 | +| Providers | 20 | +| With tool calling | 69 | +| Free | 8 | + +## Audio Input Models (Speech/Voice Understanding) + +Models that can process audio input โ€” transcribe speech, analyze audio, understand voice commands: + +| Model | Provider | Context | Input $/1M | Output $/1M | Tool Call | +| ------------------------------- | -------------- | ------- | ---------- | ----------- | --------- | +| mistral-voxtral-mini | amazon-bedrock | 125K | $0.04 | $0.04 | | +| voxtral-mini | mistral | 125K | $0.04 | $0.04 | | +| gemini-2.0-flash-lite | google | 1024K | $0.075 | $0.3 | โœ… | +| gemini-2-0-flash-lite | google-vertex | 1024K | $0.075 | $0.3 | โœ… | +| microsoft-phi-4-mini-multimodal | microsoft | 125K | $0.08 | $0.32 | โœ… | +| gemini-2.0-flash | google | 1024K | $0.1 | $0.4 | โœ… | +| gemini-2.5-flash-lite | google | 1024K | $0.1 | $0.4 | โœ… | +| mistral-voxtral-small | amazon-bedrock | 125K | $0.1 | $0.3 | | +| voxtral-small | mistral | 125K | $0.1 | $0.3 | | +| amazon-nova-2.0-lite | amazon | 62K | $0.15 | $1.25 | โœ… | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | โœ… | +| gemini-2-0-flash | google-vertex | 1024K | $0.15 | $0.6 | โœ… | +| voxtral-small-24b-2507 | scaleway | 128K | $0.15 | $0.35 | | +| amazon-nova-2.0-omni | amazon | 62K | $0.2 | $1.3 | โœ… | +| xiaomi--mimo-v2.5 | 
hpc-ai | 1024K | $0.4 | $2 | โœ… | + +## Audio Output Models (Text-to-Speech / Voice Generation) + +Models that can generate audio output โ€” text-to-speech, voice synthesis: + +| Model | Provider | Input $/1M | Output $/1M | +| ---------------------- | -------- | ---------- | ----------- | +| gpt-4o-audio | openai | $2.5 | $10 | +| gpt-4o-realtime | openai | $5 | $20 | +| step-audio-2 | stepfun | $10 | $70 | +| stepaudio-2.5-realtime | stepfun | $10 | $70 | +| o1-realtime | openai | $15 | $60 | +| step-1o-audio | stepfun | $25 | $60 | + +## Free Audio Models + +| Model | Provider | Audio In | Audio Out | Context | +| --------------------------------- | -------- | -------- | --------- | ------- | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | โœ… | โœ… | 64K | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | โœ… | | 64K | +| gemma-3n-E2B-it | google | โœ… | | 128K | +| gemma-3n-E4B-it | google | โœ… | | 128K | +| step-audio-r1.1 | stepfun | โœ… | โœ… | 0 | + +## Choosing an Audio Model + +| Use Case | Recommended | Key Feature | +| ------------------- | ------------------------- | ------------------------- | +| Voice assistants | GPT-4o-audio | Audio in/out + tool call | +| Transcription | Whisper, Gemini 2.5 Flash | Fast, cheap audio input | +| Voice agents | GPT-4o-realtime | Real-time audio streaming | +| Text-to-speech | OpenAI TTS, ElevenLabs | Natural voice output | +| Multilingual speech | Gemini 2.5 Pro | 100+ languages | + +## Related Documentation + +- [Multimodal Models](multimodal-models.md) โ€” 1,519 models with image/audio/video +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling +- [Tool Calling Models](tool-calling.md) โ€” function calling capabilities +- [Free AI Models](free-models.md) โ€” 81 models at zero cost + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context 
windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/benchmarks.md b/docs/benchmarks.md new file mode 100644 index 00000000..d024a867 --- /dev/null +++ b/docs/benchmarks.md @@ -0,0 +1,109 @@ +# AI Model Benchmarks & Leaderboards + +[ไธญๆ–‡](zh/benchmarks.md) + +How AI models are evaluated โ€” key benchmarks, leaderboard landscape, and what the numbers mean for model selection. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Why Benchmarks Matter + +Benchmarks provide standardized ways to compare AI models across tasks. However, no single benchmark tells the whole story. This guide covers the major benchmarks, how to interpret them, and how to use them alongside our catalog data (pricing, context windows, capabilities) for informed model selection. + +## Major Benchmarks + +### General Language Understanding + +| Benchmark | What It Tests | Top Models | Notes | +| --------- | ---------------------------------- | -------------------------------------- | ------------------------------------------------------------- | +| MMLU | Multi-task knowledge (57 subjects) | GPT-4.1, Claude Opus 4, Gemini 2.5 Pro | Standard academic benchmark; may not reflect real-world usage | +| MMLU-Pro | Harder MMLU with reasoning | o3, Claude Sonnet 4, Gemini 2.5 Pro | More challenging version | +| GPQA | Graduate-level science Q&A | o3, Gemini 2.5 Pro | Expert-level reasoning | +| HellaSwag | Common-sense reasoning | Most frontier models near ceiling | Near-saturated | + +### Reasoning & Math + +| Benchmark | What It Tests | Top Models | Notes | +| ------------- | ----------------------- | --------------------------- | -------------------------- | +| MATH-500 | Competition mathematics | o3, DeepSeek R1, Qwen3-235B | Key for quantitative tasks | +| AIME 2024 | Math competition | o3, DeepSeek R1 | Very challenging | +| GSM8K | Grade-school math | Most models >90% | Near-saturated | +| ARC-Challenge | Scientific 
reasoning | Most frontier models | Grade-school science | + +### Coding + +| Benchmark | What It Tests | Top Models | Notes | +| ------------- | ---------------------------- | ------------------------------------- | ----------------------------- | +| HumanEval | Python code generation | Claude Sonnet 4, GPT-4.1, DeepSeek V3 | 164 Python problems | +| SWE-bench | Real GitHub issue resolution | Claude Sonnet 4, o3 | More realistic than HumanEval | +| LiveCodeBench | Continuously updated coding | Various | Avoids data contamination | +| MBPP | Basic Python programming | Most models >80% | Near-saturated | + +### Multimodal + +| Benchmark | What It Tests | Top Models | Notes | +| --------- | ------------------------- | ------------------------------- | ------------------------------- | +| MMMU | Multi-modal understanding | Gemini 2.5 Pro, Claude Sonnet 4 | Images + text | +| MathVista | Visual math reasoning | Gemini 2.5 Pro | Diagrams + math | +| AI2D | Science diagrams | Gemini 2.5 Pro | Scientific figure understanding | +| DocVQA | Document understanding | Gemini 2.5 Pro | Text in images | + +### Tool Use & Agents + +| Benchmark | What It Tests | Top Models | Notes | +| --------- | ------------------------- | ------------------------ | ------------------------------------- | +| BFCL v3 | Function calling accuracy | GPT-4.1, Claude Sonnet 4 | Berkeley Function Calling Leaderboard | +| τ-bench | Agent task completion | Various | Tool-agent-user interaction (retail, airline) | +| WebArena | Web interaction | Various | Realistic web tasks | + +## Key Leaderboards + +| Leaderboard | Focus | URL | +| -------------------- | ------------------------- | ----------------------------------------------------------------------- | +| LMSYS Chatbot Arena | Human preference ranking | https://chat.lmsys.org/ | +| Open LLM Leaderboard | Open-source model ranking | https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard | +| AlpacaEval | Instruction-following | 
https://tatsu-lab.github.io/alpaca_eval/ | +| MT-Bench | Multi-turn conversation | Part of Chatbot Arena | +| BigBench | Beyond basic tasks | https://github.com/google/BIG-bench | +| MTEB | Embedding models | https://huggingface.co/spaces/mteb/leaderboard | + +## How to Use Benchmarks with Our Catalog + +Benchmarks alone are insufficient for model selection. Combine them with our catalog data: + +1. **Start with your use case** โ†’ See [Model Selection Guide](model-selection.md) +2. **Filter by capabilities** โ†’ Tool calling, reasoning, vision, etc. +3. **Check benchmark scores** โ†’ For your specific task domain +4. **Compare pricing** โ†’ Use our [Pricing Comparison](pricing-comparison.md) +5. **Consider context windows** โ†’ See [Context Windows](context-windows.md) +6. **Test with your data** โ†’ Benchmarks are proxies; real performance may differ + +## Benchmark Limitations + +- **Data contamination**: Models may have seen benchmark data during training +- **Task narrowness**: Benchmarks test specific skills, not general utility +- **Leaderboard gaming**: Optimizing for benchmarks can hurt real-world performance +- **Staleness**: Benchmarks age as models improve; saturated benchmarks become uninformative +- **Cultural bias**: Most benchmarks are English-centric and Western-focused +- **Cost blindness**: Benchmarks ignore pricing, latency, and availability + +## Practical Recommendations + +- For **coding**: Use SWE-bench over HumanEval (more realistic) +- For **agents**: Test with your actual tool suite; BFCL is a starting point +- For **reasoning**: MATH-500 and GPQA are more discriminating than MMLU +- For **chat**: Chatbot Arena correlates best with human preference +- For **cost-sensitive**: Use our [Free Models](free-models.md) guide first + +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” Decision framework for choosing models +- [Pricing Comparison](pricing-comparison.md) โ€” Cost analysis across providers +- [Free 
Models](free-models.md) โ€” 81 free models with capabilities +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with extended thinking +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Code Models](code-models.md) โ€” Models optimized for programming +- [Open Weights](open-weights.md) โ€” 527 open-weight models +- [Context Windows](context-windows.md) โ€” Context window comparison +- [Interactive Catalog](https://i-need-token.github.io/ai-models/) โ€” Browse and compare all models diff --git a/docs/cached-pricing.md b/docs/cached-pricing.md new file mode 100644 index 00000000..edfe5629 --- /dev/null +++ b/docs/cached-pricing.md @@ -0,0 +1,245 @@ +# Cached Pricing + +[ไธญๆ–‡](zh/cached-pricing.md) + +AI models with prompt caching support, showing standard vs. cached pricing. Cached inputs can be **50-90% cheaper** than standard input tokens. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Why Cached Pricing Matters + +Prompt caching lets you store repeated prompt prefixes (system prompts, few-shot examples, tool definitions) and reuse them across requests. 
This dramatically reduces: + +- **Cost**: 50-90% savings on input tokens +- **Latency**: Faster time-to-first-token for cached content +- **Throughput**: More efficient use of rate limits + +## Stats + +| Metric | Count | +| ------------------------- | ----- | +| Models with cache pricing | 1374 | +| Providers | 39 | + +## Providers + +`aihubmix`, `aion`, `amazon-bedrock`, `auriko`, `baidu`, `baseten`, `chutes`, `clarifai`, `cloudflare`, `cortecs`, `databricks`, `deepinfra`, `deepseek`, `digitalocean`, `fastrouter`, `friendli`, `google`, `google-vertex`, `groq`, `hpc-ai`, `inception`, `jiekou`, `llmgateway`, `martian`, `minimax`, `moonshotai`, `nanogpt`, `openai`, `openrouter`, `ppio`, `privatemode`, `requesty`, `siliconflow`, `stepfun`, `tencent-tokenhub`, `togetherai`, `upstage`, `venice`, `wafer` + +## Model Pricing + +| Model | Provider | Context | Input $/M | Cache Read $/M | Cache Write $/M | Savings | +| --------------------------------------------- | -------------- | ------- | ------------------- | -------------------- | --------------- | ------- | +| aistudio_gemini-2.0-flash | aihubmix | โ€” | $0.05 | $0.125 | โ€” | -150% | +| aistudio_gpt-4.1-mini | aihubmix | โ€” | $0.2 | $0.05 | โ€” | 75% | +| anthropic-opus-4-6 | aihubmix | โ€” | $2.5 | $0.25 | $3.125 | 90% | +| claude-haiku-4-5 | aihubmix | โ€” | $0.55 | $0.055 | $0.6875 | 90% | +| claude-sonnet-4-0 | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| claude-sonnet-4-5 | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| claude-sonnet-4-5-think | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| codex-mini-latest | aihubmix | โ€” | $0.75 | $0.1875 | โ€” | 75% | +| deepseek-v3.2 | aihubmix | โ€” | $0.151 | $0.0151 | โ€” | 90% | +| deepseek-v3.2-exp | aihubmix | โ€” | $0.137 | $0.0137 | โ€” | 90% | +| deepseek-v3.2-exp-think | aihubmix | โ€” | $0.137 | $0.0137 | โ€” | 90% | +| deepseek-v3.2-think | aihubmix | โ€” | $0.151 | $0.0151 | โ€” | 90% | +| doubao-1.5-lite-32k | aihubmix | โ€” | $0.025 | 
$0.005 | โ€” | 80% | +| doubao-1.5-pro-32k | aihubmix | โ€” | $0.067 | $0.0134 | โ€” | 80% | +| doubao-lite-32k | aihubmix | โ€” | $0.03 | $0.006 | โ€” | 80% | +| doubao-pro-32k | aihubmix | โ€” | $0.07 | $0.014 | โ€” | 80% | +| doubao-seed-1-6 | aihubmix | โ€” | $0.09 | $0.018 | โ€” | 80% | +| doubao-seed-1-6-250615 | aihubmix | โ€” | $0.09 | $0.018 | โ€” | 80% | +| doubao-seed-1-6-flash | aihubmix | โ€” | $0.022 | $0.0044 | โ€” | 80% | +| doubao-seed-1-6-flash-250615 | aihubmix | โ€” | $0.022 | $0.0044 | โ€” | 80% | +| doubao-seed-1-6-lite | aihubmix | โ€” | $0.041 | $0.0082 | โ€” | 80% | +| doubao-seed-1-6-thinking | aihubmix | โ€” | $0.09 | $0.018 | โ€” | 80% | +| doubao-seed-1-6-thinking-250615 | aihubmix | โ€” | $0.09 | $0.018 | โ€” | 80% | +| doubao-seed-1-6-vision-250815 | aihubmix | โ€” | $0.054795 | $0.010959 | โ€” | 80% | +| doubao-seed-1-8 | aihubmix | โ€” | $0.054795 | $0.010959 | โ€” | 80% | +| gemini-2.0-flash | aihubmix | โ€” | $0.05 | $0.0125 | โ€” | 75% | +| gemini-2.0-flash-001 | aihubmix | โ€” | $0.05 | $0.125 | โ€” | -150% | +| gemini-2.0-flash-search | aihubmix | โ€” | $0.05 | $0.0125 | โ€” | 75% | +| gemini-2.5-flash | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-flash-lite | aihubmix | โ€” | $0.05 | $0.005 | โ€” | 90% | +| gemini-2.5-flash-lite-nothink | aihubmix | โ€” | $0.05 | $0.005 | โ€” | 90% | +| gemini-2.5-flash-lite-preview-09-2025 | aihubmix | โ€” | $0.05 | $0.005 | โ€” | 90% | +| gemini-2.5-flash-lite-preview-09-2025-nothink | aihubmix | โ€” | $0.05 | $0.005 | โ€” | 90% | +| gemini-2.5-flash-nothink | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-flash-preview-05-20-nothink | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-flash-preview-05-20-search | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-flash-preview-09-2025 | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-flash-search | aihubmix | โ€” | $0.15 | $0.015 | โ€” | 90% | +| gemini-2.5-pro | aihubmix | โ€” | 
$0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-exp-03-25 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-03-25 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-03-25-search | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-05-06 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-05-06-search | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-06-05 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-preview-06-05-search | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gemini-2.5-pro-search | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| glm-4.5-airx | aihubmix | โ€” | $0.55 | $0.11 | โ€” | 80% | +| glm-4.5-x | aihubmix | โ€” | $1.1 | $0.22 | โ€” | 80% | +| glm-4.6 | aihubmix | โ€” | $0.136987 | $0.027397 | โ€” | 80% | +| glm-4.6v | aihubmix | โ€” | $0.0685 | $0.0137 | โ€” | 80% | +| glm-4.7 | aihubmix | โ€” | $0.136987 | $0.027397 | โ€” | 80% | +| gpt-4.1 | aihubmix | โ€” | $1 | $0.25 | โ€” | 75% | +| gpt-4.1-mini | aihubmix | โ€” | $0.2 | $0.05 | โ€” | 75% | +| gpt-4.1-nano | aihubmix | โ€” | $0.05 | $0.0125 | โ€” | 75% | +| gpt-4o | aihubmix | โ€” | $1.25 | $0.625 | โ€” | 50% | +| gpt-4o-2024-08-06 | aihubmix | โ€” | $1.25 | $0.625 | โ€” | 50% | +| gpt-4o-2024-08-06-global | aihubmix | โ€” | $1.25 | $0.625 | โ€” | 50% | +| gpt-4o-2024-11-20 | aihubmix | โ€” | $1.25 | $0.625 | โ€” | 50% | +| gpt-4o-mini | aihubmix | โ€” | $0.075 | $0.0375 | โ€” | 50% | +| gpt-4o-mini-2024-07-18 | aihubmix | โ€” | $0.075 | $0.0375 | โ€” | 50% | +| gpt-4o-mini-global | aihubmix | โ€” | $0.075 | $0.0375 | โ€” | 50% | +| gpt-4o-mini-search-preview | aihubmix | โ€” | $0.075 | $0.0375 | โ€” | 50% | +| gpt-4o-search-preview | aihubmix | โ€” | $1.25 | $0.625 | โ€” | 50% | +| gpt-5 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5-chat-latest | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5-codex | aihubmix | โ€” | 
$0.625 | $0.0625 | โ€” | 90% | +| gpt-5-mini | aihubmix | โ€” | $0.125 | $0.0125 | โ€” | 90% | +| gpt-5-nano | aihubmix | โ€” | $0.025 | $0.0025 | โ€” | 90% | +| gpt-5.1 | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5.1-chat-latest | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5.1-codex | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5.1-codex-max | aihubmix | โ€” | $0.625 | $0.0625 | โ€” | 90% | +| gpt-5.1-codex-mini | aihubmix | โ€” | $0.125 | $0.0125 | โ€” | 90% | +| gpt-5.2 | aihubmix | โ€” | $0.875 | $0.0875 | โ€” | 90% | +| gpt-5.2-chat-latest | aihubmix | โ€” | $0.875 | $0.0875 | โ€” | 90% | +| gpt-5.2-codex | aihubmix | โ€” | $0.875 | $0.0875 | โ€” | 90% | +| gpt-5.2-high | aihubmix | โ€” | $0.875 | $0.0875 | โ€” | 90% | +| gpt-5.2-low | aihubmix | โ€” | $0.875 | $0.0875 | โ€” | 90% | +| gpt-5.2-pro | aihubmix | โ€” | $10.5 | $1.05 | โ€” | 90% | +| grok-4 | aihubmix | โ€” | $1.65 | $0.4125 | โ€” | 75% | +| grok-4-1-fast-non-reasoning | aihubmix | โ€” | $0.1 | $0.025 | โ€” | 75% | +| grok-4-1-fast-reasoning | aihubmix | โ€” | $0.1 | $0.025 | โ€” | 75% | +| grok-4-fast-non-reasoning | aihubmix | โ€” | $0.1 | $0.025 | โ€” | 75% | +| grok-4-fast-reasoning | aihubmix | โ€” | $0.1 | $0.025 | โ€” | 75% | +| grok-4.20-beta-0309-non-reasoning | aihubmix | โ€” | $1 | $0.1 | โ€” | 90% | +| grok-4.20-beta-0309-reasoning | aihubmix | โ€” | $1 | $0.1 | โ€” | 90% | +| grok-4.20-multi-agent-0309 | aihubmix | โ€” | $1 | $0.1 | โ€” | 90% | +| grok-4.20-multi-agent-beta-0309 | aihubmix | โ€” | $1 | $0.1 | โ€” | 90% | +| grok-code-fast-1 | aihubmix | โ€” | $0.1 | $0.025 | โ€” | 75% | +| kimi-k2-thinking | aihubmix | โ€” | $0.274 | $0.0685 | โ€” | 75% | +| kimi-k2-turbo-preview | aihubmix | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2.5 | aihubmix | โ€” | $0.3 | $0.0525 | โ€” | 82% | +| mimo-v2-flash | aihubmix | โ€” | $0.0959 | $0.01918 | โ€” | 80% | +| mimo-v2-omni | aihubmix | โ€” | $0.22 | $0.044 | โ€” | 80% | +| mimo-v2-pro | aihubmix | โ€” | 
$0.55 | $0.11 | โ€” | 80% | +| nvidia-nemotron-3-super-120b-a12b | aihubmix | โ€” | $0.055 | $0.01375 | โ€” | 75% | +| o1 | aihubmix | โ€” | $7.5 | $3.75 | โ€” | 50% | +| o1-2024-12-17 | aihubmix | โ€” | $7.5 | $3.75 | โ€” | 50% | +| o1-global | aihubmix | โ€” | $7.5 | $3.75 | โ€” | 50% | +| o1-mini | aihubmix | โ€” | $1.5 | $0.75 | โ€” | 50% | +| o1-mini-2024-09-12 | aihubmix | โ€” | $1.5 | $0.75 | โ€” | 50% | +| o1-preview | aihubmix | โ€” | $7.5 | $3.75 | โ€” | 50% | +| o1-preview-2024-09-12 | aihubmix | โ€” | $7.5 | $3.75 | โ€” | 50% | +| o3 | aihubmix | โ€” | $1 | $0.25 | โ€” | 75% | +| o3-deep-research | aihubmix | โ€” | $5 | $1.25 | โ€” | 75% | +| o3-global | aihubmix | โ€” | $1 | $0.25 | โ€” | 75% | +| o3-mini | aihubmix | โ€” | $0.55 | $0.275 | โ€” | 50% | +| o3-mini-global | aihubmix | โ€” | $0.55 | $0.275 | โ€” | 50% | +| o4-mini | aihubmix | โ€” | $0.55 | $0.1375 | โ€” | 75% | +| qwen-plus | aihubmix | โ€” | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-2025-04-28 | aihubmix | โ€” | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-2025-07-28 | aihubmix | โ€” | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-latest | aihubmix | โ€” | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-turbo | aihubmix | โ€” | $0.023 | $0.0046 | โ€” | 80% | +| qwen-turbo-latest | aihubmix | โ€” | $0.023 | $0.0046 | โ€” | 80% | +| qwen3-coder-plus | aihubmix | โ€” | $0.27 | $0.054 | โ€” | 80% | +| qwen3-max | aihubmix | โ€” | $0.2254 | $0.04508 | $0.28175 | 80% | +| qwen3-max-2026-01-23 | aihubmix | โ€” | $0.2254 | $0.04508 | $0.28175 | 80% | +| qwen3-max-preview | aihubmix | โ€” | $0.423 | $0.0846 | โ€” | 80% | +| qwen3-vl-flash | aihubmix | โ€” | $0.0103 | $0.00206 | โ€” | 80% | +| qwen3-vl-plus | aihubmix | โ€” | $0.0685 | $0.0137 | โ€” | 80% | +| zai-glm-5-turbo | aihubmix | โ€” | $0.6 | $0.12 | โ€” | 80% | +| aion-2.0 | aion | โ€” | $0.7999999999999999 | $0.19999999999999998 | โ€” | 75% | +| aion-2.5 | aion | โ€” | $1 | $0.35 | โ€” | 65% | +| 
amazon-nova-2-lite | amazon-bedrock | โ€” | $0.33 | $0.0825 | โ€” | 75% | +| amazon-nova-lite | amazon-bedrock | โ€” | $0.06 | $0.015 | โ€” | 75% | +| amazon-nova-micro | amazon-bedrock | โ€” | $0.035 | $0.00875 | โ€” | 75% | +| amazon-nova-premier | amazon-bedrock | โ€” | $2.5 | $0.625 | โ€” | 75% | +| amazon-nova-pro | amazon-bedrock | โ€” | $0.8 | $0.2 | โ€” | 75% | +| claude-haiku-4-5-20251001 | auriko | โ€” | $1 | $0.1 | $1.25 | 90% | +| claude-opus-4-1-20250805 | auriko | โ€” | $15 | $1.5 | $18.75 | 90% | +| claude-opus-4-20250514 | auriko | โ€” | $15 | $1.5 | $18.75 | 90% | +| claude-opus-4-5-20251101 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-opus-4-6 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-opus-4-7 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-sonnet-4-20250514 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| claude-sonnet-4-5-20250929 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| claude-sonnet-4-6 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| deepseek-r1-0528 | auriko | โ€” | $0.5 | $0.35 | โ€” | 30% | +| deepseek-v3-0324 | auriko | โ€” | $0.2 | $0.135 | โ€” | 32% | +| deepseek-v3.1 | auriko | โ€” | $0.21 | $0.13 | โ€” | 38% | +| deepseek-v3.1-terminus | auriko | โ€” | $0.27 | $0.13 | โ€” | 52% | +| deepseek-v3.2 | auriko | โ€” | $0.26 | $0.13 | โ€” | 50% | +| deepseek-v4-flash | auriko | โ€” | $0.14 | $0.0028 | โ€” | 98% | +| deepseek-v4-pro | auriko | โ€” | $0.435 | $0.003625 | โ€” | 99% | +| gemini-2.5-flash | auriko | โ€” | $0.3 | $0.03 | โ€” | 90% | +| gemini-2.5-flash-lite | auriko | โ€” | $0.1 | $0.01 | โ€” | 90% | +| gemini-2.5-pro | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gemini-3-flash-preview | auriko | โ€” | $0.5 | $0.05 | โ€” | 90% | +| gemini-3.1-flash-lite | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gemini-3.1-flash-lite-preview | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gemini-3.1-pro-preview | auriko | โ€” | $2 | $0.2 | โ€” | 90% | +| gemini-3.1-pro-preview-customtools | auriko | โ€” | $2 | 
$0.2 | โ€” | 90% | +| gemini-flash-latest | auriko | โ€” | $0.5 | $0.05 | โ€” | 90% | +| gemini-flash-lite-latest | auriko | โ€” | $0.1 | $0.01 | โ€” | 90% | +| gemini-pro-latest | auriko | โ€” | $2 | $0.2 | โ€” | 90% | +| glm-4.5 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.5-air | auriko | โ€” | $0.2 | $0.03 | โ€” | 85% | +| glm-4.5-airx | auriko | โ€” | $1.1 | $0.22 | โ€” | 80% | +| glm-4.5-x | auriko | โ€” | $2.2 | $0.45 | โ€” | 80% | +| glm-4.5v | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.6 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.6v | auriko | โ€” | $0.3 | $0.05 | โ€” | 83% | +| glm-4.6v-flashx | auriko | โ€” | $0.04 | $0.004 | โ€” | 90% | +| glm-4.7 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.7-flashx | auriko | โ€” | $0.07 | $0.01 | โ€” | 86% | +| glm-5 | auriko | โ€” | $1 | $0.2 | โ€” | 80% | +| glm-5-turbo | auriko | โ€” | $1.2 | $0.24 | โ€” | 80% | +| glm-5.1 | auriko | โ€” | $1.4 | $0.26 | โ€” | 81% | +| glm-5v-turbo | auriko | โ€” | $1.2 | $0.24 | โ€” | 80% | +| gpt-4.1-2025-04-14 | auriko | โ€” | $2 | $0.5 | โ€” | 75% | +| gpt-4.1-mini-2025-04-14 | auriko | โ€” | $0.4 | $0.1 | โ€” | 75% | +| gpt-4.1-nano-2025-04-14 | auriko | โ€” | $0.1 | $0.025 | โ€” | 75% | +| gpt-4o-2024-08-06 | auriko | โ€” | $2.5 | $1.25 | โ€” | 50% | +| gpt-4o-2024-11-20 | auriko | โ€” | $2.5 | $1.25 | โ€” | 50% | +| gpt-4o-mini-2024-07-18 | auriko | โ€” | $0.15 | $0.075 | โ€” | 50% | +| gpt-5-2025-08-07 | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5-chat-latest | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5-mini-2025-08-07 | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gpt-5-nano-2025-08-07 | auriko | โ€” | $0.05 | $0.005 | โ€” | 90% | +| gpt-5.1-2025-11-13 | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5.1-chat-latest | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5.2-2025-12-11 | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| gpt-5.2-chat-latest | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| 
gpt-5.3-chat-latest | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| gpt-5.4-2026-03-05 | auriko | โ€” | $2.5 | $0.25 | โ€” | 90% | +| gpt-5.4-mini-2026-03-17 | auriko | โ€” | $0.75 | $0.075 | โ€” | 90% | +| gpt-5.4-nano-2026-03-17 | auriko | โ€” | $0.2 | $0.02 | โ€” | 90% | +| gpt-5.5-2026-04-23 | auriko | โ€” | $5 | $0.5 | โ€” | 90% | +| gpt-oss-120b | auriko | โ€” | $0.15 | $0.01 | โ€” | 93% | +| gpt-oss-20b | auriko | โ€” | $0.07 | $0.04 | โ€” | 43% | +| grok-4.20-0309-non-reasoning | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| grok-4.20-0309-reasoning | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| grok-4.3 | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| hy3-preview | auriko | โ€” | $0.066 | $0.029 | โ€” | 56% | +| kimi-k2-0711-preview | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-0905-preview | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-thinking | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-thinking-turbo | auriko | โ€” | $1.15 | $0.15 | โ€” | 87% | + +> ๐Ÿ“„ Showing first 200 of 1374 models. Use the [interactive catalog](https://i-need-token.github.io/ai-models/) to browse all. + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
+ +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” cost optimization tips +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Free AI Models](free-models.md) โ€” 81 free models +- [Context Window Comparison](context-windows.md) โ€” largest context windows +- [Open-Weight Models](open-weights.md) โ€” 527 models you can run yourself diff --git a/docs/chat-models.md b/docs/chat-models.md new file mode 100644 index 00000000..e4bdd4cd --- /dev/null +++ b/docs/chat-models.md @@ -0,0 +1,99 @@ +# Chat Models + +[ไธญๆ–‡](zh/chat-models.md) + +AI models with **tool calling** support โ€” the essential capability for building chat-based applications, AI assistants, and conversational agents. These models can understand natural language, generate responses, and invoke external tools. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Why Chat Models Matter + +Chat models are the backbone of modern AI applications: + +- **Conversational AI** โ€” natural language dialogue with context +- **AI Assistants** โ€” task-oriented chat with tool use +- **Customer Support** โ€” automated support with knowledge base access +- **Content Generation** โ€” writing, summarization, translation +- **Data Analysis** โ€” natural language queries over structured data + +Tool calling is the key differentiator โ€” it allows models to go beyond text generation and take actions in the real world. 
+ +## Stats + +| Metric | Count | +| ------------------------------- | ----- | +| Chat models (with tool calling) | 2350 | +| Providers | 71 | +| Free chat models | 54 | +| Open-weight chat models | 278 | +| With reasoning | 1080 | +| With structured output | 758 | + +## Providers + +`01ai`, `302ai`, `aihubmix`, `aimlapi`, `alibaba`, `amazon`, `amazon-bedrock`, `anthropic`, `arcee`, `auriko`, `baidu`, `baseten`, `berget`, `bytedance`, `cerebras`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `cortecs`, `databricks`, `deepseek`, `digitalocean`, `dinference`, `evroc` and 46 more + +## Free Chat Models + +Free models with tool calling โ€” zero-cost chat applications. + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ---------------------------------------------------- | ---------- | ------- | --------- | ---------- | ------------ | +| openrouter--owl-alpha | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| deepseek--deepseek-v4-flash--free | openrouter | 1M | Free | Free | ๐Ÿง  | +| qwen--qwen3-coder--free | openrouter | 1M | Free | Free | | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| arcee-ai--trinity-large-thinking--free | openrouter | 262K | Free | Free | ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-31b-it | auriko | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | ๐Ÿง  | + +## Cheapest Chat Models + +Best value chat models for production. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ------------------------------------------- | ------------ | ------- | --------- | ---------- | ------------ | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ“‹ | +| bdc-coder | inferencenet | 131K | $0.01 | $0.01 | ๐Ÿ”“ | +| inclusionai--ling-2.6-flash | openrouter | 262K | $0.01 | $0.03 | ๐Ÿ“‹ | +| ling-2.6-flash | inclusionai | 262K | $0.01 | $0.03 | | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿง  | +| qwen3-vl-flash-2026-01-22 | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ“‹ | +| qwen3-vl-flash | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ“‹ | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | 131K | $0.015 | $0.02 | | +| granite-4.0-h-micro | cloudflare | 131K | $0.017 | $0.112 | ๐Ÿ”“ | +| llama-3.1-8b-instruct | cortecs | 0 | $0.018 | $0.054 | ๐Ÿง  | + +## Largest Context Chat Models + +Chat models with the largest context windows โ€” for long conversations and document analysis. + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ---------------------------- | ---------- | ------- | --------- | ---------- | ------------ | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | ๐Ÿ“‹ | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | ๐Ÿ“‹ | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | | + +## Related Documentation + +- [Agentic Models](agentic-models.md) โ€” 1,080 models with tool calling + reasoning +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with reasoning +- [Code Models](code-models.md) โ€” 189 code-focused models 
+- [Free AI Models](free-models.md) — 81 free models by capability +- [Structured Output](structured-output.md) — 829 JSON-mode models +- [Model Selection Guide](model-selection.md) — decision framework +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/code-examples.md b/docs/code-examples.md new file mode 100644 index 00000000..662fb2cd --- /dev/null +++ b/docs/code-examples.md @@ -0,0 +1,371 @@ +# Code Examples + +**English** | [中文](./zh/code-examples.md) + +Practical code examples for working with the AI Models Catalog data in multiple languages. + +## Download the Data + +```bash +# JSON — full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV — flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +Or use the [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models) (no download needed, CORS-enabled): + +```bash +# Always up-to-date, works in browsers (-L follows the release download redirect) +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +``` + +## TypeScript / JavaScript + +### Install the npm package + +```bash +npm install ai-models +``` + +### Basic usage + +```typescript +import catalog from "ai-models"; +import type { Model } from "ai-models"; + +// Total number of models +console.log(`Total models: ${catalog.models.length}`); + +// Find models by provider +const openaiModels = catalog.models.filter((m) => m.provider === "openai"); +console.log(`OpenAI models: ${openaiModels.length}`); +``` + +### Find the cheapest tool-calling models + +```typescript +import catalog from "ai-models"; + +const affordable = catalog.models + 
.filter((m) => m.tool_call && m.pricing?.input && m.pricing.input < 1) + .sort((a, b) => a.pricing.input - b.pricing.input) + .slice(0, 10); + +for (const m of affordable) { + console.log(`${m.name}: $${m.pricing.input}/1M input, $${m.pricing.output}/1M output`); +} +``` + +### Find models with the largest context windows + +```typescript +import catalog from "ai-models"; + +const largest = catalog.models + .filter((m) => m.limit?.context) + .sort((a, b) => b.limit.context - a.limit.context) + .slice(0, 10); + +for (const m of largest) { + console.log(`${m.name}: ${(m.limit.context / 1_000_000).toFixed(1)}M context`); +} +``` + +### Find free models with vision + +```typescript +import catalog from "ai-models"; + +const freeVision = catalog.models.filter( + (m) => m.pricing?.unit === "free" && m.modalities?.input?.includes("image"), +); + +console.log(`Free vision models: ${freeVision.length}`); +for (const m of freeVision) { + console.log(`- ${m.name} (${m.provider})`); +} +``` + +## Python + +### Using the JSON data + +```python +import json +import urllib.request + +# Download the latest data +url = "https://github.com/i-need-token/ai-models/releases/latest/download/models.json" +urllib.request.urlretrieve(url, "models.json") + +with open("models.json") as f: + catalog = json.load(f) + +print(f"Total models: {len(catalog['models'])}") +``` + +### Find reasoning models under $5/1M output + +```python +reasoning_cheap = [ + m for m in catalog["models"] + if m.get("reasoning") + and m.get("pricing", {}).get("output") + and m["pricing"]["output"] < 5 +] + +for m in sorted(reasoning_cheap, key=lambda x: x["pricing"]["output"]): + print(f"{m['name']}: ${m['pricing']['output']}/1M output") +``` + +### Using pandas with the CSV + +```python +import pandas as pd + +df = pd.read_csv("https://github.com/i-need-token/ai-models/releases/latest/download/models.csv") + +# Filter and sort +tool_calling = df[df["tool_call"] == True].sort_values("pricing_input") 
+print(tool_calling[["name", "provider", "pricing_input", "pricing_output"]].head(10)) +``` + +### Find open-weight models with tool calling + +```python +open_tool = [ + m for m in catalog["models"] + if m.get("open_weights") and m.get("tool_call") +] + +print(f"Open-weight models with tool calling: {len(open_tool)}") +for m in open_tool[:10]: + print(f" - {m['name']} ({m['provider']})") +``` + +## Go + +```go +package main + +import ( + "encoding/json" + "fmt" + "net/http" +) + +type Catalog struct { + Models []Model `json:"models"` +} + +type Model struct { + ID string `json:"id"` + Name string `json:"name"` + Provider string `json:"provider"` + ToolCall bool `json:"tool_call"` + Pricing Pricing `json:"pricing"` +} + +type Pricing struct { + Input float64 `json:"input"` + Output float64 `json:"output"` +} + +func main() { + resp, err := http.Get("https://github.com/i-need-token/ai-models/releases/latest/download/models.json") + if err != nil { + panic(err) + } + defer resp.Body.Close() + + var catalog Catalog + json.NewDecoder(resp.Body).Decode(&catalog) + + fmt.Printf("Total models: %d\n", len(catalog.Models)) + + // Find tool-calling models under $1/1M input + for _, m := range catalog.Models { + if m.ToolCall && m.Pricing.Input > 0 && m.Pricing.Input < 1 { + fmt.Printf("%s: $%.2f/1M input\n", m.Name, m.Pricing.Input) + } + } +} +``` + +## Rust + +```rust +use serde::Deserialize; + +#[derive(Deserialize)] +struct Catalog { + models: Vec<Model>, +} + +#[derive(Deserialize)] +struct Model { + id: String, + name: String, + provider: String, + #[serde(default)] + tool_call: bool, + pricing: Option<Pricing>, +} + +#[derive(Deserialize)] +struct Pricing { + input: f64, + output: f64, +} + +fn main() -> Result<(), Box<dyn std::error::Error>> { + let data = reqwest::blocking::get( + "https://github.com/i-need-token/ai-models/releases/latest/download/models.json" + )?.text()?; + + let catalog: Catalog = serde_json::from_str(&data)?; + println!("Total models: {}", catalog.models.len()); + + // Find tool-calling 
models + let tool_calling: Vec<_> = catalog.models.iter() + .filter(|m| m.tool_call) + .collect(); + + println!("Tool-calling models: {}", tool_calling.len()); + Ok(()) +} +``` + +## Shell / jq + +```bash +# Download the data +curl -sLO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# Count total models +jq '.models | length' models.json + +# Find all OpenAI models +jq '.models[] | select(.provider == "openai") | .name' models.json + +# Find the cheapest models with tool calling +jq '[.models[] | select(.tool_call == true and .pricing.input != null)] | sort_by(.pricing.input) | .[:5] | .[] | {name, provider, input: .pricing.input}' models.json + +# Find free models +jq '[.models[] | select(.pricing.unit == "free")] | length' models.json + +# List all providers +jq '.providers | keys' models.json +``` + +## Excel / Google Sheets + +1. Download the CSV: `https://github.com/i-need-token/ai-models/releases/latest/download/models.csv` +2. Open in Excel or import into Google Sheets +3. Use filters to find models by provider, capability, or price range + +## Common Queries + +### Find the best model for coding + +```typescript +import catalog from "ai-models"; + +const codingModels = catalog.models.filter( + (m) => + m.tool_call && + m.structured_output && + (m.limit?.context ?? 0) >= 128000 && + m.pricing?.input && + m.pricing.input <= 5, +); + +// Sort by context window (descending), then price (ascending) +codingModels.sort((a, b) => { + const ctxDiff = (b.limit?.context ?? 0) - (a.limit?.context ?? 0); + if (ctxDiff !== 0) return ctxDiff; + return (a.pricing?.input ?? 0) - (b.pricing?.input ?? 0); +}); +``` + +### Compare pricing across providers for the same model family + +```typescript +import catalog from "ai-models"; + +// Group by family +const families = new Map(); +for (const m of catalog.models) { + if (!m.family) continue; + const list = families.get(m.family) ?? 
[]; + list.push(m); + families.set(m.family, list); +} + +// Find families available on multiple providers +for (const [family, models] of families) { + const providers = new Set(models.map((m) => m.provider)); + if (providers.size > 1) { + console.log(`\n${family}:`); + for (const m of models) { + console.log(` ${m.provider}: $${m.pricing?.input}/1M in, $${m.pricing?.output}/1M out`); + } + } +} +``` + +### Build a model selector for your app + +```typescript +import catalog from "ai-models"; +import type { Model } from "ai-models"; + +interface ModelRequirements { + toolCall?: boolean; + vision?: boolean; + reasoning?: boolean; + structuredOutput?: boolean; + minContext?: number; + maxInputPrice?: number; + maxOutputPrice?: number; + openWeights?: boolean; + provider?: string; +} + +function findModels(req: ModelRequirements): Model[] { + return catalog.models.filter((m) => { + if (req.toolCall && !m.tool_call) return false; + if (req.vision && !m.modalities?.input?.includes("image")) return false; + if (req.reasoning && !m.reasoning) return false; + if (req.structuredOutput && !m.structured_output) return false; + if (req.minContext && (m.limit?.context ?? 0) < req.minContext) return false; + if (req.maxInputPrice && (m.pricing?.input ?? Infinity) > req.maxInputPrice) return false; + if (req.maxOutputPrice && (m.pricing?.output ?? 
Infinity) > req.maxOutputPrice) return false; + if (req.openWeights && !m.open_weights) return false; + if (req.provider && m.provider !== req.provider) return false; + return true; + }); +} + +// Example: Find a cheap vision model with tool calling +const results = findModels({ + vision: true, + toolCall: true, + maxInputPrice: 1, + maxOutputPrice: 5, +}); +``` + +## Related Documentation + +- [API & Programmatic Access](api.md) โ€” npm, CDN, CSV, GitHub Action +- [Quick Start](quick-start.md) โ€” find the right model in 30 seconds +- [Data Schema](data-schema.md) โ€” complete YAML schema reference +- [FAQ](faq.md) โ€” common questions +- [Glossary](glossary.md) โ€” key terms and definitions + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/code-models.md b/docs/code-models.md new file mode 100644 index 00000000..05c7828f --- /dev/null +++ b/docs/code-models.md @@ -0,0 +1,61 @@ +**English** | [ไธญๆ–‡](./zh/code-models.md) + +# Code AI Models โ€” 189 Models for Code Generation & Understanding + +Models optimized for **code generation, code review, debugging, and software engineering** tasks. All data sourced from first-party APIs via the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Stats + +| Metric | Count | +| ------------------- | ----- | +| Code-focused models | 0 | +| Providers | 0 | +| With tool calling | 0 | +| With reasoning | 0 | +| With vision | 0 | +| Free | 0 | +| Open weights | 0 | + +## Cheapest Code Models (Direct Providers) + +| Model | Provider | Context | Input $/1M | Output $/1M | Reasoning | +| ----- | -------- | ------- | ---------- | ----------- | --------- | + +## Code Models with Reasoning (Best for Complex Tasks) + +| Model | Provider | Context | Input $/1M | Output $/1M | Tool Call | +| ----- | -------- | ------- | ---------- | ----------- | --------- | + +## Free Code Models + +| Model | Provider | Context | Reasoning | Tool Call | +| ----- | -------- | ------- | --------- | --------- | + +## Largest Context Code Models + +| Model | Provider | Context | Input $/1M | Output $/1M | +| ----- | -------- | ------- | ---------- | ----------- | + +## Choosing a Code Model + +| Use Case | Recommended | Why | +| ------------ | -------------------------- | --------------------- | +| Autocomplete | Qwen2.5-Coder, DeepSeek V3 | Fast, cheap | +| Code review | Claude Sonnet 4, GPT-4.1 | Reasoning + tool call | +| Bug fixing | DeepSeek R1, Claude Opus 4 | Deep reasoning | +| Refactoring | Gemini 2.5 Pro | Large context | +| Code agents | Claude Sonnet 4, GPT-4.1 | Tool call + reasoning | +| Self-hosted | Qwen2.5-Coder, Llama 4 | Open weights | + +## Related Documentation + +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Agentic Models](agentic-models.md) โ€” 1,080 models for AI agents +- [OpenAI Alternatives](openai-alternatives.md) โ€” GPT-4 alternatives +- [Free AI Models](free-models.md) โ€” 81 models at zero cost +- [Open-Weight Models](open-weights.md) โ€” 527 models with open weights + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with 
pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/context-windows.md b/docs/context-windows.md new file mode 100644 index 00000000..83f50239 --- /dev/null +++ b/docs/context-windows.md @@ -0,0 +1,77 @@ +**English** | [ไธญๆ–‡](./zh/context-windows.md) + +# Context Window Comparison + +Which models have the largest context windows? This page lists models by context window size and pricing. + +> For the full list, download [models.json](https://github.com/i-need-token/ai-models/releases/latest) or browse `providers/`. + +## Context Window Distribution + +| Tier | Models | Description | +| ---------------- | -----: | ---------------------------------------------------------- | +| 1M+ tokens | 391 | Can process entire books, codebases, or long conversations | +| 256Kโ€“1M tokens | 459 | Large documents, multi-turn conversations | +| 128Kโ€“256K tokens | 1,310 | Standard long-context, most modern models | +| 32Kโ€“128K tokens | 194 | Medium-length documents | +| 8Kโ€“32K tokens | 97 | Short documents, single-turn queries | +| <8K tokens | 19 | Legacy models, very short inputs | + +## Largest Context Windows (1M+ tokens) + +| Model | Provider | Context | Input $/1M | Output $/1M | Tool Call | Reasoning | +| ----------------------------- | ------------- | ------- | ---------: | ----------: | --------- | --------- | +| Llama 4 Scout | Meta | 10M | โ€” | โ€” | โœ… | โŒ | +| Llama 4 Scout | OpenRouter | 10M | $0.08 | $0.30 | โœ… | โŒ | +| Gemini 3 Pro Preview | Google | 2M | $2.00 | $12.00 | โœ… | โŒ | +| Gemini 3.1 Flash Lite Preview | Google | 2M | $0.25 | $1.50 | โœ… | โŒ | +| Gemini 3.1 Pro Preview | Google | 2M | $2.00 | $12.00 | โœ… | โŒ | +| Grok 4 Fast Reasoning | xAI | 2M | $0.20 | $0.50 | โœ… | โœ… | +| GPT-4.1 | OpenAI | ~1M | $2.00 | $8.00 | โœ… | โŒ | +| Gemini 2.5 Pro | Google | 1M | $1.25 | $10.00 | โœ… | โœ… | +| Gemini 2.5 Flash | Google | 1M | $0.15 | $0.60 | โœ… | โœ… | +| Llama 4 Maverick | Meta | 1M 
| — | — | ✅ | ❌ | +| Qwen3-235B-A22B | Alibaba Cloud | 128K\* | ¥1.00 | ¥4.00 | ✅ | ✅ | +| DeepSeek-V3 | DeepSeek | 128K | $0.27 | $1.10 | ✅ | ❌ | + +\*Note: Some models have different context limits on different platforms. Check the specific provider's YAML file for exact values. + +## Best Value per Context Tier + +### 1M+ tokens (cheapest) + +| Model | Provider | Input $/1M | Output $/1M | +| ---------------- | ----------- | -----------------: | ----------: | +| Llama 4 Scout | OpenRouter | $0.08 | $0.30 | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | +| Llama 4 Scout | Together AI | $0.15 | $0.60 | +| Llama 4 Scout | Meta | Free (open-weight) | — | + +### 128K–256K tokens (cheapest) + +| Model | Provider | Input $/1M | Output $/1M | +| ------------- | ------------- | ---------: | ----------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-30B-A3B | Alibaba Cloud | ¥0.10 | ¥0.30 | +| Phi-4 | Microsoft | $0.10 | $0.40 | +| Gemma 3 27B | Google | $0.20 | $0.80 | + +## Key Takeaways + +- **Llama 4 Scout** has the largest context window at **10M tokens** — 5x larger than the next-largest window listed here (2M tokens) +- **1M+ context** is now available from 6+ providers, including free open-weight models +- **128K context** is the most common tier (1,310 models) — sufficient for most use cases +- **Cost scales with context**: 1M+ context models cost 2–10x more per token than 128K models +- **Cache read pricing** can reduce costs significantly for repeated queries (up to 90% discount) + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — large context model recommendations +- [Pricing Comparison](pricing-comparison.md) — side-by-side pricing across providers +- [Free AI Models](free-models.md) — 81 free models by context window +- [Vision Models](vision-models.md) — 1,487 vision models with context info +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching + +--- + +Data sourced from [AI Models 
Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/data-acquisition.md b/docs/data-acquisition.md index 1cb80259..28a8ca6a 100644 --- a/docs/data-acquisition.md +++ b/docs/data-acquisition.md @@ -256,3 +256,15 @@ Providers that host and serve models produced by others. They are added **after 2. Updates the YAML file directly 3. Sets `last_updated` to current date 4. Validates with `npm run validate` + +## Related Documentation + +- [Data Schema](data-schema.md) — complete YAML schema reference +- [Design Principles](lessons-learned.md) — lessons learned +- [Provider Overview](providers.md) — all 95 providers +- [FAQ](faq.md) — common questions +- [Contributing](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) — how to contribute + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/data-schema.md b/docs/data-schema.md new file mode 100644 index 00000000..0fb1dc0d --- /dev/null +++ b/docs/data-schema.md @@ -0,0 +1,221 @@ +**English** | [中文](./zh/data-schema.md) + +# Data Schema Reference + +Complete reference for the YAML data schema used in this catalog. All model data files conform to the TypeScript types in [`types/`](../types/) and are validated at runtime by Zod schemas in [`types/schemas.ts`](../types/schemas.ts). + +## Model Schema + +Every model is a single YAML file at `providers/<provider>/models/<model-id>.yaml`. 
+ +### Required Fields + +| Field | Type | Description | Example | +| -------------- | ------- | ---------------------------------------- | ------------------------------------------ | +| `id` | string | Stable model ID (no date suffix) | `gpt-4o`, `claude-sonnet-4-5` | +| `name` | string | Display name | `GPT-4o`, `Claude Sonnet 4.5` | +| `family` | string | Model family (broad lineage) | `gpt-4o`, `claude-sonnet` | +| `pricing` | Pricing | Model pricing (see below) | โ€” | +| `modalities` | object | Input/output modalities | `{ input: [text, image], output: [text] }` | +| `last_updated` | string | Last data update (YYYY-MM-DD or YYYY-MM) | `2024-08-06` | + +### Optional Fields + +| Field | Type | Default | Description | Example | +| ------------------- | ------- | ------- | -------------------------------- | ------------------------------------ | +| `reasoning` | boolean | `false` | Supports reasoning/thinking mode | `true` | +| `temperature` | boolean | `true` | Supports temperature parameter | `false` | +| `tool_call` | boolean | `false` | Supports tool/function calling | `true` | +| `attachment` | boolean | `false` | Supports file attachments | `true` | +| `structured_output` | boolean | `false` | Supports structured/JSON output | `true` | +| `open_weights` | boolean | `false` | Open-weight model | `true` | +| `deprecated` | boolean | `false` | Deprecated but still accessible | `true` | +| `limit` | object | โ€” | Token limits | `{ context: 128000, output: 16384 }` | +| `limit.context` | number | โ€” | Context window size (tokens) | `128000` | +| `limit.output` | number | โ€” | Max output tokens | `16384` | +| `knowledge` | string | โ€” | Training data cutoff | `2023-10` | +| `release_date` | string | โ€” | Model release date | `2024-05-13` | +| `snapshots` | array | โ€” | Dated model versions | See below | + +### Modality Types + +| Modality | Description | +| -------- | --------------------- | +| `text` | Text input or output | +| `image` | Image input or 
output | +| `video` | Video input | +| `audio` | Audio input or output | +| `pdf` | PDF document input | + +## Pricing Schema + +Pricing is a union of four types. Each model uses exactly one. + +### TokenPricing (most common) + +Per-million-token pricing. Currency defaults to USD, unit defaults to `per_mtok`. + +```yaml +pricing: + currency: USD # optional, defaults to USD + unit: per_mtok # optional, defaults to per_mtok + input: 2.5 # $/M input tokens + output: 10 # $/M output tokens + cache_write: 1.25 # optional, $/M cache write + cache_read: 0.625 # optional, $/M cache read +``` + +**Advanced: Tiered pricing by context length** + +```yaml +pricing: + input: + - up_to: 128000 # โ‰ค 128K context + price: 2.5 + - price: 5.0 # > 128K context (no up_to = final tier) + output: 10 +``` + +**Advanced: Per-modality pricing** + +```yaml +pricing: + input: + text: 1.25 + image: 2.5 + audio: 5.0 + output: + text: 5.0 + audio: 10.0 +``` + +### VideoPricing + +Per-second pricing, optionally tiered by resolution. + +```yaml +pricing: + currency: USD + unit: per_second + price: 0.03 # fixed price per second +``` + +```yaml +pricing: + unit: per_second + price: # per-resolution pricing + 720p: 0.02 + 1080p: 0.03 + 4k: 0.05 +``` + +### UnitPricing + +Per-image or per-request pricing. + +```yaml +pricing: + unit: per_image + price: 0.04 +``` + +```yaml +pricing: + unit: per_request + price: 0.005 +``` + +### FreePricing + +No cost. + +```yaml +pricing: + unit: free +``` + +## Snapshot Schema + +Snapshots represent dated versions of a model. They inherit all parent fields and only override what differs. + +```yaml +id: gpt-4o +name: GPT-4o +# ... parent fields ... 
+snapshots: + - id: gpt-4o-2024-08-06 # newest first + last_updated: "2024-08-06" + - id: gpt-4o-2024-05-13 + deprecated: true # this snapshot is deprecated + last_updated: "2024-05-13" +``` + +A snapshot can override any optional field from the parent: + +```yaml +snapshots: + - id: gemini-2.0-flash-exp + limit: + context: 1048576 # different context window + output: 8192 + pricing: + unit: free # experimental = free +``` + +## Provider Schema + +Each provider has a `provider.yaml` file at `providers//provider.yaml`. + +| Field | Type | Required | Description | Example | +| ---------------- | ------ | -------- | ------------------------------------ | ---------------------------------- | +| `id` | string | โœ… | Provider ID (matches directory name) | `openai` | +| `name` | string | โœ… | Display name | `OpenAI` | +| `url` | string | โœ… | Official website URL | `https://openai.com` | +| `api_docs` | string | โŒ | API documentation URL | `https://platform.openai.com/docs` | +| `apis` | object | โœ… | API endpoints keyed by format | See below | +| `apis.openai` | string | โŒ | OpenAI-compatible API endpoint | `https://api.openai.com/v1` | +| `apis.anthropic` | string | โŒ | Anthropic API endpoint | โ€” | +| `apis.google` | string | โŒ | Google AI API endpoint | โ€” | +| `currency` | string | โŒ | Default currency (USD/CNY/EUR) | `USD` | + +### API Formats + +| Format | Description | Used by | +| ----------- | -------------------------------------- | ----------------- | +| `openai` | OpenAI-compatible chat completions API | Most providers | +| `anthropic` | Anthropic Messages API | Anthropic | +| `google` | Google Generative AI API | Google, Vertex AI | + +## Currency Reference + +| Currency | Code | Used by | +| ------------ | ----- | -------------------------------------------- | +| US Dollar | `USD` | Most providers (default) | +| Chinese Yuan | `CNY` | Alibaba, 302.AI, AIHubMix, PPIO, etc. | +| Euro | `EUR` | Berget, CloudFerro, OVHcloud, Scaleway, etc. 
| + +## Validation + +All YAML files are validated against Zod schemas at runtime: + +```bash +# Validate all model data +npx tsx scripts/validate.ts + +# Validate a specific provider +npx tsx scripts/validate.ts openai +``` + +The validation uses `ModelSchema` from [`types/schemas.ts`](../types/schemas.ts), which mirrors the TypeScript types exactly. Any YAML file that doesn't conform to the schema will produce a validation error with the specific field path and issue. + +## Related Documentation + +- [Data Acquisition](data-acquisition.md) โ€” how we acquire and update data +- [API & Programmatic Access](api.md) โ€” npm, CDN, CSV access +- [Code Examples](code-examples.md) โ€” practical code examples +- [Design Principles](lessons-learned.md) โ€” lessons learned +- [FAQ](faq.md) โ€” common questions + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/embedding-models.md b/docs/embedding-models.md new file mode 100644 index 00000000..bce44d64 --- /dev/null +++ b/docs/embedding-models.md @@ -0,0 +1,71 @@ +# Embedding Models + +[ไธญๆ–‡](zh/embedding-models.md) + +AI models that generate **vector embeddings** โ€” numerical representations of text, images, and other data. Essential for semantic search, RAG (Retrieval-Augmented Generation), clustering, and similarity tasks. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Why Embedding Models Matter + +Embedding models are the foundation of many AI systems: + +- **Semantic Search** — find relevant documents by meaning, not keywords +- **RAG** — retrieve context for LLMs to generate grounded answers +- **Clustering** — group similar items together +- **Similarity** — find duplicates, recommendations, and related content +- **Classification** — zero-shot and few-shot classification via embeddings + +## Stats + +| Metric | Count | +| ---------------------------- | ----- | +| Embedding models | 5 | +| Providers | 3 | +| Free embedding models | 0 | +| Open-weight embedding models | 1 | + +## Providers + +`openai`, `tencent`, `upstage` + +## Free Embedding Models + +Free embedding models — zero-cost semantic search and RAG. + +| Model | Provider | Context | Input $/M | +| ----- | -------- | ------- | --------- | + +## Cheapest Embedding Models + +Best value embedding models for production. + +| Model | Provider | Context | Input $/M | Open weights | +| ----------------------- | -------- | ------- | --------- | --- | +| text-embedding-3-small | openai | 8K | $0.02 | | +| solar-embedding-1-large | upstage | 0 | $0.1 | 🔓 | +| text-embedding-ada-002 | openai | 8K | $0.1 | | +| text-embedding-3-large | openai | 8K | $0.13 | | +| hunyuan-embedding | tencent | 0 | $0.7 | | + +## Largest Context Embedding Models + +Embedding models with the largest context windows — for embedding long documents. 
+ +| Model | Provider | Context | Input $/M | Open weights | +| ---------------------- | -------- | ------- | --------- | --- | +| text-embedding-ada-002 | openai | 8K | $0.1 | | +| text-embedding-3-small | openai | 8K | $0.02 | | +| text-embedding-3-large | openai | 8K | $0.13 | | + +## Related Documentation + +- [Free AI Models](free-models.md) — 81 free models by capability +- [Open Weights](open-weights.md) — 527 open-weight models +- [Model Selection Guide](model-selection.md) — decision framework +- [API Reference](api.md) — programmatic access +- [Quick Start](quick-start.md) — get started in 5 minutes + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/faq.md b/docs/faq.md new file mode 100644 index 00000000..52535794 --- /dev/null +++ b/docs/faq.md @@ -0,0 +1,114 @@ +# Frequently Asked Questions + +[中文](zh/faq.md) + +## General + +### What is AI Models Catalog? + +AI Models Catalog is a structured YAML catalog of AI model metadata from 95+ providers. It includes pricing, context windows, modalities, capabilities, and more — all sourced from first-party APIs and official documentation. + +### How is this different from other model directories? + +- **First-party data only** — all data comes directly from provider APIs and official docs, not third-party aggregators +- **Structured YAML** — machine-readable with TypeScript types and Zod validation +- **Comprehensive metadata** — pricing, context windows, modalities, capabilities, snapshots +- **Programmatic access** — npm package, CDN, GitHub Action, CSV export +- **Open source** — community-driven with automated scraping + +### How often is the data updated? + +Data is synced weekly via automated CI workflows. 
Provider APIs are scraped on a Monday cron schedule, and the npm package is automatically published when new releases are created. + +## Access & Usage + +### How do I get the data? + +There are several ways: + +| Method | Use Case | +| ------------------------------------------------------------------------------------- | ------------------------------ | +| `npm install ai-models` | TypeScript/JavaScript projects | +| `curl -sLO https://github.com/i-need-token/ai-models/releases/latest/download/models.json` | Quick access from any language | +| GitHub Action | CI/CD pipelines | +| CSV download | Excel, data analysis | +| Hugging Face dataset | ML workflows | + +See [Quick Start](quick-start.md) for detailed instructions. + +### Is the data free to use? + +Yes! The catalog data is released under the MIT License. You can use it in commercial and non-commercial projects without restriction. + +### How accurate is the pricing data? + +Pricing data is sourced directly from each provider's official API and documentation. However, providers may change pricing without notice. Always verify critical pricing decisions against the provider's own website. + +## Technical + +### Why YAML instead of JSON? + +YAML supports comments, is more human-readable for manual editing, and allows snapshot inheritance within a model file. The data is compiled to JSON for programmatic consumption. + +### What is snapshot inheritance? + +Within a single model file, snapshots inherit fields from their parent model and only override what differs. This keeps model files DRY without cross-model inheritance. + +### How do I validate my YAML files? + +```bash +# Using the built-in validator +npx tsx scripts/validate.ts + +# Using the JSON Schema +npx ajv validate -s schema.json -d providers/openai/models/gpt-4o.yaml +``` + +### Can I use this in my CI/CD pipeline? + +Yes! 
Use the reusable GitHub Action: + +```yaml +- uses: i-need-token/ai-models@v1 + with: + format: json + filter: "[?tool_call && open_weights]" +``` + +See [API Documentation](api.md) for details. + +## Contributing + +### How do I add a new provider? + +See [Contributing Guide](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) for step-by-step instructions. In short: + +1. Create `providers/<provider>/provider.yaml` +2. Create `providers/<provider>/scrape.ts` with a `scrape()` function +3. Run `npx tsx scripts/validate.ts` to verify + +### How do I report incorrect data? + +Open a [Data Update issue](https://github.com/i-need-token/ai-models/issues/new?template=data_update.md) with the provider name, model ID, and what needs correcting. + +### Can I help without writing code? + +Absolutely! You can: + +- ⭐ Star the repo to help others discover it +- 📢 Share it with your network +- 🐛 Report data issues or bugs +- 📖 Improve documentation +- 🏷️ Suggest new providers to add + +--- + +More questions? [Open an issue](https://github.com/i-need-token/ai-models/issues/new) or start a [discussion](https://github.com/i-need-token/ai-models/discussions). + +## Related Documentation + +- [Quick Start](quick-start.md) — find the right model in 30 seconds +- [API & Programmatic Access](api.md) — npm, CDN, CSV access +- [Glossary](glossary.md) — key terms and definitions +- [Data Schema](data-schema.md) — complete YAML schema +- [Model Selection Guide](model-selection.md) — decision framework diff --git a/docs/free-models.md b/docs/free-models.md new file mode 100644 index 00000000..c69b1131 --- /dev/null +++ b/docs/free-models.md @@ -0,0 +1,124 @@ +**English** | [中文](./zh/free-models.md) + +# Free AI Models + +81 models in this catalog are free to use. This page lists them by capability so you can find the right free model for your project. + +> All data sourced from first-party APIs and documentation. 
Free tiers may have rate limits โ€” check the provider's website for details. + +## Quick Stats + +| Capability | Free Models | +| ------------------------- | ----------: | +| Total free models | 81 | +| With tool calling | 45 | +| With reasoning | 11 | +| With vision (image input) | 17 | + +## Free Models with Tool Calling + +These models support function/tool calling at no cost โ€” ideal for building AI agents and automation: + +| Model | Provider | Context | Vision | +| ------------------------------ | -------- | ------- | ------ | +| gemini-2.0-flash | Google | 1M | โœ… | +| gemini-2.5-flash-preview-05-20 | Google | 1M | โœ… | +| gemma-3-27b-it | Chutes | 128K | โœ… | +| qwen3-235b-a22b | Chutes | 128K | โœ… | +| qwen3-30b-a3b | Chutes | 128K | โœ… | +| qwen3-4b | Chutes | 128K | โœ… | +| deepseek-r1 | Chutes | 128K | โŒ | +| deepseek-v3-0324 | Chutes | 128K | โŒ | +| llama-4-maverick | Chutes | 1M | โœ… | +| llama-4-scout | Chutes | 10M | โœ… | +| llama-3.3-70b-instruct | Chutes | 128K | โŒ | +| qwen2.5-72b-instruct | Chutes | 128K | โŒ | +| mistral-small-3.1-24b-instruct | Chutes | 128K | โœ… | +| phi-4 | Chutes | 16K | โŒ | +| command-r | Chutes | 128K | โŒ | + +## Free Models with Reasoning + +These models support chain-of-thought reasoning at no cost: + +| Model | Provider | Context | +| ------------------------------ | -------- | ------- | +| gemini-2.5-flash-preview-05-20 | Google | 1M | +| deepseek-r1 | Chutes | 128K | +| deepseek-r1-0528 | Chutes | 128K | +| qwen3-235b-a22b | Chutes | 128K | +| qwen3-30b-a3b | Chutes | 128K | +| qwen3-4b | Chutes | 128K | +| gemma-3-27b-it | Chutes | 128K | +| phi-4-reasoning | Chutes | 32K | + +## Free Models with Vision + +These models accept image input at no cost: + +| Model | Provider | Context | +| ------------------------------ | -------- | ------- | +| gemini-2.0-flash | Google | 1M | +| gemini-2.5-flash-preview-05-20 | Google | 1M | +| gemma-3-27b-it | Chutes | 128K | +| qwen3-235b-a22b | Chutes | 128K | 
+| llama-4-maverick | Chutes | 1M | +| llama-4-scout | Chutes | 10M | +| mistral-small-3.1-24b-instruct | Chutes | 128K | + +## Free Models by Provider + +### Google (via AI Studio) + +Google offers free access to Gemini models through AI Studio with rate limits: + +- gemini-2.0-flash โ€” 1M context, tool calling, vision, reasoning +- gemini-2.5-flash-preview-05-20 โ€” 1M context, tool calling, vision, reasoning + +### Chutes + +Chutes provides free community-hosted inference for open-weight models: + +- 70+ free models including Llama 4, Qwen3, DeepSeek-R1, Gemma 3, Mistral, Phi-4 +- Largest free model: Llama 4 Scout (10M context) +- Best free reasoning: DeepSeek-R1, Qwen3-235B-A22B + +### Cloudflare Workers AI + +Cloudflare offers free inference on edge for select models: + +- Various small and medium models with rate limits +- Edge deployment for low latency + +### Cerebras + +Cerebras offers free tier for some models with rate limits: + +- Fast inference using CS-3 wafer-scale engine + +### Groq + +Groq offers free tier for some models with rate limits: + +- Ultra-fast inference using LPU acceleration + +## Key Takeaways + +- **Google AI Studio** offers the best free models overall โ€” 1M context, tool calling, vision, and reasoning +- **Chutes** has the largest selection of free models โ€” 70+ including all major open-weight models +- **Llama 4 Scout** on Chutes offers the largest free context window at 10M tokens +- Free tiers typically have rate limits (requests per minute) โ€” check provider docs for specifics +- For production use, consider upgrading to paid tiers for reliability and higher rate limits + +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” decision framework for choosing models +- [Open-Weight Models](open-weights.md) โ€” 527 models you can run yourself +- [Cached Pricing](cached-pricing.md) โ€” 1,374 models with prompt caching +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with tool calling +- 
[Reasoning Models](reasoning-models.md) โ€” 1,306 models with reasoning +- [OpenAI Alternatives](openai-alternatives.md) โ€” free GPT-4 alternatives + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/glossary.md b/docs/glossary.md new file mode 100644 index 00000000..e830f4f0 --- /dev/null +++ b/docs/glossary.md @@ -0,0 +1,83 @@ +# Glossary + +[ไธญๆ–‡](zh/glossary.md) + +A quick reference for terms used throughout the AI Models Catalog. + +## Model Properties + +| Term | Definition | +| -------------- | --------------------------------------------------------------------------------------------------------------------------------------------- | +| **Model ID** | The stable, unique identifier for a model (e.g., `gpt-4.1`, `claude-sonnet-4`). No date suffix, no aliases. | +| **Family** | A group of related models sharing the same architecture or brand (e.g., `gpt-4.1` family includes `gpt-4.1`, `gpt-4.1-mini`, `gpt-4.1-nano`). | +| **Snapshot** | A dated version of a model, nested within the parent model file. Inherits all parent fields and only overrides what differs. | +| **Deprecated** | A model still listed in the provider's API but no longer recommended for new projects. Marked with `deprecated: true`. | +| **Retired** | A model completely removed from the provider's API. Excluded from the catalog. | + +## Capabilities + +| Term | Definition | +| --------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| **Tool calling** | The model can invoke external tools/functions during generation (e.g., web search, calculator, API calls). Also known as "function calling". 
| +| **Structured output** | The model can generate responses in a specific format (typically JSON) conforming to a provided schema. Also known as "JSON mode". | +| **Reasoning** | The model uses chain-of-thought or extended thinking to solve complex problems step-by-step before producing a final answer. | +| **Open weights** | The model's weights are publicly available, allowing you to run it on your own infrastructure. Not all open-weight models are truly "open source" โ€” check the license. | + +## Modalities + +| Term | Definition | +| ------------------------ | ------------------------------------------------------------------------------------------------ | +| **Text input** | The model accepts text prompts as input. | +| **Text output** | The model generates text as output. | +| **Image input (Vision)** | The model can process images as part of the input. Also known as "vision" or "multimodal input". | +| **Image output** | The model can generate images (e.g., DALLยทE, Imagen). Also known as "image generation". | +| **Audio input** | The model can process audio files or speech as input. | +| **Audio output** | The model can generate audio or speech as output (e.g., TTS models). | +| **Video input** | The model can process video files as input. | +| **Video output** | The model can generate video as output. | +| **Embedding output** | The model produces vector embeddings rather than text, used for similarity search and retrieval. | + +## Pricing + +| Term | Definition | +| --------------------- | ---------------------------------------------------------------------------------------------------------- | +| **Input price** | Cost per million input tokens, in USD (or CNY/EUR for some providers). | +| **Output price** | Cost per million output tokens, in USD (or CNY/EUR for some providers). | +| **Cache read price** | Discounted price for reading from a previously cached prompt. Typically 50-90% cheaper than regular input. 
| +| **Cache write price** | Price for writing a prompt to the provider's cache. Some providers charge this separately. | +| **Free** | The model has zero cost for both input and output tokens. May have rate limits. | +| **Token** | A unit of text processing. Approximately 4 characters or 0.75 words in English. | + +## Context & Limits + +| Term | Definition | +| ------------------ | ------------------------------------------------------------------------------------------------------------------------------------- | +| **Context window** | Maximum number of tokens the model can process in a single request (input + output combined in some providers, input-only in others). | +| **Output limit** | Maximum number of tokens the model can generate in a single response. | +| **Rate limit** | Maximum number of requests or tokens per minute/hour, set by the provider. Not included in the catalog (check provider docs). | + +## Data & Architecture + +| Term | Definition | +| ------------------------ | ----------------------------------------------------------------------------------------------------------------------------------- | +| **YAML** | The source format for all model data. Human-readable, supports comments, and allows snapshot inheritance. | +| **Snapshot inheritance** | Within a model file, snapshots inherit all fields from the parent model and only override what differs. No cross-model inheritance. | +| **First-party data** | Data sourced directly from the provider's own API or official documentation, never from third-party aggregators. | +| **Zod schema** | Runtime validation schema used to ensure all YAML model files conform to the expected structure. | +| **models.json** | The compiled JSON output containing all models, generated from YAML source files. Available via npm, CDN, and GitHub Releases. | + +--- + +See [Data Schema Reference](data-schema.md) for the complete YAML field specification. 
+ +## Related Documentation + +- [FAQ](faq.md) — common questions +- [Data Schema](data-schema.md) — complete YAML schema reference +- [Quick Start](quick-start.md) — find the right model in 30 seconds +- [Model Comparison](model-comparison.md) — compare models +- [Modality Matrix](modality-matrix.md) — all modalities at a glance + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/image-generation.md b/docs/image-generation.md new file mode 100644 index 00000000..a50cbbfc --- /dev/null +++ b/docs/image-generation.md @@ -0,0 +1,70 @@ +**English** | [中文](./zh/image-generation.md) + +# AI Image Generation Models + +28 models in this catalog can generate images (image output modality). This page covers text-to-image, image editing, and multimodal generation models. + +> All data sourced from first-party APIs and documentation. "Image output" means the model generates images as part of its response. 
+ +## Quick Stats + +| Capability | Image Gen Models | +| ----------------------------- | ---------------: | +| Total image generation models | 28 | +| Unique model IDs | 19 | +| With reasoning | 5 | +| With tool calling | 1 | +| Free to use | 9 | + +## All Image Generation Models + +| Model | Input | Output $/1M | Context | Reasoning | Free Tier | +| ------------------------------ | ------------------------- | ----------: | ------- | --------- | --------- | +| DALLยทE 3 | text | โ€” | โ€” | โŒ | โœ… | +| Imagen 4.0 Fast | text, image | โ€” | โ€” | โŒ | โœ… | +| Imagen 4.0 | text, image | โ€” | โ€” | โŒ | โœ… | +| Image 01 | text, image | โ€” | โ€” | โŒ | โœ… | +| Image 01 Live | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 1X Edit | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 1X Medium | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 2X Large | text, image | โ€” | โ€” | โŒ | โœ… | +| Step Image Edit 2 | text, image | โ€” | โ€” | โŒ | โœ… | +| Gemini 2.5 Flash Image | text, image | $0.039 | 33K | โŒ | โŒ | +| Gemini 3.1 Flash Image Preview | text, image | $1.50 | 66K | โœ… | โŒ | +| Gemini 3 Pro Image Preview | text, image | $12.00 | 131K | โœ… | โŒ | +| GPT-5 Image Mini | text, image, PDF | $2.00 | 400K | โœ… | โŒ | +| GPT-5 Image | text, image, PDF | $10.00 | 400K | โœ… | โŒ | +| GPT-5.4 Image 2 | text, image, PDF | $15.00 | 272K | โœ… | โŒ | +| Amazon Nova 2.0 Omni | text, image, audio, video | $1.30 | 64K | โœ… | โŒ | + +## Best Value Image Generation + +| Use Case | Best Model | Why | +| ---------------------------------- | ----------------------------------- | --------------------------------------- | +| **Free text-to-image** | DALLยทE 3, Imagen 4.0 | Zero cost, high quality | +| **Free image editing** | Step 1X Edit, Step Image Edit 2 | Edit existing images at no cost | +| **Cheapest API** | Gemini 2.5 Flash Image | $0.039/1M output tokens | +| **Best quality** | GPT-5.4 Image 2, Gemini 3 Pro Image | State-of-the-art generation | +| 
**Multimodal (audio+video+image)** | Amazon Nova 2.0 Omni | Only model with all modalities | +| **Large context** | GPT-5 Image Mini | 400K context for complex prompts | +| **Reasoning + generation** | GPT-5 Image Mini | $2.50/1M input, 400K context, reasoning | + +## Key Takeaways + +- **9 free image generation models** — DALL·E 3, Imagen 4.0, Step models, and more +- **Gemini 2.5 Flash Image** is the cheapest API option at $0.039/1M output tokens +- **GPT-5 Image Mini** offers the best combination of reasoning + generation + large context +- **Amazon Nova 2.0 Omni** is the only image generation model that also accepts audio and video input +- Most image generation models accept both text and image input (for editing/reference) + +## Related Documentation + +- [Vision Models](vision-models.md) — 1,487 vision models +- [Video Models](video-models.md) — 167 video input/output models +- [Modality Matrix](modality-matrix.md) — all modalities at a glance +- [Model Selection Guide](model-selection.md) — decision framework +- [Free AI Models](free-models.md) — 81 free models + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/images/actions-demo.png b/docs/images/actions-demo.png new file mode 100644 index 00000000..e068fd8e Binary files /dev/null and b/docs/images/actions-demo.png differ diff --git a/docs/images/ai-models-landscape.png b/docs/images/ai-models-landscape.png new file mode 100644 index 00000000..4e182cca Binary files /dev/null and b/docs/images/ai-models-landscape.png differ diff --git a/docs/images/calculator-screenshot.png b/docs/images/calculator-screenshot.png new file mode 100644 index 00000000..de1afc20 Binary files /dev/null and b/docs/images/calculator-screenshot.png differ diff --git a/docs/images/catalog-dark.png b/docs/images/catalog-dark.png new file mode 100644 index 00000000..f035da69 Binary files /dev/null and b/docs/images/catalog-dark.png differ diff --git a/docs/images/catalog-demo.gif b/docs/images/catalog-demo.gif new file mode 100644 index 00000000..832ffd88 Binary files /dev/null and b/docs/images/catalog-demo.gif differ diff --git a/docs/images/catalog-light.png b/docs/images/catalog-light.png new file mode 100644 index 00000000..9a6a5f0a Binary files /dev/null and b/docs/images/catalog-light.png differ diff --git a/docs/images/catalog-screenshot.png b/docs/images/catalog-screenshot.png new file mode 100644 index 00000000..de1afc20 Binary files /dev/null and b/docs/images/catalog-screenshot.png differ diff --git a/docs/images/picker-screenshot.png b/docs/images/picker-screenshot.png new file mode 100644 index 00000000..77e7f31b Binary files /dev/null and b/docs/images/picker-screenshot.png differ diff --git a/docs/large-context-models.md b/docs/large-context-models.md new file mode 100644 index 00000000..c45dc882 --- /dev/null +++ b/docs/large-context-models.md @@ -0,0 +1,112 @@ +# Large Context Models + +[ไธญๆ–‡](zh/large-context-models.md) + +AI models with **128K+ token context windows** โ€” process entire codebases, long documents, and multi-hour conversations in a single request. 
+ +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Why Large Context Matters + +Large context windows unlock capabilities impossible with smaller models: + +- **Full codebase analysis** โ€” understand entire repositories in one prompt +- **Document processing** โ€” analyze 100+ page PDFs without chunking +- **Multi-turn conversations** โ€” maintain context across long chat sessions +- **Data analysis** โ€” process large datasets in a single request +- **Legal/medical review** โ€” review lengthy contracts and medical records +- **Content creation** โ€” maintain consistency across long-form writing + +## Stats + +| Metric | Count | +| ---------------------------- | ----- | +| Large context models (128K+) | 2195 | +| 256K+ context | 861 | +| 1M+ context | 397 | +| Providers | 78 | +| Free large context models | 51 | +| With tool calling | 1637 | + +## Providers + +`302ai`, `ai21`, `aimlapi`, `aion`, `alibaba`, `amazon`, `amazon-bedrock`, `anthropic`, `arcee`, `auriko`, `baichuan`, `baidu`, `baseten`, `bytedance`, `cerebras`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `databricks`, `deepinfra`, `deepseek`, `digitalocean`, `dinference`, `evroc` and 53 more + +## Largest Context Windows + +Models with the biggest context windows available. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ------------------------------ | ---------- | ------- | --------- | ---------- | ------------ | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | ๐Ÿ”ง | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | ๐Ÿ”ง ๐Ÿ“‹ | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ”ง | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ”ง | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | ๐Ÿ”ง | +| x-ai--grok-4.1-fast | fastrouter | 2M | $0.2 | $0.5 | ๐Ÿ”ง | +| xai--grok-4-fast-reasoning | aimlapi | 2M | $0.52 | $1.3 | ๐Ÿ”ง | +| xai--grok-4-fast-non-reasoning | aimlapi | 2M | $0.52 | $1.3 | ๐Ÿ”ง | +| grok-4-20-multi-agent | venice | 2M | $1.42 | $2.83 | ๐Ÿง  ๐Ÿ“‹ | +| grok-4-20 | venice | 2M | $1.42 | $2.83 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | + +## Cheapest 1M+ Context Models + +Best value models with 1M+ token context โ€” for processing very long inputs. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| --------------------------------- | ------------- | ------- | --------- | ---------- | ------------ | +| gemini-1.5-flash-8b | deepinfra | 1M | $0.0375 | $0.15 | | +| gpt-5-nano | meganova | 1M | $0.04 | $0.32 | ๐Ÿ”ง | +| qwen--qwen3.5-flash-02-23 | openrouter | 1M | $0.065 | $0.26 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemini-2.0-flash-lite-001 | openrouter | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| google--gemini-2.0-flash-lite-001 | fastrouter | 1M | $0.075 | $0.3 | ๐Ÿ”ง | +| gemini-1.5-flash | deepinfra | 1M | $0.075 | $0.3 | | +| gemini-2.0-flash-lite | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-1.5-flash | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-1.5-flash-8b | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-2-0-flash-lite | google-vertex | 1M | $0.075 | $0.3 | ๐Ÿ”ง | + +## Free Large Context Models + +Free models with 128K+ context โ€” zero-cost long document processing. + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ---------------------------------------- | ---------- | ------- | --------- | ---------- | ------------ | +| openrouter--owl-alpha | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿ“‹ | +| deepseek--deepseek-v4-flash--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| google--lyria-3-clip-preview | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| google--lyria-3-pro-preview | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| qwen--qwen3-coder--free | openrouter | 1M | Free | Free | ๐Ÿ”ง | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| arcee-ai--trinity-large-thinking--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | + +## Context Window Tiers + +| Tier | 
Context | Use Case | Example Models | +| -------- | ------- | ------------------------------ | ------------------------- | +| Standard | 128K | Long documents, code files | gpt-4.1, claude-sonnet-4 | +| Extended | 256K | Codebases, multi-file analysis | claude-opus-4, o3 | +| Ultra | 1M | Full repositories, books | gemini-2.5-flash, gpt-4.1 | +| Massive | 10M | Entire datasets, video | llama-4-scout | + +## Related Documentation + +- [Context Windows](context-windows.md) โ€” detailed context window comparison +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling +- [Code Models](code-models.md) โ€” 189 code-focused models +- [Free AI Models](free-models.md) โ€” 81 free models by capability +- [Model Selection Guide](model-selection.md) โ€” decision framework +- [Migration Guide](migration-guide.md) โ€” switching providers +- [Provider Comparison](provider-comparison.md) โ€” top 30 providers + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/lessons-learned.md b/docs/lessons-learned.md index 1ebea94a..9fe44211 100644 --- a/docs/lessons-learned.md +++ b/docs/lessons-learned.md @@ -298,3 +298,15 @@ Platforms like OpenRouter and nano-gpt are router/aggregators that don't produce - **nano-gpt**: Public API for model list + JS bundle for per-token USD pricing (555 models). These are treated as inference platforms, not rejected as "just routers", because they provide verifiable first-party per-token pricing data. 
+ +## Related Documentation + +- [Data Acquisition](data-acquisition.md) — how we acquire and update data +- [Data Schema](data-schema.md) — complete YAML schema reference +- [Provider Overview](providers.md) — all 95 providers +- [FAQ](faq.md) — common questions +- [Contributing](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) — how to contribute + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/migration-guide.md b/docs/migration-guide.md new file mode 100644 index 00000000..21f9760b --- /dev/null +++ b/docs/migration-guide.md @@ -0,0 +1,100 @@ +# Migration Guide: Switching AI Model Providers + +[中文](zh/migration-guide.md) + +A practical guide for switching between AI model providers — compare pricing, capabilities, and context windows to find the best alternative for your use case. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Why Switch Providers? 
+ +- **Cost savings** — some providers offer the same models at 2-10× lower prices +- **Better capabilities** — newer models may offer tool calling, reasoning, or vision +- **Larger context** — process more data in a single request +- **Reliability** — reduce dependency on a single provider +- **Compliance** — data residency rules may require specific providers + +## Major Provider Comparison + +| Provider | Models | Cheapest Input $/M | Largest Context | Tool Calling | Reasoning | +| --------- | ------ | -----------------: | --------------- | ------------ | --------- | +| openai | 28 | $0.02 | 1047576 | 18 | 8 | +| anthropic | 11 | $1 | 1000000 | 11 | 11 | +| google | 21 | $0.075 | 2097152 | 8 | 2 | +| deepseek | 4 | $0.14 | 1000000 | 4 | 3 | +| meta | 12 | $0.1 | 10000000 | 9 | 0 | +| mistral | 16 | $0.04 | 256000 | 12 | 1 | +| xai | 6 | $0.2 | 131072 | 6 | 5 | +| alibaba | 62 | $0.15 | 1000000 | 62 | 52 | + +## Common Migration Paths + +### OpenAI → Cheaper Alternatives + +| OpenAI Model | Cheapest Alternative | Provider | Input $/M | Savings | +| -------------------- | -------------------- | --------- | --------- | ------- | +| gpt-4.1 ($2) | gpt-4.1-mini | openai | $0.40 | 80% | +| gpt-4.1-mini ($0.40) | gpt-4.1-nano | openai | $0.10 | 75% | +| o4-mini ($1.10) | deepseek-r1 | deepseek | $0.55 | 50% | +| gpt-4.1 ($2) | claude-haiku-4 | anthropic | $1 | 50% | +| gpt-4.1 ($2) | gemini-2.5-flash | google | $0.15 | 93% | + +### Anthropic → Cheaper Alternatives + +| Anthropic Model | Cheapest Alternative | Provider | Input $/M | Savings | +| -------------------- | -------------------- | -------- | --------- | ------- | +| claude-opus-4 ($15) | o4-mini | openai | $1.10 | 93% | +| claude-sonnet-4 ($3) | gemini-2.5-flash | google | $0.15 | 95% | +| claude-sonnet-4 ($3) | deepseek-chat | deepseek | $0.14 | 95% | +| claude-haiku-4 ($1) | gemini-2.5-flash | google | $0.15 | 85% | + +### Google → Cheaper Alternatives + +| Google Model | Cheapest 
Alternative | Provider | Input $/M | Savings | +| ---------------------- | -------------------- | -------- | --------- | ------- | +| gemini-2.5-pro ($1.25) | gemini-2.5-flash | google | $0.15 | 88% | +| gemini-2.5-pro ($1.25) | deepseek-chat | deepseek | $0.14 | 89% | + +## Migration Checklist + +When switching providers, verify these compatibility points: + +- [ ] **API format** โ€” OpenAI-compatible vs proprietary API +- [ ] **Model names** โ€” different providers use different model IDs +- [ ] **Tool calling format** โ€” function calling syntax varies +- [ ] **Streaming** โ€” SSE vs WebSocket vs HTTP streaming +- [ ] **Rate limits** โ€” requests per minute, tokens per minute +- [ ] **Context window** โ€” may differ from original provider +- [ ] **Modalities** โ€” vision, audio, video support varies +- [ ] **Structured output** โ€” JSON mode availability +- [ ] **Prompt caching** โ€” can reduce costs 50-90% +- [ ] **Data residency** โ€” where is data processed and stored + +## OpenAI-Compatible Providers + +These providers offer OpenAI-compatible APIs โ€” minimal code changes needed: + +| Provider | Base URL | Notes | +| ----------- | ------------------------------- | --------------------------- | +| openrouter | `openrouter.ai/api/v1` | Aggregator, 356+ models | +| deepinfra | `api.deepinfra.com/v1` | Focus on open-source models | +| togetherai | `api.together.xyz/v1` | Open-source model hosting | +| groq | `api.groq.com/openai/v1` | Ultra-fast inference | +| cerebras | `api.cerebras.ai/v1` | Fastest inference speed | +| fireworks | `api.fireworks.ai/inference/v1` | Serverless model hosting | +| siliconflow | `api.siliconflow.cn/v1` | China-focused provider | + +## Related Documentation + +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Model Selection Guide](model-selection.md) โ€” decision framework for choosing models +- [Free AI Models](free-models.md) โ€” 81 free models by capability +- [Cached 
Pricing](cached-pricing.md) โ€” 1,374 models with prompt caching +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling +- [Agentic Models](agentic-models.md) โ€” 1,080 models with tool calling + reasoning +- [API Reference](api.md) โ€” programmatic access to model data +- [OpenAI Alternatives](openai-alternatives.md) โ€” GPT-4/GPT-3.5 alternatives with pricing + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/modality-matrix.md b/docs/modality-matrix.md new file mode 100644 index 00000000..9fc5a5fb --- /dev/null +++ b/docs/modality-matrix.md @@ -0,0 +1,106 @@ +**English** | [ไธญๆ–‡](./zh/modality-matrix.md) + +# Modality Matrix + +Which models support vision, audio, image generation, and video? This page lists the top models for each modality. + +> For the full list, browse the `providers/` directory or download [models.json](https://github.com/i-need-token/ai-models/releases/latest). + +## Vision (Image Input) + +1,487 models accept images as input. 
Here are the most capable flagships: + +| Model | Provider | Context | Input $/1M | Output $/1M | +| ---------------- | ------------- | ------- | ---------: | ----------: | +| GPT-4.1 | OpenAI | 1M | $2.00 | $8.00 | +| Claude Opus 4 | Anthropic | 200K | $15.00 | $75.00 | +| Gemini 2.5 Pro | Google | 1M | $1.25 | $10.00 | +| Qwen3-235B-A22B | Alibaba Cloud | 128K | ¥1.00 | ¥4.00 | +| DeepSeek-V3 | DeepSeek | 128K | $0.27 | $1.10 | +| Llama 4 Maverick | Meta | 1M | — | — | +| Mistral Large | Mistral | 128K | $2.00 | $6.00 | +| Grok 3 | xAI | 131K | $3.00 | $15.00 | + +**Cheapest vision models (USD unless marked ¥, which is CNY):** + +| Model | Provider | Input $/1M | Output $/1M | +| ------------- | ------------- | ---------: | ----------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-30B-A3B | Alibaba Cloud | ¥0.10 | ¥0.30 | +| Llama 4 Scout | Together AI | $0.15 | $0.60 | +| Gemma 3 27B | Google | $0.20 | $0.80 | +| Phi-4 | Microsoft | $0.10 | $0.40 | + +## Image Output (Image Generation) + +28 models can generate images: + +| Model | Provider | Type | +| -------------------- | ----------------- | ----------------------- | +| GPT-Image-1 | OpenAI | Native image generation | +| DALL-E 3 | OpenAI | Native image generation | +| Gemini 2.0 Flash | Google | Multimodal output | +| Flux Pro | Black Forest Labs | Image generation | +| Flux Dev | Black Forest Labs | Image generation | +| Ideogram 3 | Ideogram | Image generation | +| Stable Diffusion 3.5 | Stability AI | Image generation | +| Midjourney v7 | Midjourney | Image generation | + +## Audio Input (Speech Recognition) + +118 models accept audio as input: + +| Model | Provider | Capabilities | +| --------------- | ------------- | -------------------------------- | +| GPT-4o-audio | OpenAI | Audio understanding + generation | +| Gemini 2.5 Pro | Google | Audio understanding | +| Claude Sonnet 4 | Anthropic | Audio understanding | +| Qwen2-Audio | Alibaba Cloud | Audio understanding | +| Whisper | OpenAI | Speech recognition | + 
+## Audio Output (Speech Generation) + +34 models can generate audio: + +| Model | Provider | Type | +| -------------- | ------------- | -------------- | +| GPT-4o-audio | OpenAI | Audio output | +| Gemini 2.5 Pro | Google | Audio output | +| Qwen2-Audio | Alibaba Cloud | Audio output | +| TTS-1 | OpenAI | Text-to-speech | +| TTS-1-HD | OpenAI | Text-to-speech | + +## Video Input + +167 models accept video as input: + +| Model | Provider | Context | +| ---------------- | ------------- | ----------- | +| Gemini 2.5 Pro | Google | 1M tokens | +| GPT-4.1 | OpenAI | 1M tokens | +| Claude Opus 4 | Anthropic | 200K tokens | +| Qwen3-235B-A22B | Alibaba Cloud | 128K tokens | +| Llama 4 Maverick | Meta | 1M tokens | + +## Multimodal Models (3+ Input Modalities) + +Models that accept text + at least 2 additional input modalities: + +| Model | Provider | Input Modalities | +| -------------- | ------------- | ------------------------- | +| GPT-4o-audio | OpenAI | text, image, audio | +| Gemini 2.5 Pro | Google | text, image, audio, video | +| Claude Opus 4 | Anthropic | text, image, audio | +| Qwen2-Audio | Alibaba Cloud | text, image, audio | + +## Related Documentation + +- [Vision Models](vision-models.md) โ€” 1,487 vision models +- [Audio Models](audio-models.md) โ€” 118 audio input + 34 audio output models +- [Video Models](video-models.md) โ€” 167 video input/output models +- [Image Generation](image-generation.md) โ€” 28 image generation models +- [Model Selection Guide](model-selection.md) โ€” decision framework + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/model-comparison.md b/docs/model-comparison.md new file mode 100644 index 00000000..b041ed7a --- /dev/null +++ b/docs/model-comparison.md @@ -0,0 +1,109 @@ +**English** | [ไธญๆ–‡](./zh/model-comparison.md) + +# Model Comparison + +Quick-reference comparisons for popular AI model categories. All data sourced from first-party provider APIs and documentation. + +## Top-Tier Flagship Models + +The most capable models from each major provider. Pricing shown for direct provider API. + +| Model | Provider | Context | Input $/Mtok | Output $/Mtok | Reasoning | Tool Call | Vision | +| ---------------- | --------- | ------: | -----------: | ------------: | :-------: | :-------: | :----: | +| o3 | OpenAI | 200K | 10.00 | 40.00 | โœ… | โœ… | โœ… | +| Claude Opus 4.7 | Anthropic | 1M | 5.00 | 25.00 | โœ… | โœ… | โœ… | +| Gemini 2.5 Pro | Google | 1M | 1.25 | 10.00 | โœ… | โœ… | โœ… | +| DeepSeek-V4-Pro | DeepSeek | 1M | 0.435 | 0.87 | โœ… | โœ… | โŒ | +| Grok 4 | xAI | 131K | 3.00 | 15.00 | โœ… | โœ… | โœ… | +| Llama 4 Maverick | Meta | 1M | 0.24 | 0.97 | โŒ | โœ… | โœ… | +| Qwen3-235B | Alibaba | โ€” | 2.00 | 8.00 | โœ… | โœ… | โŒ | +| Mistral Large | Mistral | 128K | 2.00 | 6.00 | โŒ | โœ… | โœ… | + +## Cost-Effective Models + +Best value models for high-volume workloads. 
+ +| Model | Provider | Context | Input $/Mtok | Output $/Mtok | Reasoning | Tool Call | +| ----------------- | --------- | ------: | -----------: | ------------: | :-------: | :-------: | +| GPT-4.1 Nano | OpenAI | 1M | 0.10 | 0.40 | โŒ | โœ… | +| o4-mini | OpenAI | 200K | 1.10 | 4.40 | โœ… | โœ… | +| Claude Haiku 4.5 | Anthropic | 200K | 1.00 | 5.00 | โœ… | โœ… | +| Gemini 2.5 Flash | Google | 1M | 0.15 | 3.50 | โœ… | โœ… | +| DeepSeek-V4-Flash | DeepSeek | 1M | 0.14 | 0.28 | โœ… | โœ… | +| Llama 4 Scout | Meta | 10M | 0.17 | 0.66 | โŒ | โœ… | +| Qwen3-30B | Alibaba | โ€” | 0.75 | 3.00 | โœ… | โœ… | +| Mistral Small | Mistral | 128K | 0.20 | 0.60 | โŒ | โœ… | +| Grok 3 Mini | xAI | 131K | 0.25 | 1.27 | โœ… | โœ… | + +## Largest Context Windows + +Models with the biggest context windows for long-document processing. + +| Model | Provider | Context (tokens) | Input $/Mtok | Output $/Mtok | +| ----------------- | --------- | ---------------: | -----------: | ------------: | +| Llama 4 Scout | Meta | 10,000,000 | 0.17 | 0.66 | +| Claude Opus 4.7 | Anthropic | 1,000,000 | 5.00 | 25.00 | +| Claude Sonnet 4.6 | Anthropic | 1,000,000 | 3.00 | 15.00 | +| GPT-4.1 | OpenAI | 1,048,576 | 2.00 | 8.00 | +| Gemini 2.5 Pro | Google | 1,048,576 | 1.25 | 10.00 | +| Gemini 2.5 Flash | Google | 1,048,576 | 0.15 | 3.50 | +| Llama 4 Maverick | Meta | 1,000,000 | 0.24 | 0.97 | +| DeepSeek-V4-Pro | DeepSeek | 1,000,000 | 0.435 | 0.87 | + +## Free Models + +Models available at no cost (as of data collection date). 
+ +| Model | Provider | Context | Reasoning | Tool Call | +| ----------------------------- | -------- | ------: | :-------: | :-------: | +| DeepSeek-V4-Flash (free tier) | DeepSeek | 1M | ✅ | ✅ | +| Gemini 2.5 Flash (free tier) | Google | 1M | ✅ | ✅ | +| Llama 4 Scout (self-hosted) | Meta | 10M | ❌ | ✅ | +| Qwen3-30B (self-hosted) | Alibaba | — | ✅ | ✅ | +| Mistral Small (self-hosted) | Mistral | 128K | ❌ | ✅ | + +> Free tiers typically have rate limits. Self-hosted models require your own infrastructure. + +## Vision-Capable Models + +Models that accept image inputs. + +| Model | Provider | Image Input | Image Output | Video Input | +| ---------------- | --------- | :---------: | :----------: | :---------: | +| o3 | OpenAI | ✅ | ❌ | ❌ | +| Claude Opus 4.7 | Anthropic | ✅ | ❌ | ❌ | +| Gemini 2.5 Pro | Google | ✅ | ❌ | ❌ | +| GPT-4.1 | OpenAI | ✅ | ❌ | ❌ | +| Llama 4 Maverick | Meta | ✅ | ❌ | ❌ | +| Grok 3 | xAI | ✅ | ❌ | ❌ | + +## Open-Weight Models + +Models with publicly available weights for self-hosting. + +| Model | Provider | Context | Input $/Mtok | Output $/Mtok | Reasoning | +| ----------------- | --------- | ------: | -----------: | ------------: | :-------: | +| Llama 4 Maverick | Meta | 1M | 0.24 | 0.97 | ❌ | +| Llama 4 Scout | Meta | 10M | 0.17 | 0.66 | ❌ | +| Qwen3-235B | Alibaba | — | 2.00 | 8.00 | ✅ | +| Qwen3-30B | Alibaba | — | 0.75 | 3.00 | ✅ | +| Mistral Small 3.2 | Mistral | 128K | 0.20 | 0.60 | ❌ | +| Phi-4 | Microsoft | 16K | 0.125 | 0.50 | ❌ | + +> Pricing shown for hosted inference. Self-hosted models have no per-token cost but require infrastructure. + +--- + +**Note**: All pricing and capability data is from first-party sources. Prices may vary on inference platforms. Check `providers/<provider>/models/` for the most current data. 
+ +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” decision framework for choosing models +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Free AI Models](free-models.md) โ€” 81 free models +- [Open-Weight Models](open-weights.md) โ€” 527 models you can run yourself +- [Context Window Comparison](context-windows.md) โ€” largest context windows + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/model-selection-cheatsheet.md b/docs/model-selection-cheatsheet.md new file mode 100644 index 00000000..be900691 --- /dev/null +++ b/docs/model-selection-cheatsheet.md @@ -0,0 +1,105 @@ +# AI Model Selection Cheatsheet + +> Quick-reference guide to picking the right AI model for your use case. All data from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” 4,587+ models across 95 providers. + +## ๐ŸŽฏ Decision Tree + +``` +What do you need? 
+├── Cheapest model with tool calling → ling-2.6-flash ($0.01/$0.03/M) +├── Best free reasoning model → DeepSeek R1 (92% MATH-500) +├── Largest context window → Gemini 2.5 Pro (1M tokens) +├── Best coding assistant → Claude Sonnet 4 / GPT-4.1 +├── Open-source with tool calling → Qwen3 4B ($0.03/$0.15/M) +├── Free model with vision → Gemma 4 27B IT +└── Cheapest for production → bdc-coder ($0.01/$0.01/M) +``` + +## 💰 By Budget + +| Budget | Best Pick | Input/Output $/M | Why | +| ------------- | --------------- | ---------------- | -------------------------------- | +| **Free** | DeepSeek R1 | $0/$0 | Best reasoning among free models | +| **Free** | Gemma 4 27B IT | $0/$0 | Free vision + tool calling | +| **< $0.05/M** | ling-2.6-flash | $0.01/$0.03 | Cheapest tool calling | +| **< $0.10/M** | Qwen3 4B | $0.03/$0.15 | Open-source reasoning + TC | +| **< $0.50/M** | GPT-4.1-mini | $0.40/$1.60 | Best value frontier model | +| **≤ $2/M** | GPT-4.1 | $2/$8 | 1M context + vision | +| **< $5/M** | Claude Sonnet 4 | $3/$15 | Top coding + reasoning | +| **Premium** | o3 | $10/$40 | Best reasoning benchmark scores | + +## 🛠️ By Use Case + +### AI Agents + +Need: tool calling + reasoning + low latency + +- **Best value**: ling-2.6-flash ($0.01/$0.03/M) — cheapest TC model +- **Balanced**: GPT-4.1-mini ($0.40/$1.60/M) — reliable + 1M context +- **Premium**: Claude Sonnet 4 ($3/$15/M) — best agentic performance + +### Code Generation + +Need: tool calling + structured output + large context + +- **Best value**: bdc-coder ($0.01/$0.01/M) — cheapest coding model +- **Balanced**: GPT-4.1-mini ($0.40/$1.60/M) — great code quality +- **Premium**: Claude Sonnet 4 ($3/$15/M) — SOTA on SWE-bench + +### Chat / RAG + +Need: large context + low cost + fast responses + +- **Best value**: Qwen3 4B ($0.03/$0.15/M) — cheap + 262K context +- **Balanced**: GPT-4.1-nano ($0.10/$0.40/M) — fast + cheap +- **Premium**: 
Gemini 2.5 Pro ($1.25/$10/M) โ€” 1M context + reasoning + +### Vision / Multimodal + +Need: image input + text output + tool calling + +- **Free**: Gemma 4 27B IT โ€” free vision + TC +- **Best value**: GPT-4.1-mini ($0.40/$1.60/M) โ€” vision + 1M context +- **Premium**: Claude Sonnet 4 ($3/$15/M) โ€” best vision understanding + +### Reasoning / Math + +Need: reasoning capability + structured output + +- **Free**: DeepSeek R1 โ€” 92% MATH-500 +- **Best value**: Qwen3.5 4B ($0.03/$0.15/M) โ€” cheap reasoning +- **Premium**: o3 ($10/$40/M) โ€” SOTA on GPQA, MATH-500 + +### High-Volume Production + +Need: lowest cost per token + reliability + +- **Cheapest TC**: ling-2.6-flash ($0.01/$0.03/M) +- **Cheapest reasoning**: Qwen3.5 0.8B ($0.01/$0.05/M) +- **Cheapest coding**: bdc-coder ($0.01/$0.01/M) + +## ๐Ÿ“Š Quick Stats + +| Metric | Count | +| ------------------- | ----- | +| Total models | 4,587 | +| Providers | 95 | +| Free models | 81 | +| Tool-calling models | 2,350 | +| Reasoning models | 1,306 | +| Vision models | 1,487 | +| Open-weight models | 527 | +| Structured output | 829 | + +## ๐Ÿ”— Explore More + +- [Interactive Catalog](https://i-need-token.github.io/ai-models/) โ€” search, filter, compare all models +- [Free Models Guide](free-models.md) โ€” all 81 free models +- [Tool Calling Guide](tool-calling.md) โ€” 2,350 models with tool calling +- [Pricing Comparison](pricing-comparison.md) โ€” find the cheapest model +- [Context Windows](context-windows.md) โ€” largest context windows +- [Model Comparison](model-comparison.md) โ€” head-to-head comparisons + +--- + +_Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” first-party data only, updated automatically._ diff --git a/docs/model-selection.md b/docs/model-selection.md new file mode 100644 index 00000000..d3a465fe --- /dev/null +++ b/docs/model-selection.md @@ -0,0 +1,134 @@ +# Model Selection Guide + +> ๐Ÿ“‹ **Quick reference?** See the [Model Selection 
Cheatsheet](model-selection-cheatsheet.md) for a budget-by-budget guide. +> [ไธญๆ–‡](zh/model-selection.md) + +How to choose the right AI model for your use case โ€” practical recommendations based on cost, capabilities, and context windows. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). + +## Decision Framework + +``` +What do you need? +โ”œโ”€โ”€ Cheapest possible โ†’ Free models (81 available) +โ”‚ โ”œโ”€โ”€ With tool calling โ†’ See "Free + Tool Calling" below +โ”‚ โ”œโ”€โ”€ With reasoning โ†’ See "Free + Reasoning" below +โ”‚ โ””โ”€โ”€ Best overall free โ†’ See "Best Free Models" below +โ”œโ”€โ”€ Best value (cheap + capable) โ†’ See "Best Value Models" below +โ”œโ”€โ”€ Largest context โ†’ See "Large Context Models" below +โ”œโ”€โ”€ Specific capability +โ”‚ โ”œโ”€โ”€ Tool calling โ†’ [Tool Calling Models](tool-calling.md) +โ”‚ โ”œโ”€โ”€ Reasoning โ†’ [Reasoning Models](reasoning-models.md) +โ”‚ โ”œโ”€โ”€ Vision โ†’ [Vision Models](vision-models.md) +โ”‚ โ”œโ”€โ”€ Structured output โ†’ [Structured Output](structured-output.md) +โ”‚ โ””โ”€โ”€ Prompt caching โ†’ [Cached Pricing](cached-pricing.md) +โ””โ”€โ”€ Full comparison โ†’ [Model Comparison](model-comparison.md) ยท [Pricing Comparison](pricing-comparison.md) +``` + +## Best Free Models + +Models with $0 input and $0 output pricing โ€” perfect for prototyping and development. + +| Model | Provider | Context | Capabilities | +| ----- | -------- | ------- | ------------ | + +> See [Free AI Models](free-models.md) for the complete list of 81 free models. + +## Free + Tool Calling + +Free models that support function/tool calling โ€” ideal for building agents at zero cost. + +| Model | Provider | Context | Capabilities | +| ----- | -------- | ------- | ------------ | + +## Free + Reasoning + +Free models with chain-of-thought reasoning โ€” complex problem solving at zero cost. 
+ +| Model | Provider | Context | Capabilities | +| ----- | -------- | ------- | ------------ | + +## Best Value Models + +Cheapest models with tool calling โ€” best bang for the buck for production agents. + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| --------------------------- | ------------ | ------- | --------- | ---------- | ------------ | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ”ง ๐Ÿ‘ ๐Ÿ“‹ | +| bdc-coder | inferencenet | 131K | $0.01 | $0.01 | ๐Ÿ”ง ๐Ÿ”“ | +| inclusionai--ling-2.6-flash | openrouter | 262K | $0.01 | $0.03 | ๐Ÿ”ง ๐Ÿ“‹ | +| ling-2.6-flash | inclusionai | 262K | $0.01 | $0.03 | ๐Ÿ”ง | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿง  ๐Ÿ”ง ๐Ÿ‘ | + +Cheapest models with vision: + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| -------------------- | --------- | ------- | --------- | ---------- | ------------ | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ”ง ๐Ÿ‘ ๐Ÿ“‹ | +| deepseek-ocr | aihubmix | 0 | $0.01 | $0.01 | ๐Ÿ‘ | +| gemini-2.0-flash-exp | aihubmix | 0 | $0.01 | $0.04 | ๐Ÿ‘ | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿง  ๐Ÿ”ง ๐Ÿ‘ | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | ๐Ÿง  ๐Ÿ‘ | + +Cheapest models with reasoning: + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| --------------------- | --------- | ------- | --------- | ---------- | ------------ | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿง  ๐Ÿ”ง ๐Ÿ‘ | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | ๐Ÿง  ๐Ÿ‘ | +| gemma-2-2b-it | cortecs | 0 | $0.018 | $0.054 | ๐Ÿง  | +| llama-3.1-8b-instruct | cortecs | 0 | $0.018 | $0.054 | ๐Ÿง  ๐Ÿ”ง | +| qwen-3.5-2b | auriko | 262K | $0.02 | $0.1 | ๐Ÿง  ๐Ÿ”ง ๐Ÿ‘ | + +## Large Context Models + +Models with the largest context windows โ€” for long documents, multi-turn conversations, and codebases. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ---------------------------- | ---------- | ------- | --------- | ---------- | ------------ | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | 🔧 👁 📋 | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | 🔧 👁 | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | 🔧 👁 📋 | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | 🔧 👁 | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | 🔧 👁 | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | 🔧 👁 | + +> See [Context Window Comparison](context-windows.md) for the full analysis. + +## Cost Optimization Tips + +1. **Use free models for development** — prototype with free models, then switch to paid models for production +2. **Enable prompt caching** — [1,374 models](cached-pricing.md) support caching with 50–90% input cost savings +3. **Choose the smallest capable model** — e.g., GPT-4.1 Mini instead of GPT-4.1 for simple tasks +4. **Use open-weight models** — [527 models](open-weights.md) can run on your own infrastructure +5. **Compare across providers** — the same model is often cheaper through alternative providers (e.g., Groq, Together AI, DeepInfra) +6. **Batch requests** — some providers offer a 50% discount for batch API calls +7. 
**Monitor usage** โ€” track input/output token ratios to optimize model selection + +## Related Documentation + +- [Model Comparison](model-comparison.md) โ€” flagship, cost-effective, free, and open-weight models +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Cached Pricing](cached-pricing.md) โ€” models with prompt caching support +- [Free AI Models](free-models.md) โ€” 81 free models by capability +- [Open-Weight Models](open-weights.md) โ€” 527 models you can run yourself +- [Context Window Comparison](context-windows.md) โ€” largest context windows +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with tool calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with reasoning +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Quick Start Guide](quick-start.md) โ€” get started in 30 seconds + +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling for chat applications +- [Multimodal Models](multimodal-models.md) โ€” 1,519 models with image/audio/video input + +- [Large Context Models](large-context-models.md) โ€” 2,195 models with 128K+ context +- [Small & Edge Models](small-models.md) โ€” 1,153 models for on-device inference + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/multimodal-models.md b/docs/multimodal-models.md new file mode 100644 index 00000000..1745d8f0 --- /dev/null +++ b/docs/multimodal-models.md @@ -0,0 +1,101 @@ +# Multimodal Models + +[ไธญๆ–‡](zh/multimodal-models.md) + +AI models that can process **multiple input modalities** โ€” images, audio, and video alongside text. These models power visual Q&A, document analysis, video understanding, and audio transcription. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Why Multimodal Models Matter + +Multimodal models break the text-only barrier: + +- **Visual Q&A** — ask questions about images and documents +- **Document Analysis** — extract information from PDFs, screenshots, and scans +- **Video Understanding** — analyze video content, summarize clips +- **Audio Processing** — transcribe speech, analyze audio content +- **Accessibility** — describe images for visually impaired users +- **Content Moderation** — detect inappropriate content across modalities + +## Stats + +| Metric | Count | +| ----------------------------- | ----- | +| Multimodal models | 1,519 | +| Providers | 61 | +| Image input | 1,487 | +| Audio input | 118 | +| Video input | 167 | +| Free multimodal models | 53 | +| Open-weight multimodal models | 119 | +| With tool calling | 1,179 | +| With reasoning | 701 | + +## Providers + +`01ai`, `302ai`, `aihubmix`, `aimlapi`, `amazon`, `amazon-bedrock`, `anthropic`, `arcee`, `auriko`, `baidu`, `berget`, `bytedance`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `cortecs`, `databricks`, `deepinfra`, `digitalocean`, `evroc`, `fastrouter`, `fireworks`, `google`, `google-vertex`, and 36 more + +## Free Multimodal Models + +Free models with multimodal input — zero-cost visual/audio applications. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Modalities | +| ---------------------------------------------------- | ---------- | ------- | --------- | ---------- | -------------- | +| google--lyria-3-clip-preview | openrouter | 1M | Free | Free | ๐Ÿ–ผ๏ธ | +| google--lyria-3-pro-preview | openrouter | 1M | Free | Free | ๐Ÿ–ผ๏ธ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿ–ผ๏ธ ๐ŸŽฌ ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿ–ผ๏ธ ๐ŸŽฌ ๐Ÿ”ง ๐Ÿง  | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿ–ผ๏ธ ๐Ÿ”ง ๐Ÿง  | +| gemma-4-31b-it | auriko | 262K | Free | Free | ๐Ÿ–ผ๏ธ ๐Ÿ”ง ๐Ÿง  | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | ๐Ÿ–ผ๏ธ ๐ŸŽค ๐ŸŽฌ ๐Ÿ”ง ๐Ÿง  | +| spotlight | arcee | 131K | Free | Free | ๐Ÿ–ผ๏ธ | +| gemma-3-4b-it | google | 131K | Free | Free | ๐Ÿ–ผ๏ธ | +| gemma-3-12b-it | google | 131K | Free | Free | ๐Ÿ–ผ๏ธ | + +## Cheapest Multimodal Models + +Best value multimodal models for production. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Modalities | +| -------------------------- | --------- | ------- | --------- | ---------- | ---------- | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| deepseek-ocr | aihubmix | 0 | $0.01 | $0.01 | ๐Ÿ–ผ๏ธ | +| gemini-2.0-flash-exp | aihubmix | 0 | $0.01 | $0.04 | ๐Ÿ–ผ๏ธ ๐ŸŽค ๐ŸŽฌ | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง ๐Ÿง  | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | ๐Ÿ–ผ๏ธ ๐Ÿง  | +| qwen3-vl-flash-2026-01-22 | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ–ผ๏ธ ๐ŸŽฌ ๐Ÿ”ง | +| qwen3-vl-flash | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ–ผ๏ธ ๐ŸŽฌ ๐Ÿ”ง | +| glm-ocr | aihubmix | 0 | $0.0141 | $0.0141 | ๐Ÿ–ผ๏ธ | +| paddlepaddle--paddleocr-vl | novitaai | 16K | $0.02 | $0.02 | ๐Ÿ–ผ๏ธ | +| qwen-3.5-2b | auriko | 262K | $0.02 | $0.1 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง ๐Ÿง  | + +## Largest Context Multimodal Models + +Multimodal models with the largest context windows โ€” for processing long documents and videos. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Modalities | +| ---------------------------- | ---------- | ------- | --------- | ---------- | ----------- | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | ๐Ÿ–ผ๏ธ ๐ŸŽค ๐ŸŽฌ ๐Ÿ”ง | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | ๐Ÿ–ผ๏ธ ๐Ÿ”ง | + +## Related Documentation + +- [Vision Models](vision-models.md) โ€” 1,487 models with image input +- [Video Models](video-models.md) โ€” models with video understanding +- [Audio Models](audio-models.md) โ€” models with audio input/output +- [Image Generation](image-generation.md) โ€” 28 models that generate images +- [Agentic Models](agentic-models.md) โ€” 1,080 models with tool calling + reasoning +- [Free AI Models](free-models.md) โ€” 81 free models by capability +- [Model Selection Guide](model-selection.md) โ€” decision framework + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/open-weights.md b/docs/open-weights.md new file mode 100644 index 00000000..f3f0ba3d --- /dev/null +++ b/docs/open-weights.md @@ -0,0 +1,118 @@ +**English** | [ไธญๆ–‡](./zh/open-weights.md) + +# Open-Weight AI Models + +513 models in this catalog are open-weight โ€” you can download the weights and run them on your own infrastructure. 
This page highlights the most capable and widely available open-weight models. + +> All data sourced from first-party APIs and documentation. "Open-weight" means the model weights are publicly available; license terms vary by model. + +## Quick Stats + +| Capability | Open-Weight Models | +| ------------------------- | -----------------: | +| Total open-weight models | 513 | +| Unique model IDs | 420 | +| With tool calling | 270 | +| With reasoning | 101 | +| With vision (image input) | 104 | + +## Most Widely Available + +These open-weight models are available on the most providers โ€” easy to find, easy to switch: + +| Model | Providers | Context | Tool Call | Reasoning | Vision | +| ----------------------------- | --------: | ------- | --------- | --------- | ------ | +| GPT-OSS-120B | 14 | 131K | โœ… | โœ… | โŒ | +| GPT-OSS-20B | 8 | 131K | โœ… | โœ… | โŒ | +| Qwen3.5-397B-A17B | 4 | 262K | โœ… | โœ… | โŒ | +| Kimi K2 Thinking | 4 | 262K | โœ… | โœ… | โœ… | +| DeepSeek-R1-Distill-Llama-70B | 4 | 131K | โœ… | โœ… | โŒ | +| Llama 4 Scout 17B | 4 | 328K | โœ… | โŒ | โœ… | +| DeepSeek-R1 | 3 | 131K | โœ… | โœ… | โŒ | +| Llama 4 Maverick | 3 | 1M | โœ… | โŒ | โœ… | +| Qwen3-32B | 3 | 131K | โœ… | โœ… | โŒ | +| Gemma 4 31B IT | 3 | 262K | โœ… | โœ… | โœ… | + +## Largest Context Windows + +Open-weight models with the largest context windows: + +| Model | Context | Tool Call | Reasoning | Vision | +| ----------------- | ------- | --------- | --------- | ------ | +| Llama 4 Scout | 10M | โœ… | โŒ | โœ… | +| Qwen3.5 Flash | 1M | โœ… | โŒ | โœ… | +| Qwen3.6 Flash | 1M | โœ… | โŒ | โœ… | +| Llama 4 Maverick | 1M | โœ… | โŒ | โœ… | +| DeepSeek-V4 Flash | 1M | โœ… | โœ… | โŒ | +| DeepSeek-V4 Pro | 1M | โœ… | โœ… | โŒ | +| MiMo V2.5 | 1M | โœ… | โœ… | โœ… | +| Minimax M2.5 | 1M | โœ… | โŒ | โŒ | +| Gemma 4 31B IT | 1M | โœ… | โŒ | โœ… | + +## Best Open-Weight Reasoning Models + +These open-weight models support chain-of-thought reasoning: + +| Model | Context 
| Tool Call | Vision | Providers | +| -------------------- | ------- | --------- | ------ | --------: | +| DeepSeek-V4 Flash | 1M | โœ… | โŒ | 2 | +| DeepSeek-V4 Pro | 1M | โœ… | โŒ | 2 | +| MiMo V2.5 Pro | 1M | โœ… | โŒ | 1 | +| MiMo V2.5 | 1M | โœ… | โœ… | 1 | +| Gemma 4 26B A4B IT | 262K | โœ… | โœ… | 3 | +| Kimi K2.6 | 262K | โœ… | โœ… | 2 | +| Qwen3.5-397B-A17B | 262K | โœ… | โŒ | 2 | +| Nemotron-3-120B-A12B | 262K | โœ… | โŒ | 1 | +| DeepSeek-R1 | 131K | โœ… | โŒ | 3 | +| Qwen3-32B | 131K | โœ… | โœ… | 3 | + +## Best Open-Weight Vision Models + +Open-weight models that accept image input: + +| Model | Context | Tool Call | Reasoning | Providers | +| ------------------ | ------- | --------- | --------- | --------: | +| MiMo V2.5 | 1M | โœ… | โœ… | 1 | +| Llama 4 Maverick | 1M | โœ… | โŒ | 3 | +| Llama 4 Scout | 10M | โœ… | โŒ | 2 | +| Gemma 4 31B IT | 1M | โœ… | โŒ | 3 | +| Qwen3.5 Flash | 1M | โœ… | โŒ | 1 | +| Kimi K2.6 | 262K | โœ… | โœ… | 2 | +| Gemma 4 26B A4B IT | 262K | โœ… | โœ… | 3 | +| Llama 4 Scout 17B | 328K | โœ… | โŒ | 4 | + +## Cheapest Open-Weight Models + +Lowest per-token pricing for open-weight inference: + +| Model | Provider | Input $/1M | Output $/1M | Context | +| -------------------------- | ------------ | ---------: | ----------: | ------- | +| GLM-4-Flash | 302AI | $0.0014 | $0.0014 | 131K | +| Mistral-Nemo-Instruct-2407 | KlusterAI | $0.008 | $0.001 | 131K | +| BDC-Coder | InferenceNet | $0.01 | $0.01 | 131K | +| Granite 4.0 H Micro | Cloudflare | $0.017 | $0.112 | 131K | +| Llama 3.1 8B Instruct | InferenceNet | $0.02 | $0.03 | 131K | +| Mistral Nemo Instruct 2407 | MegaNova | $0.02 | $0.04 | 131K | +| Meta-Llama-3.1-8B-Instruct | Nebius | $0.02 | $0.06 | 131K | +| Llama 3.2 1B Instruct | Cloudflare | $0.027 | $0.201 | 131K | + +## Key Takeaways + +- **513 open-weight models** across 420 unique model IDs โ€” the largest open-weight model catalog available +- **GPT-OSS-120B** is the most widely available, offered by 14 
providers +- **Llama 4 Scout** has the largest context window at 10M tokens +- **DeepSeek-R1** is the most popular open-weight reasoning model, available on 3 providers +- **MiMo V2.5** is the only open-weight model combining 1M context, reasoning, and vision +- Pricing varies widely โ€” the cheapest open-weight models cost under $0.01/1M tokens + +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” decision framework for choosing models +- [Free AI Models](free-models.md) โ€” 81 free models +- [Provider Overview](providers.md) โ€” all 95 providers organized by type +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with reasoning +- [Cached Pricing](cached-pricing.md) โ€” 1,374 models with prompt caching + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/openai-alternatives.md b/docs/openai-alternatives.md new file mode 100644 index 00000000..be13fdea --- /dev/null +++ b/docs/openai-alternatives.md @@ -0,0 +1,156 @@ +**English** | [ไธญๆ–‡](./zh/openai-alternatives.md) + +# OpenAI Alternatives โ€” GPT-4, GPT-3.5, and Beyond + +Comprehensive guide to AI models comparable to OpenAI's GPT-4, GPT-4o, and GPT-3.5 Turbo โ€” with pricing, capabilities, and API compatibility. All data sourced from first-party APIs via the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Quick Comparison: GPT-4 Class Alternatives + +Models with **tool calling + reasoning + vision** (the full GPT-4 capability set): + +| Model | Provider | Context | Input $/1M | Output $/1M | Open Weights | +| ----------------------------- | ---------- | ------- | ---------- | ----------- | ------------ | +| openai--gpt-oss-120b | novitaai | 128K | $0.05 | $0.25 | | +| Qwen--Qwen3.6-35B-A3B | neuralwatt | 0 | $0.05 | $0.1 | | +| Nemotron-3-Nano-Omni | nebius | 125K | $0.06 | $0.24 | โœ… | +| seed-1.6-flash | bytedance | 256K | $0.07 | $0.3 | | +| gemma-4-26b-a4b-it | cloudflare | 256K | $0.1 | $0.3 | โœ… | +| Gemma-3-27b-it | nebius | 93K | $0.1 | $0.3 | โœ… | +| seed-2.0-mini | bytedance | 256K | $0.1 | $0.4 | | +| google--gemma-4-26b-a4b-it | novitaai | 256K | $0.13 | $0.4 | | +| google--gemma-4-31B-turbo-TEE | chutes | 128K | $0.13 | $0.38 | | +| baidu--ernie-4.5-vl-28b-a3b | novitaai | 29K | $0.14 | $0.56 | | +| google--gemma-4-31b-it | novitaai | 256K | $0.14 | $0.4 | | +| amazon-nova-2.0-lite | amazon | 62K | $0.15 | $1.25 | | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | | +| amazon-nova-2.0-omni | amazon | 62K | $0.2 | $1.3 | | +| xai-grok-4.1 | xai | 128K | $0.2 | $0.5 | | + +> Full list: 617 models with tool calling + reasoning + vision across 50+ providers. See [Agentic Models](agentic-models.md) for the complete catalog. 
+ +## Cheapest Tool-Calling Models + +Best value models with function/tool calling (direct providers only): + +| Model | Provider | Context | Input $/1M | Output $/1M | +| ------------------------------------------- | -------------- | ------- | ---------- | ----------- | +| ling-2.6-flash | inclusionai | 256K | $0.01 | $0.03 | +| bdc-coder | inferencenet | 128K | $0.01 | $0.01 | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | 127K | $0.015 | $0.02 | +| granite-4.0-h-micro | cloudflare | 128K | $0.017 | $0.112 | +| schematron-v3 | inferencenet | 128K | $0.02 | $0.05 | +| schematron-3b | inferencenet | 128K | $0.02 | $0.05 | +| llama-3.1-8b-instruct--fp-16 | inferencenet | 128K | $0.02 | $0.03 | +| liquid-ai--LFM2-24B-A2B | togetherai | 128K | $0.03 | $0.12 | +| qwen--qwen3-4b-fp8 | novitaai | 125K | $0.03 | $0.03 | +| schematron-v2-turbo | inferencenet | 128K | $0.03 | $0.15 | +| gpt-oss-20b | inferencenet | 128K | $0.03 | $0.15 | +| openai--gpt-oss-20b | neuralwatt | 0 | $0.03 | $0.16 | +| amazon-nova-micro | amazon | 125K | $0.035 | $0.14 | +| amazon-nova-micro | amazon-bedrock | 125K | $0.035 | $0.14 | +| mistral-nemo-12b-instruct--fp-8 | inferencenet | 128K | $0.0375 | $0.1 | + +> Full list: 2,350 tool-calling models across 67 providers. See [Tool Calling Models](tool-calling.md). 
+ +## Free Alternatives to GPT-4 + +Models with tool calling at zero cost (direct providers): + +| Model | Provider | Context | Capabilities | +| --------------------------------- | -------- | ------- | ---------------------------- | +| glm-4.7-flash | zhipuai | 195K | Tool Call | +| glm-4.1v-thinking-flash | zhipuai | 62K | Reasoning, Vision, Tool Call | +| glm-4-flash-250414 | zhipuai | 125K | Tool Call | +| glm-4v-flash | zhipuai | 15K | Vision, Tool Call | +| autoglm-phone | zhipuai | 19K | Vision, Tool Call | +| glm-ocr | zhipuai | 0 | Vision, Tool Call | +| glm-4.6v-flash | zhipuai | 125K | Vision, Tool Call | +| cobuddy | baidu | 128K | Tool Call | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | 64K | Vision, Tool Call | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | 64K | Reasoning, Vision, Tool Call | +| baidu--ernie-4.5-0.3b | aimlapi | 117K | Tool Call | +| qwen--qwen3.5-4b-free | mixlayer | 128K | Reasoning, Tool Call | +| llama-4-scout-17b-16e-instruct | cerebras | 128K | Tool Call | +| qwen-2.5-32b | cerebras | 128K | Tool Call | +| llama-3.3-70b | cerebras | 128K | Tool Call | + +> Full list: 81 free models. See [Free AI Models](free-models.md). 
+ +## Largest Context Windows with Tool Calling + +| Model | Provider | Context | Input $/1M | Output $/1M | +| -------------------------------------------------- | ----------- | ------- | ---------- | ----------- | +| meta-llama-4-scout | meta | 9765K | $0.17 | $0.66 | +| xai--grok-4-fast-reasoning | aimlapi | 1953K | $0.52 | $1.3 | +| xai--grok-4-fast-non-reasoning | aimlapi | 1953K | $0.52 | $1.3 | +| meta-llama--Llama-4-Maverick-17B-128E-Instruct-FP8 | gmicloud | 1024K | $0.25 | $0.8 | +| minimax-m2-5 | baseten | 1024K | $0.3 | $1.2 | +| deepseek-v4-flash | baidu | 1024K | $0.126 | $0.252 | +| deepseek-v4-pro | siliconflow | 1024K | $1.74 | $3.48 | +| deepseek-v4-flash | siliconflow | 1024K | $0.14 | $0.28 | +| deepseek--deepseek-v4-pro | novitaai | 1024K | $1.67 | $3.38 | +| xiaomimimo--mimo-v2.5-pro | novitaai | 1024K | $2 | $6 | +| deepseek--deepseek-v4-flash | novitaai | 1024K | $0.14 | $0.28 | +| gemini-2.0-flash-lite | google | 1024K | $0.075 | $0.3 | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | +| gemini-2.5-pro | google | 1024K | $1.25 | $10 | +| gemini-2.0-flash | google | 1024K | $0.1 | $0.4 | + +> Full list: 2,195 models with 128K+ context. See [Large Context Models](large-context-models.md). 
+ +## OpenAI-Compatible Providers + +70 providers offer OpenAI-compatible API endpoints โ€” switch with minimal code changes: + +| Provider | API Endpoint | Model Count | Free Tier | +| --------------- | -------------------------------------------- | ----------- | --------- | +| Regolo | `https://api.regolo.ai/v1` | 1 | โ€” | +| MegaNova | `https://api.meganova.ai/v1` | 1 | โ€” | +| GMI Cloud | `https://api.gmi-serving.com/v1` | 1 | โ€” | +| Cohere | `https://api.cohere.com` | 1 | โ€” | +| Requesty | `https://router.requesty.ai/v1` | 1 | โ€” | +| ๆŽฅๅฃ AI | `https://api.jiekou.ai/v1` | 1 | โ€” | +| Zhipu AI (ๆ™บ่ฐฑ) | `https://open.bigmodel.cn/api/paas/v4` | 1 | โ€” | +| SambaNova | `https://api.sambanova.ai/v1` | 1 | โ€” | +| Baseten | `https://model-api.baseten.co/v1` | 1 | โ€” | +| Wafer | `https://pass.wafer.ai/v1` | 1 | โ€” | +| Arcee AI | `https://api.arcee.ai/v1` | 1 | โ€” | +| Moonshot AI | `https://api.moonshot.cn/v1` | 1 | โ€” | +| Amazon Nova | `https://bedrock.us-east-1.amazonaws.com/v1` | 1 | โ€” | +| Baidu | `https://qianfan.baidubce.com/v1` | 1 | โ€” | +| Together AI | `https://api.together.xyz/v1` | 1 | โ€” | +| OpenRouter | `https://openrouter.ai/api/v1` | 1 | โ€” | +| FastRouter | `https://api.fastrouter.ai/v1` | 1 | โ€” | +| SubModel | `https://api.submodel.ai/v1` | 1 | โ€” | +| Inception Labs | `https://api.inceptionlabs.ai/v1` | 1 | โ€” | +| SiliconFlow | `https://api.siliconflow.cn/v1` | 1 | โ€” | + +> See [Migration Guide](migration-guide.md) for step-by-step instructions on switching from OpenAI. 
+ +## Choosing Your Alternative + +| Need | Best Option | See | +| ----------------------------- | ---------------------------------- | ------------------------------------------- | +| Cheapest tool calling | DeepSeek, Qwen3 | [Pricing Comparison](pricing-comparison.md) | +| GPT-4-level reasoning | Claude Opus 4, Gemini 2.5 Pro | [Reasoning Models](reasoning-models.md) | +| Free for prototyping | Google Gemini, Cloudflare | [Free Models](free-models.md) | +| Largest context | Gemini 2.5 Pro (1M), Llama 4 (10M) | [Context Windows](context-windows.md) | +| Open weights for self-hosting | Llama 4, Qwen3 | [Open-Weight Models](open-weights.md) | +| Easy migration from OpenAI | Any OpenAI-compatible provider | [Migration Guide](migration-guide.md) | +| Running AI agents | Models with tool_call + reasoning | [Agentic Models](agentic-models.md) | + +## Related Documentation + +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Free AI Models](free-models.md) โ€” 81 models at zero cost +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Migration Guide](migration-guide.md) โ€” switch providers with minimal code changes +- [Provider Comparison](provider-comparison.md) โ€” top 30 providers by model count +- [Agentic Models](agentic-models.md) โ€” 1,080 models for AI agents +- [Code Models](code-models.md) โ€” 189 code-focused models + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/pricing-comparison.md b/docs/pricing-comparison.md new file mode 100644 index 00000000..d49b2ff4 --- /dev/null +++ b/docs/pricing-comparison.md @@ -0,0 +1,134 @@ +**English** | [ไธญๆ–‡](./zh/pricing-comparison.md) + +# Pricing Comparison + +Side-by-side pricing comparison for AI model inference across providers and platforms. All prices in USD per million tokens, sourced from first-party APIs. + +## Direct Provider Pricing + +Pricing from the model producer's own API. + +### OpenAI + +| Model | Input $/Mtok | Output $/Mtok | Cache Read $/Mtok | Context | +| ------------ | -----------: | ------------: | ----------------: | ------: | +| GPT-4.1 Nano | 0.10 | 0.40 | 0.025 | 1M | +| GPT-4o Mini | 0.15 | 0.60 | 0.075 | 128K | +| GPT-4.1 Mini | 0.40 | 1.60 | 0.10 | 1M | +| GPT-4.1 | 2.00 | 8.00 | 0.50 | 1M | +| GPT-4o | 2.50 | 10.00 | 1.25 | 128K | +| o4-mini | 1.10 | 4.40 | 0.275 | 200K | +| o3 | 10.00 | 40.00 | 2.50 | 200K | + +### Anthropic + +| Model | Input $/Mtok | Output $/Mtok | Context | +| ----------------- | -----------: | ------------: | ------: | +| Claude Haiku 4.5 | 1.00 | 5.00 | 200K | +| Claude Sonnet 4.0 | 3.00 | 15.00 | 1M | +| Claude Sonnet 4.5 | 3.00 | 15.00 | 1M | +| Claude Sonnet 4.6 | 3.00 | 15.00 | 1M | +| Claude Opus 4.5 | 5.00 | 25.00 | 200K | +| Claude Opus 4.7 | 5.00 | 25.00 | 1M | + +### Google + +| Model | Input $/Mtok | Output $/Mtok | Cache Read $/Mtok | Context | +| --------------------- | -----------: | ------------: | ----------------: | ------: | +| Gemini 1.5 Flash 8B | 0.075 | 0.30 | โ€” | 1M | +| Gemini 2.0 Flash Lite | 0.075 | 0.30 | โ€” | 1M | +| Gemini 2.0 Flash | 0.10 | 0.40 | โ€” | 1M | +| Gemini 2.5 Flash Lite | 0.10 | 0.40 | โ€” | 1M | +| Gemini 2.5 Flash | 0.15 | 3.50 | 0.0375 | 1M | +| Gemini 2.5 Pro | 1.25 | 10.00 | 0.315 | 1M | + +### DeepSeek + +| Model | Input $/Mtok | Output $/Mtok | Cache Read $/Mtok | Context | +| ----------------- | -----------: | ------------: | ----------------: | ------: | +| 
DeepSeek-V4-Flash | 0.14 | 0.28 | 0.0028 | 1M | +| DeepSeek-V4-Pro | 0.435 | 0.87 | 0.003625 | 1M | + +### xAI + +| Model | Input $/Mtok | Output $/Mtok | Context | +| ----------- | -----------: | ------------: | ------: | +| Grok 4 Fast | 0.20 | 0.50 | 131K | +| Grok 4.1 | 0.20 | 0.50 | 131K | +| Grok 3 Mini | 0.25 | 1.27 | 131K | +| Grok 4.2 | 2.00 | 6.00 | 131K | +| Grok 3 | 3.00 | 15.00 | 131K | +| Grok 4 | 3.00 | 15.00 | 131K | + +### Meta (via hosted inference) + +| Model | Input $/Mtok | Output $/Mtok | Context | +| ---------------- | -----------: | ------------: | ------: | +| Llama 3.2 1B | 0.10 | 0.10 | 128K | +| Llama 4 Scout | 0.17 | 0.66 | 10M | +| Llama 4 Maverick | 0.24 | 0.97 | 1M | + +### Mistral + +| Model | Input $/Mtok | Output $/Mtok | Context | +| ------------- | -----------: | ------------: | ------: | +| Ministral 3B | 0.04 | 0.04 | 128K | +| Ministral 8B | 0.10 | 0.10 | 128K | +| Mistral Small | 0.20 | 0.60 | 128K | +| Mistral Large | 2.00 | 6.00 | 128K | + +## Cross-Platform Price Comparison + +Same model on different inference platforms โ€” prices can vary significantly. + +### Llama 4 Scout (10M context) + +| Platform | Input $/Mtok | Output $/Mtok | +| ------------- | -----------: | ------------: | +| AIHubMix | 0.061 | 0.183 | +| Auriko | 0.08 | 0.30 | +| DeepInfra | 0.08 | 0.30 | +| Kluster AI | 0.08 | 0.45 | +| Meta (direct) | 0.17 | 0.66 | + +### Llama 4 Maverick (1M context) + +| Platform | Input $/Mtok | Output $/Mtok | +| --------------- | -----------: | ------------: | +| AIHubMix | 0.10 | 0.10 | +| ๆŽฅๅฃ AI | 0.10 | 0.50 | +| AIHubMix (Groq) | 0.11 | 0.33 | +| Cortecs | 0.124 | 0.603 | +| Auriko | 0.15 | 0.60 | +| Meta (direct) | 0.24 | 0.97 | + +## Cheapest Models Overall + +The absolute cheapest per-token models across all providers. 
+ +| Model | Provider | Input $/Mtok | Output $/Mtok | Context | +| ------------------- | -------- | -----------: | ------------: | ------: | +| Ministral 3B | Mistral | 0.04 | 0.04 | 128K | +| Voxtral Mini | Mistral | 0.04 | 0.04 | 128K | +| Ministral 8B | Mistral | 0.10 | 0.10 | 128K | +| Llama 3.2 1B | Meta | 0.10 | 0.10 | 128K | +| GPT-4.1 Nano | OpenAI | 0.10 | 0.40 | 1M | +| Gemini 1.5 Flash 8B | Google | 0.075 | 0.30 | 1M | +| DeepSeek-V4-Flash | DeepSeek | 0.14 | 0.28 | 1M | + +--- + +**Note**: All pricing from first-party sources as of data collection date. Inference platform prices may differ. Check `providers/<provider>/models/` for current data. CNY and EUR pricing available in provider YAML files. + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — decision framework for choosing models +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching +- [Free AI Models](free-models.md) — 81 free models +- [Context Window Comparison](context-windows.md) — largest context windows +- [Provider Overview](providers.md) — all 95 providers +- [OpenAI Alternatives](openai-alternatives.md) — cheapest GPT-4 alternatives + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/provider-comparison.md b/docs/provider-comparison.md new file mode 100644 index 00000000..22c13572 --- /dev/null +++ b/docs/provider-comparison.md @@ -0,0 +1,127 @@ +# Provider Comparison + +[中文](zh/provider-comparison.md) + +Side-by-side comparison of AI model providers — model count, capabilities, pricing, and context windows at a glance. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Top 30 Providers by Model Count + +| Provider | Models | Free | Tool Call | Reasoning | Vision | Cheapest $/M | Capabilities | +| -------------- | -----: | ---: | --------: | --------: | -----: | -----------: | ------------ | +| nanogpt | 547 | 0 | 0 | 0 | 0 | $0.02 | | +| aihubmix | 476 | 0 | 132 | 74 | 145 | $0.00 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| openrouter | 356 | 29 | 263 | 190 | 160 | $0.01 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| martian | 304 | 0 | 0 | 3 | 2 | $0.02 | ๐Ÿง  ๐Ÿ‘๏ธ | +| requesty | 277 | 0 | 251 | 139 | 151 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| 302ai | 268 | 0 | 190 | 44 | 144 | $0.00 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| auriko | 181 | 5 | 154 | 108 | 93 | $0.01 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ–ผ๏ธ | +| llmgateway | 163 | 3 | 158 | 85 | 89 | $0.03 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ–ผ๏ธ | +| aimlapi | 147 | 2 | 21 | 0 | 14 | $0.01 | ๐Ÿ”ง ๐Ÿ‘๏ธ | +| fastrouter | 120 | 2 | 94 | 66 | 65 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| orcarouter | 120 | 0 | 102 | 64 | 111 | $0.05 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| cortecs | 105 | 0 | 97 | 82 | 52 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| novitaai | 104 | 2 | 72 | 53 | 33 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| vultr | 98 | 0 | 11 | 22 | 23 | $0.55 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| deepinfra | 88 | 0 | 0 | 51 | 38 | $0.01 | ๐Ÿง  ๐Ÿ‘๏ธ | +| venice | 75 | 0 | 64 | 55 | 39 | $0.05 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| jiekou | 73 | 0 | 73 | 0 | 49 | $0.03 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐Ÿ”“ | +| meganova | 63 | 4 | 60 | 7 | 37 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| alibaba | 62 | 0 | 62 | 52 | 0 | $0.15 | ๐Ÿ”ง ๐Ÿง  | +| ppio | 60 | 1 | 46 | 12 | 11 | $0.21 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| amazon-bedrock | 57 | 0 | 37 | 0 | 16 | $0.04 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐ŸŽค ๐ŸŽฌ | +| google-vertex | 38 | 0 | 32 | 0 | 19 | $0.07 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐ŸŽค ๐ŸŽฌ | +| siliconflow-cn | 37 | 0 | 2 | 7 | 9 | $0.50 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| stepfun | 31 | 14 | 0 | 0 | 11 | $0.70 | ๐Ÿ‘๏ธ ๐ŸŽค ๐Ÿ–ผ๏ธ | +| cloudflare | 30 | 0 | 15 | 10 | 7 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| gmicloud | 29 | 0 | 11 | 10 | 0 | $0.07 | ๐Ÿ”ง ๐Ÿง  
๐Ÿ”“ | +| databricks | 29 | 0 | 4 | 0 | 10 | $0.05 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐Ÿ”“ | +| openai | 28 | 5 | 18 | 8 | 12 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| siliconflow | 27 | 0 | 24 | 2 | 3 | $0.04 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| togetherai | 24 | 0 | 22 | 2 | 0 | $0.03 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ”“ | + +## Provider Categories + +### Aggregators (Multi-Provider Access) + +These providers offer access to models from multiple AI companies through a single API: + +| Provider | Models | Notes | +| ---------- | -----: | ----------------------------------------------- | +| openrouter | 356 | Largest model aggregator, OpenAI-compatible API | +| requesty | 277 | Smart routing across providers | +| martian | 304 | Multi-provider with load balancing | +| aihubmix | 476 | Chinese market aggregator | +| nanogpt | 547 | Pay-per-token, no subscription | +| llmgateway | 163 | Enterprise API gateway | +| fastrouter | 120 | Fast model routing | +| orcarouter | 120 | Multi-provider routing | + +### Direct Providers (First-Party APIs) + +| Provider | Models | Specialty | +| --------- | -----: | ---------------------------------- | +| openai | 28 | GPT-4.1, o3/o4 reasoning models | +| anthropic | 11 | Claude 4 family, best for agents | +| google | 21 | Gemini 2.5, 1M+ context | +| deepseek | 4 | DeepSeek R1, best open reasoning | +| meta | 12 | Llama 4, open weights | +| mistral | 16 | Mistral Large, Codestral | +| xai | 6 | Grok 3, real-time data | +| alibaba | 62 | Qwen 3, largest open-source family | + +### Infrastructure Providers (Hosted Open-Source) + +| Provider | Models | Specialty | +| ---------- | -----: | ------------------------------ | +| groq | 12 | Fastest inference (LPU) | +| cerebras | 11 | Ultra-fast inference (CS-3) | +| togetherai | 24 | Serverless open-source hosting | +| deepinfra | 88 | Cost-effective inference | +| fireworks | 10 | Serverless model hosting | +| cloudflare | 30 | Edge inference (Workers AI) | + +### Regional Providers + +| Provider | Models | Region | +| 
------------------- | -----: | ---------------- | +| siliconflow | 27 | China | +| siliconflow-cn | 37 | China (domestic) | +| stepfun | 31 | China | +| zhipuai | 20 | China | +| baichuan | 11 | China | +| baidu | 8 | China | +| iflytek | 6 | China | +| tencent | 14 | China | +| ppio | 60 | China | +| ovhcloud | 12 | Europe (France) | +| scaleway | 13 | Europe (France) | +| cloudferro-sherlock | 12 | Europe (EU) | + +## Choosing a Provider + +| If you need... | Best provider | Why | +| --------------------- | ------------------------------ | ------------------------- | +| **Cheapest prices** | deepseek, google | Input from $0.14/M tokens | +| **Fastest inference** | groq, cerebras | Sub-100ms latency | +| **Largest context** | google, meta | 1M-10M token context | +| **Most models** | nanogpt, aihubmix | 500+ models each | +| **Best for agents** | anthropic, openai | Tool calling + reasoning | +| **Open weights** | meta, deepseek | Run on your own hardware | +| **EU data residency** | ovhcloud, scaleway, cloudferro | EU-hosted inference | +| **China access** | siliconflow, ppio, stepfun | China-based endpoints | + +## Related Documentation + +- [Migration Guide](migration-guide.md) โ€” switching providers with pricing comparison +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing across providers +- [Providers Overview](providers.md) โ€” all 95 providers listed +- [Model Selection Guide](model-selection.md) โ€” decision framework +- [Free AI Models](free-models.md) โ€” 81 free models by capability +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling +- [Agentic Models](agentic-models.md) โ€” 1,080 models with tool calling + reasoning + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/providers.md b/docs/providers.md new file mode 100644 index 00000000..526b1379 --- /dev/null +++ b/docs/providers.md @@ -0,0 +1,172 @@ +**English** | [ไธญๆ–‡](./zh/providers.md) + +# Provider Overview + +A comprehensive overview of all 95 AI model providers in this catalog, organized by type. + +## Model Producers + +Providers that develop and produce their own AI models. Their APIs and documentation are the authoritative source for model data. + +| Provider | ID | Models | Key Models | API Format | +| ----------------------- | ------------- | -----: | ---------------------------------- | ---------- | +| 01.AI (้›ถไธ€ไธ‡็‰ฉ) | `01ai` | 5 | Yi-Lightning, Yi-Vision | OpenAI | +| AI21 Labs | `ai21` | 2 | Jamba 1.5 | OpenAI | +| Alibaba Cloud (Bailian) | `alibaba` | 62 | Qwen 3, Qwen 2.5 | OpenAI | +| Amazon Nova | `amazon` | 7 | Nova Pro, Nova Lite | OpenAI | +| Anthropic | `anthropic` | 11 | Claude Opus 4.7, Claude Sonnet 4.6 | Anthropic | +| ByteDance | `bytedance` | 5 | Doubao-Pro, Doubao-Lite | OpenAI | +| Cloudflare Workers AI | `cloudflare` | 30 | Llama 3.3, Mistral | OpenAI | +| Cohere | `cohere` | โ€” | Command R+, Embed 3 | OpenAI | +| DeepSeek | `deepseek` | 4 | DeepSeek-V4-Pro, DeepSeek-R1 | OpenAI | +| Google | `google` | 21 | Gemini 3.5 Flash, Gemini 3.1 Pro | Google | +| IBM Granite | `ibm` | โ€” | Granite 3.3 | OpenAI | +| iFlytek SparkDesk | `iflytek` | 6 | SparkDesk 4.0 Ultra | OpenAI | +| Inception Labs | `inception` | 5 | Mercury Coder | OpenAI | +| InclusionAI | `inclusionai` | 3 | Book3R | OpenAI | +| Meta Llama | `meta` | 12 | Llama 4 Maverick, Llama 4 Scout | OpenAI | +| Microsoft Phi | `microsoft` | 12 | Phi-4, Phi-4-Mini | OpenAI | +| MiniMax | `minimax` | 21 | MiniMax-Text-01, MiniMax-M1 | OpenAI | +| Mistral AI | `mistral` | 16 | Mistral Large, Codestral | OpenAI | +| Moonshot AI | `moonshotai` | 16 | Kimi K2.6, Kimi K2.5 | OpenAI | +| NVIDIA | `nvidia` | โ€” | Nemotron Ultra | OpenAI | +| OpenAI | `openai` | 28 | GPT-5.5, 
GPT-5.4, o3 | OpenAI | +| Perplexity | `perplexity` | 4 | Sonar, Sonar Pro | OpenAI | +| Reka AI | `reka` | 2 | Reka Core, Reka Flash | OpenAI | +| Sarvam AI | `sarvam` | โ€” | Sarvam-M | OpenAI | +| StepFun | `stepfun` | 31 | Step-2, Step-1.5V | OpenAI | +| Tencent Hunyuan | `tencent` | 14 | Hunyuan-Turbos | OpenAI | +| Upstage | `upstage` | 8 | Solar Pro, Solar Mini | OpenAI | +| Voyage AI | `voyage` | 21 | Voyage 3, Voyage Code 3 | OpenAI | +| Writer | `writer` | 6 | Palmyra X5 | OpenAI | +| xAI Grok | `xai` | 6 | Grok 3, Grok 3 Mini | OpenAI | +| Xiaomi | `xiaomi` | 5 | MiMo | OpenAI | +| Zhipu AI (ๆ™บ่ฐฑ) | `zhipuai` | 20 | GLM-4, GLM-Z1 | OpenAI | + +## Inference Platforms + +Providers that host and serve models produced by others. They offer their own per-token pricing and API access. + +| Provider | ID | Models | Pricing Currency | API Format | +| ---------------------- | --------------------- | -----: | ---------------- | ---------- | +| 302.AI | `302ai` | 268 | CNY | OpenAI | +| AIHubMix | `aihubmix` | 476 | CNY | OpenAI | +| AI/ML API | `aimlapi` | 147 | USD | OpenAI | +| Aion Labs | `aion` | 5 | USD | OpenAI | +| Arcee AI | `arcee` | 7 | USD | OpenAI | +| Auriko | `auriko` | 181 | USD | OpenAI | +| Baseten | `baseten` | 9 | USD | OpenAI | +| Berget | `berget` | 7 | EUR | OpenAI | +| Cerebras | `cerebras` | 11 | USD | OpenAI | +| Chutes | `chutes` | 12 | USD | OpenAI | +| Clarifai | `clarifai` | 12 | USD | OpenAI | +| CloudFerro Sherlock | `cloudferro-sherlock` | 12 | EUR | OpenAI | +| Cortecs | `cortecs` | 105 | USD | OpenAI | +| Databricks | `databricks` | 29 | USD | OpenAI | +| DeepInfra | `deepinfra` | 88 | USD | OpenAI | +| DigitalOcean | `digitalocean` | 20 | USD | OpenAI | +| DInference | `dinference` | 6 | CNY | OpenAI | +| evroc | `evroc` | 8 | EUR | OpenAI | +| FastRouter | `fastrouter` | 120 | USD | OpenAI | +| Fireworks AI | `fireworks` | 10 | USD | OpenAI | +| FriendliAI | `friendli` | 8 | USD | OpenAI | +| GMI Cloud | `gmicloud` | 29 | USD 
| OpenAI | +| Google Vertex AI | `google-vertex` | 38 | USD | Google | +| Groq | `groq` | 12 | USD | OpenAI | +| HPC-AI Cloud | `hpc-ai` | 11 | CNY | OpenAI | +| Hyperbolic | `hyperbolic` | 11 | USD | OpenAI | +| Inference.net | `inferencenet` | 20 | USD | OpenAI | +| ๆŽฅๅฃ AI | `jiekou` | 73 | CNY | OpenAI | +| Kluster AI | `klusterai` | 12 | USD | OpenAI | +| LLM Gateway | `llmgateway` | 163 | USD | OpenAI | +| Martian | `martian` | 304 | USD | OpenAI | +| MegaNova | `meganova` | 63 | USD | OpenAI | +| Mixlayer | `mixlayer` | 5 | USD | OpenAI | +| MoArk AI | `moark` | โ€” | USD | OpenAI | +| Morph | `morph` | 7 | USD | OpenAI | +| NanoGPT | `nanogpt` | 547 | USD | OpenAI | +| Nebius | `nebius` | 23 | USD | OpenAI | +| NeuralWatt | `neuralwatt` | 14 | USD | OpenAI | +| Nous Research | `nousresearch` | 7 | USD | OpenAI | +| Novita AI | `novitaai` | 104 | USD | OpenAI | +| OrcaRouter | `orcarouter` | 120 | USD | OpenAI | +| OVHcloud AI Endpoints | `ovhcloud` | 12 | EUR | OpenAI | +| PPIO | `ppio` | 60 | CNY | OpenAI | +| Privatemode AI | `privatemode` | 5 | EUR | OpenAI | +| Qiniu AI | `qiniu-ai` | โ€” | CNY | OpenAI | +| Regolo | `regolo` | โ€” | EUR | OpenAI | +| Requesty | `requesty` | 277 | USD | OpenAI | +| SambaNova | `sambanova` | 7 | USD | OpenAI | +| Scaleway | `scaleway` | 13 | EUR | OpenAI | +| SiliconFlow | `siliconflow` | 27 | USD | OpenAI | +| SiliconFlow CN | `siliconflow-cn` | 37 | CNY | OpenAI | +| SubModel | `submodel` | 6 | USD | OpenAI | +| Tencent Cloud TokenHub | `tencent-tokenhub` | 19 | CNY | OpenAI | +| TextSynth | `textsynth` | 6 | USD | OpenAI | +| Together AI | `togetherai` | 24 | USD | OpenAI | +| Venice AI | `venice` | 75 | USD | OpenAI | +| Vultr Cloud Inference | `vultr` | 98 | USD | OpenAI | +| Wafer | `wafer` | 2 | USD | OpenAI | + +## Cloud Provider Hosted Services + +Major cloud providers offering hosted AI model services. 
+ +| Provider | ID | Models | Cloud Platform | +| -------------------- | ---------------- | -----: | -------------- | +| Amazon Bedrock | `amazon-bedrock` | 57 | AWS | +| Azure OpenAI Service | `azure` | โ€” | Azure | +| Google Vertex AI | `google-vertex` | 38 | GCP | + +## Chinese Market Providers + +Providers primarily serving the Chinese market with CNY pricing. + +| Provider | ID | Models | +| ----------------------- | ------------------ | -----: | +| 302.AI | `302ai` | 268 | +| AIHubMix | `aihubmix` | 476 | +| Alibaba Cloud (Bailian) | `alibaba` | 62 | +| Baichuan AI | `baichuan` | 11 | +| Baidu | `baidu` | 8 | +| ByteDance | `bytedance` | 5 | +| DInference | `dinference` | 6 | +| HPC-AI Cloud | `hpc-ai` | 11 | +| iFlytek SparkDesk | `iflytek` | 6 | +| ๆŽฅๅฃ AI | `jiekou` | 73 | +| MiniMax | `minimax` | 21 | +| Moonshot AI | `moonshotai` | 16 | +| PPIO | `ppio` | 60 | +| Qiniu AI | `qiniu-ai` | โ€” | +| SiliconFlow CN | `siliconflow-cn` | 37 | +| StepFun | `stepfun` | 31 | +| Tencent Cloud TokenHub | `tencent-tokenhub` | 19 | +| Tencent Hunyuan | `tencent` | 14 | +| Xiaomi | `xiaomi` | 5 | +| Zhipu AI (ๆ™บ่ฐฑ) | `zhipuai` | 20 | + +## European Market Providers + +Providers with EUR pricing, serving the European market. 
+ +| Provider | ID | Models | +| --------------------- | --------------------- | -----: | +| Berget | `berget` | 7 | +| CloudFerro Sherlock | `cloudferro-sherlock` | 12 | +| evroc | `evroc` | 8 | +| OVHcloud AI Endpoints | `ovhcloud` | 12 | +| Privatemode AI | `privatemode` | 5 | +| Regolo | `regolo` | โ€” | +| Scaleway | `scaleway` | 13 | + +## Related Documentation + +- [Model Comparison](model-comparison.md) โ€” flagship, cost-effective, free models +- [Pricing Comparison](pricing-comparison.md) โ€” side-by-side pricing +- [Open-Weight Models](open-weights.md) โ€” 527 models you can run yourself +- [Free AI Models](free-models.md) โ€” 81 free models +- [Data Schema](data-schema.md) โ€” complete YAML schema + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/quick-start.md b/docs/quick-start.md new file mode 100644 index 00000000..b645b839 --- /dev/null +++ b/docs/quick-start.md @@ -0,0 +1,142 @@ +**English** | [ไธญๆ–‡](./zh/quick-start.md) + +# Quick Start Guide + +Find the right AI model for your needs in 30 seconds. + +## I want to find the cheapest model + +โ†’ See [Pricing Comparison](pricing-comparison.md) for the cheapest models per provider and cross-platform price comparisons. + +**Cheapest models with tool calling:** + +| Model | Provider | Input (per 1M tokens) | Output (per 1M tokens) | +| ---------------- | ------------- | --------------------: | ---------------------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-235B-A22B | Alibaba Cloud | $0.14 | $0.42 | +| Llama 4 Maverick | Together AI | $0.20 | $0.80 | + +## I want the most capable model + +โ†’ See [Model Comparison](model-comparison.md) for flagship model comparisons. 
+ +**Top-tier flagships:** + +| Model | Context | Tool Call | Vision | Input $/1M | Output $/1M | +| -------------- | ------- | --------- | ------ | ---------: | ----------: | +| GPT-4.1 | 1M | โœ… | โœ… | $2.00 | $8.00 | +| Claude Opus 4 | 200K | โœ… | โœ… | $15.00 | $75.00 | +| Gemini 2.5 Pro | 1M | โœ… | โœ… | $1.25 | $10.00 | +| DeepSeek-R1 | 128K | โœ… | โŒ | $0.55 | $2.19 | + +## I want a free model + +โ†’ See [Model Comparison](model-comparison.md#free-models) for the full list. + +**Free models with tool calling:** + +- Google Gemini 2.0 Flash (via Google AI Studio) +- Cloudflare Workers AI models (edge inference) +- Various models on Chutes, Cerebras, Groq free tiers + +## I want the largest context window + +โ†’ See [Model Comparison](model-comparison.md#largest-context-windows) for the full list. + +| Model | Context Window | +| --------------- | -------------: | +| Llama 4 Scout | 10M tokens | +| Gemini 2.5 Pro | 1M tokens | +| GPT-4.1 | ~1M tokens | +| Claude Sonnet 4 | 200K tokens | + +## I want to browse all providers + +โ†’ See [Provider Overview](providers.md) for all 95 providers organized by type. 
+ +## I want to use the data programmatically + +### npm package + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types +``` + +### Download data files + +```bash +# JSON — full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV — flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +### CDN access (no install) + +The compiled JSON is available via [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models) — no download or install needed: + +```bash +# Always up-to-date, CORS-enabled, works in browsers +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +``` + +```html + +``` + +### From source + +```bash +# Install dependencies +npm install + +# Compute catalog statistics +npx tsx scripts/stats.ts + +# Validate all model data +npx tsx scripts/validate.ts +``` + +```typescript +import { ModelSchema } from "./types/schemas"; +import { parse } from "yaml"; +import { readFileSync } from "fs"; + +// Load and validate a model +const raw = readFileSync("providers/openai/models/gpt-4.1.yaml", "utf-8"); +const model = ModelSchema.parse(parse(raw)); + +console.log(model.pricing); // { input: 2, output: 8, cache_read: 0.5 } +console.log(model.limit); // { context: 1047576, output: 32768 } +``` + +## I want to add a new provider + +→ See [Contributing Guide](../CONTRIBUTING.md) and [Data Acquisition Guide](data-acquisition.md). + +## I want to understand the data format + +→ See [Data Schema Reference](data-schema.md) for the complete YAML schema. 
+ +## Related Documentation + +- [Model Selection Guide](model-selection.md) โ€” decision framework for choosing models +- [FAQ](faq.md) โ€” common questions about the catalog +- [API & Programmatic Access](api.md) โ€” download and use the data +- [Code Examples](code-examples.md) โ€” practical examples in TypeScript, Python, Go, Rust +- [Glossary](glossary.md) โ€” key terms and definitions + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/reasoning-models.md b/docs/reasoning-models.md new file mode 100644 index 00000000..8703ba33 --- /dev/null +++ b/docs/reasoning-models.md @@ -0,0 +1,104 @@ +**English** | [ไธญๆ–‡](./zh/reasoning-models.md) + +# AI Reasoning Models + +1,306 models in this catalog support reasoning (chain-of-thought / extended thinking). This page highlights the most capable and cost-effective reasoning models available. + +> All data sourced from first-party APIs and documentation. "Reasoning" means the model can produce extended chain-of-thought before answering. 
+ +## Quick Stats + +| Capability | Reasoning Models | +| ------------------------- | ---------------: | +| Total reasoning models | 1,306 | +| Unique model IDs | 868 | +| With tool calling | 1,076 | +| With vision (image input) | 697 | +| Open-weight | 119 | + +## Top Reasoning Models by Context + +The largest-context reasoning models โ€” ideal for complex, multi-step tasks: + +| Model | Context | Tool Call | Vision | Input $/1M | Providers | +| ----------------------------- | ------- | --------- | ------ | ---------: | --------: | +| Grok 4 Fast Reasoning | 2M | โœ… | โœ… | $0.20 | 2 | +| Grok 4.1 Fast Reasoning | 2M | โœ… | โœ… | $0.20 | 2 | +| Grok 4.20 | 2M | โœ… | โœ… | $1.42 | 1 | +| GPT-5.4 | 1M | โœ… | โœ… | $2.50 | 4 | +| GPT-5.5 | 1M | โœ… | โœ… | $5.00 | 4 | +| Gemini 2.5 Pro | 1M | โœ… | โœ… | $1.25 | 4 | +| Gemini 2.5 Flash | 1M | โœ… | โœ… | $0.15 | 3 | +| Gemini 2.5 Flash Lite | 1M | โœ… | โœ… | $0.10 | 3 | +| Gemini 3 Flash Preview | 1M | โœ… | โœ… | $0.50 | 4 | +| Gemini 3.1 Flash Lite Preview | 1M | โœ… | โœ… | $0.25 | 3 | +| DeepSeek Reasoner | 1M | โœ… | โœ… | $0.43 | 1 | + +## Cheapest Reasoning Models + +Best value for reasoning capability: + +| Model | Provider | Input $/1M | Output $/1M | Context | +| --------------------- | --------- | ---------: | ----------: | ------- | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | +| GPT-5 Nano | Requesty | $0.025 | $0.20 | 400K | +| Qwen 3.5 4B | Auriko | $0.03 | $0.15 | 262K | +| Qwen 3.5 4B | DeepInfra | $0.03 | $0.15 | 262K | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | + +## Best Reasoning + Vision Models + +Models that can reason about images โ€” ideal for visual analysis: + +| Model | Context | Input $/1M | Providers | +| 
----------------------- | ------- | ---------: | --------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5 (open-weight) | 1M | varies | 2 | + +## Open-Weight Reasoning Models + +119 open-weight models support reasoning — run them on your own hardware: + +| Model | Context | Tool Call | Vision | Providers | +| ----------------------- | ------- | --------- | ------ | --------: | +| MiMo V2.5 Pro | 1M | ✅ | ❌ | 2 | +| MiMo V2.5 | 1M | ✅ | ✅ | 2 | +| DeepSeek-V4 Pro | 1M | ✅ | ❌ | 1 | +| Qwen3 Next 80B Thinking | 262K | ✅ | ❌ | 4 | +| Kimi K2.6 | 262K | ✅ | ✅ | 4 | +| Trinity Large Thinking | 262K | ✅ | ❌ | 1 | +| Nemotron 3 120B | 262K | ✅ | ❌ | 1 | +| Qwen3.5 397B A17B | 262K | ✅ | ❌ | 2 | + +## Key Takeaways + +- **1,306 reasoning models** across 868 unique IDs — the largest reasoning model catalog available +- **Grok 4 Fast Reasoning** offers the best value at 2M context for $0.20/1M input +- **Gemini 2.5 Flash Lite** is the cheapest 1M-context reasoning model at $0.10/1M +- **MiMo V2.5** is the only open-weight model combining 1M context, reasoning, and vision +- **697 reasoning models** also support vision — the second most common combined capability, after tool calling (1,076) +- Small reasoning models (Qwen 3.5 0.8B–4B) cost as little as $0.01–$0.03/1M tokens + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — decision framework for choosing models +- [Tool Calling Models](tool-calling.md) — 2,350 models with tool calling +- [Structured Output](structured-output.md) — 829 JSON-mode models +- [Free AI Models](free-models.md) — 81 free models, some with reasoning +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching +- [OpenAI Alternatives](openai-alternatives.md) — GPT-4 class alternatives with reasoning +- [Agentic Models](agentic-models.md) 
โ€” 1,080 models with tool_call + reasoning for agents +- [Code Models](code-models.md) โ€” 189 code-focused models + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/small-language-models.md b/docs/small-language-models.md new file mode 100644 index 00000000..accd9328 --- /dev/null +++ b/docs/small-language-models.md @@ -0,0 +1,126 @@ +# Small Language Models (SLM) Guide + +> Complete guide to 2,000+ small language models for edge deployment, mobile apps, and cost-efficient production. + +## What Are Small Language Models? + +Small Language Models (SLMs) are AI models with fewer than ~10 billion parameters, designed for efficiency, low latency, and deployment on resource-constrained hardware. They offer a practical alternative to large frontier models when cost, speed, or privacy matters. + +### Key Advantages + +| Factor | Small Model (SLM) | Large Model (LLM) | +| --------------------- | ---------------------- | -------------------------- | +| Cost per 1M tokens | $0.01 โ€“ $0.20 | $1 โ€“ $40 | +| Latency (first token) | 50 โ€“ 200ms | 200 โ€“ 2000ms | +| Deployment | On-device, edge, cloud | Cloud only | +| Privacy | Data stays on device | Data sent to cloud | +| Customization | Easy fine-tuning | Expensive fine-tuning | +| Complex reasoning | Good for simple tasks | Superior for complex tasks | + +## Quick Stats + +| Metric | Count | +| --------------------- | ----- | +| Total small models | 2,002 | +| With tool calling | 928 | +| With reasoning | 557 | +| Free SLMs | 48 | +| First-party providers | 689 | + +## Best SLMs by Use Case + +### AI Agents on a Budget + +Need tool calling + reasoning + low latency for high-volume agent workflows. 
+ +- **Best value**: ling-2.6-flash ($0.01/$0.03/M) โ€” cheapest tool-calling model with 262K context +- **Balanced**: GPT-4.1-mini ($0.40/$1.60/M) โ€” reliable + 1M context +- **Free**: Gemma 4 27B IT โ€” free vision + tool calling + +### On-Device / Edge Deployment + +Need models that run on smartphones, IoT devices, or edge servers. + +- **Ultra-compact**: Qwen3.5 0.8B โ€” reasoning in a tiny package +- **Balanced**: Qwen3 4B ($0.03/$0.15/M) โ€” open-source with reasoning +- **Vision**: Gemma 4 27B IT โ€” free with vision + tool calling + +### Code Completion + +Need tool calling + structured output for coding assistance. + +- **Cheapest**: bdc-coder ($0.01/$0.01/M) โ€” cheapest coding model +- **Balanced**: GPT-4.1-nano ($0.10/$0.40/M) โ€” fast + cheap +- **Open-source**: Qwen3 4B ($0.03/$0.15/M) โ€” reasoning + tool calling + +### Math & Reasoning + +Need reasoning capability for step-by-step problem solving. + +- **Free**: DeepSeek R1 Distill Llama 8B โ€” free reasoning model +- **Cheapest**: Qwen3.5 0.8B ($0.01/$0.05/M) โ€” cheapest reasoning +- **Balanced**: Qwen3.5 4B ($0.03/$0.15/M) โ€” open-source reasoning + +### Chat & RAG + +Need large context + low cost for retrieval-augmented generation. 
+ +- **Cheapest**: Qwen3 4B ($0.03/$0.15/M) โ€” cheap + 262K context +- **Fast**: GPT-4.1-nano ($0.10/$0.40/M) โ€” fast + cheap +- **Large context**: Gemini 2.5 Flash ($0.15/$0.60/M) โ€” 1M context + reasoning + +## Cheapest Small Models with Tool Calling + +| Model | Provider | Input $/M | Output $/M | Context | Reasoning | +| ------------------------------------------- | --------- | --------- | ---------- | ------- | --------- | +| ling-2.6-flash | ling | $0.01 | $0.03 | 262K | โ€” | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | $0.015 | $0.02 | 131K | โ€” | +| granite-4.0-h-micro | ibm | $0.017 | $0.112 | 131K | โ€” | +| llama-3.1-8b-instruct--fp-16 | fireworks | $0.02 | $0.03 | 131K | โ€” | +| schematron-3b | fireworks | $0.02 | $0.05 | 131K | โ€” | + +## Free Small Language Models + +48 small models available at zero cost โ€” perfect for prototyping and development: + +| Model | Provider | Context | Tool Calling | Reasoning | +| ------------------------------ | -------- | ------- | ------------ | --------- | +| deepseek-r1-distill-llama-8b | cerebras | 131K | โ€” | โœ“ | +| llama-4-scout-17b-16e-instruct | cerebras | 131K | โœ“ | โ€” | +| qwen-2.5-32b | cerebras | 131K | โœ“ | โ€” | +| gemma-4-26b-a4b-it | auriko | 262K | โœ“ | โ€” | +| glm-4.5-flash | auriko | 200K | โœ“ | โ€” | + +## Small Models with Reasoning + +557 small models with reasoning capabilities: + +| Model | Provider | Input $/M | Output $/M | Context | Tool Calling | +| ---------------------------- | --------- | --------- | ---------- | ------- | ------------ | +| qwen3.5-0.8b | qwen | $0.01 | $0.05 | 262K | โ€” | +| qwen3.5-2b | qwen | $0.02 | $0.10 | 262K | โ€” | +| qwen--qwen3-4b-fp8 | fireworks | $0.03 | $0.03 | 128K | โ€” | +| qwen3.5-4b | qwen | $0.03 | $0.15 | 262K | โ€” | +| deepseek-r1-distill-llama-8b | cerebras | Free | Free | 131K | โ€” | + +## How to Choose the Right SLM + +1. **Define your constraints**: Budget, latency, deployment target (cloud vs edge) +2. 
**Identify required capabilities**: Tool calling? Reasoning? Vision? Structured output? +3. **Check context window**: How much text do you need to process? +4. **Compare pricing**: Use the [interactive catalog](https://i-need-token.github.io/ai-models/) or [pricing calculator](https://i-need-token.github.io/ai-models/ai-model-pricing-calculator.html) +5. **Test with your data**: Small models vary significantly in quality for specific domains + +## Related Documentation + +- [Free Models Guide](free-models.md) โ€” all 81 free models +- [Tool Calling Guide](tool-calling.md) โ€” 2,350 models with tool calling +- [Reasoning Models Guide](reasoning-models.md) โ€” 1,306 reasoning models +- [Pricing Comparison](pricing-comparison.md) โ€” find the cheapest model +- [Context Windows](context-windows.md) โ€” largest context windows +- [Model Selection Cheatsheet](model-selection-cheatsheet.md) โ€” quick-reference guide +- [Small Language Models Comparison](https://i-need-token.github.io/ai-models/small-language-models.html) โ€” interactive SEO page + +--- + +_Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” first-party data only, updated automatically._ diff --git a/docs/small-models.md b/docs/small-models.md new file mode 100644 index 00000000..ec3cc772 --- /dev/null +++ b/docs/small-models.md @@ -0,0 +1,80 @@ +# Small & Edge Models + +[ไธญๆ–‡](zh/small-models.md) + +AI models designed for **edge deployment, on-device inference, and resource-constrained environments** โ€” models under ~16B parameters that can run on consumer hardware, mobile devices, and embedded systems. + +Data sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Why Small Models Matter + +Small models enable AI where cloud connectivity is limited or latency is critical: + +- **On-device inference** โ€” run AI without internet, on phones and laptops +- **Edge computing** โ€” deploy in IoT devices, robotics, and vehicles +- **Low latency** โ€” sub-100ms response times for real-time applications +- **Cost efficiency** โ€” cheaper to run, especially at scale +- **Privacy** โ€” data never leaves the device +- **Offline capability** โ€” AI that works without connectivity + +## Stats + +| Metric | Count | +| ------------------------ | ----- | +| Small/edge models | 1153 | +| Providers | 63 | +| Free small models | 30 | +| Open-weight small models | 272 | +| With tool calling | 434 | +| With reasoning | 250 | + +## Providers + +`302ai`, `aihubmix`, `aimlapi`, `aion`, `alibaba`, `amazon-bedrock`, `auriko`, `baichuan`, `berget`, `bytedance`, `cerebras`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `cortecs`, `databricks`, `deepinfra`, `digitalocean`, `evroc`, `fastrouter`, `fireworks`, `friendli`, `gmicloud`, `google`, `google-vertex`, `groq`, `hpc-ai`, `hyperbolic`, `inferencenet`, `jiekou`, `klusterai`, `llmgateway`, `martian`, `meganova`, `meta`, `microsoft`, `mistral`, `mixlayer`, `moonshotai`, `morph`, `nanogpt`, `nebius`, `neuralwatt`, `nousresearch`, `novitaai`, `openrouter`, `orcarouter`, `ovhcloud`, `ppio`, `privatemode`, `requesty`, `sambanova`, `scaleway`, `siliconflow`, `siliconflow-cn`, `submodel`, `tencent`, `textsynth`, `togetherai`, `venice`, `vultr`, `wafer` + +## Free Small Models + +Free small models โ€” zero-cost edge AI. 
+ +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ---------------------------------------------------- | ---------- | ------- | --------- | ---------- | ------------ | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-31b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| gemma-3-4b-it | google | 131K | Free | Free | | +| gemma-3-12b-it | google | 131K | Free | Free | | +| gemma-3-27b-it | google | 131K | Free | Free | | +| gemma-3n-E2B-it | google | 131K | Free | Free | | + +## Cheapest Small Models + +Best value small models for production. + +| Model | Provider | Context | Input $/M | Output $/M | Capabilities | +| ----------------------------------------------- | -------- | ------- | --------- | ---------- | ------------ | +| llama3-groq-8b-8192-tool-use-preview | aihubmix | 0 | $9.5e-05 | $9.5e-05 | | +| mistralai--mistral-7b-instruct--free | aihubmix | 0 | $0.001 | $0.001 | | +| deepseek-ai--deepseek-r1-distill-llama-8b | aihubmix | 0 | $0.005 | $0.005 | | +| deepseek-ai--deepseek-r1-distill-qwen-7b | aihubmix | 0 | $0.005 | $0.005 | | +| deepseek-ai--deepseek-r1-distill-qwen-1.5b | aihubmix | 0 | $0.005 | $0.005 | | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ”ง ๐Ÿ“‹ | +| google--gemma-2-9b-it--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.2-3b-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.2-11b-vision-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.1-8b-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | + +## Related Documentation + +- [Open 
Weights](open-weights.md) — 527 open-weight models +- [Free AI Models](free-models.md) — 81 free models by capability +- [Chat Models](chat-models.md) — 2,350 models with tool calling +- [Code Models](code-models.md) — 189 code-focused models +- [Model Selection Guide](model-selection.md) — decision framework +- [Provider Comparison](provider-comparison.md) — top 30 providers + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/structured-output.md b/docs/structured-output.md new file mode 100644 index 00000000..efabf5a6 --- /dev/null +++ b/docs/structured-output.md @@ -0,0 +1,84 @@ +**English** | [中文](./zh/structured-output.md) + +# AI Structured Output Models (JSON Mode) + +829 models in this catalog support structured output — the ability to generate responses that conform to a specified JSON schema. This is essential for building reliable AI-powered APIs, data pipelines, and automation. + +> All data sourced from first-party APIs and documentation. "Structured output" means the model can enforce a JSON schema on its response (also known as JSON mode, constrained decoding, or guided generation). 
+ +## Quick Stats + +| Capability | Structured Output Models | +| ------------------------------ | -----------------------: | +| Total structured output models | 829 | +| Unique model IDs | 704 | +| With tool calling | 749 | +| With reasoning | 473 | +| With vision | 411 | +| Open-weight | 24 | + +## Cheapest Structured Output Models + +Best value for generating reliable JSON responses: + +| Model | Provider | Input $/1M | Output $/1M | Context | Tool Call | Reasoning | +| --------------------- | ---------- | ---------: | ----------: | ------- | --------- | --------- | +| Ernie 4.5 0.3B | AIHubMix | $0.0068 | $0.0272 | โ€” | โœ… | โŒ | +| Ling 2.6 Flash | OpenRouter | $0.01 | $0.03 | 262K | โœ… | โŒ | +| Qwen3 VL Flash | AIHubMix | $0.0103 | $0.103 | โ€” | โœ… | โŒ | +| Llama 3.1 8B Instruct | Auriko | $0.02 | $0.03 | 131K | โœ… | โŒ | +| Mistral Nemo | OpenRouter | $0.02 | $0.02 | โ€” | โœ… | โŒ | +| Doubao Seed 1.6 Flash | AIHubMix | $0.022 | $0.022 | โ€” | โœ… | โŒ | +| GPT-5 Nano | AIHubMix | $0.025 | $0.20 | โ€” | โœ… | โœ… | +| GPT-OSS 20B | NeuralWatt | $0.03 | $0.03 | โ€” | โœ… | โœ… | +| Granite 4.0 H Micro | Cloudflare | $0.017 | $0.112 | 131K | โœ… | โŒ | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | โœ… | + +## Free Structured Output Models + +24 models offer free structured output โ€” ideal for prototyping: + +| Model | Provider | Context | Tool Call | Reasoning | +| ------------------------- | ---------- | ------- | --------- | --------- | +| Ernie 4.5 0.3B | AIMLAPI | โ€” | โœ… | โŒ | +| Gemma 4 26B A4B IT | Auriko | โ€” | โœ… | โœ… | +| Gemma 4 31B IT | Auriko | โ€” | โœ… | โŒ | +| Qwen3 Omni 30B A3B | NovitaAI | โ€” | โœ… | โœ… | +| Dolphin Mistral 24B | OpenRouter | โ€” | โœ… | โŒ | +| Gemma 4 26B A4B IT (free) | OpenRouter | โ€” | โœ… | โœ… | +| Gemma 4 31B IT (free) | OpenRouter | โ€” | โœ… | โŒ | + +## Best Structured Output + Tool Calling + Reasoning + +For AI agents that need to return structured data, call tools, 
and reason: + +| Model | Context | Input $/1M | Tool Call | Reasoning | Providers | +| --------------------- | ------- | ---------: | --------- | --------- | --------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | ✅ | ✅ | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | ✅ | ✅ | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | ✅ | ✅ | 4 | +| GPT-5.4 | 1M | $2.50 | ✅ | ✅ | 4 | +| DeepSeek Reasoner | 1M | $0.43 | ✅ | ✅ | 1 | +| GPT-5 Nano | — | $0.025 | ✅ | ✅ | 4 | + +## Key Takeaways + +- **829 structured output models** — the largest catalog of JSON-mode models +- **749 models** combine structured output with tool calling — perfect for AI agents +- **24 free models** support structured output — start building at zero cost +- **Gemini 2.5 Flash** is the best value: 1M context, structured output, tool calling, and reasoning for $0.15/1M input tokens +- Small models (Ernie 4.5 0.3B, Ling 2.6 Flash) cost as little as $0.0068–$0.01/1M input tokens with structured output +- 90% of structured output models (749 of 829) also support tool calling — these capabilities go hand-in-hand + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — decision framework for choosing models +- [Tool Calling Models](tool-calling.md) — 2,350 models with tool calling +- [Reasoning Models](reasoning-models.md) — 1,306 models with reasoning +- [Free AI Models](free-models.md) — 81 free models, some with structured output +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching +- [Agentic Models](agentic-models.md) — 1,080 models with tool_call + reasoning for agents + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. 
diff --git a/docs/tool-calling.md b/docs/tool-calling.md new file mode 100644 index 00000000..2b70a89d --- /dev/null +++ b/docs/tool-calling.md @@ -0,0 +1,102 @@ +**English** | [ไธญๆ–‡](./zh/tool-calling.md) + +# AI Tool Calling Models + +2,350 models in this catalog support tool calling (function calling). This page highlights the most capable and cost-effective models for building AI agents and automation. + +> All data sourced from first-party APIs and documentation. "Tool calling" means the model can invoke external functions/tools as part of its response. + +## Quick Stats + +| Capability | Tool-Calling Models | +| ------------------------- | ------------------: | +| Total tool-calling models | 2,350 | +| Unique model IDs | 1,540 | +| With reasoning | 1,076 | +| With vision (image input) | 1,063 | +| With structured output | 829 | +| Open-weight | 270 | + +## Cheapest Tool-Calling Models + +Best value for building AI agents: + +| Model | Provider | Input $/1M | Output $/1M | Context | Reasoning | +| -------------------------- | ------------ | ---------: | ----------: | ------- | --------- | +| GLM-4-Flash | 302AI | $0.0014 | $0.0014 | 131K | โŒ | +| Mistral-Nemo-Instruct-2407 | KlusterAI | $0.008 | $0.001 | 131K | โŒ | +| BDC-Coder | InferenceNet | $0.01 | $0.01 | 131K | โŒ | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | โœ… | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | โœ… | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | โœ… | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | โœ… | +| GPT-5 Nano | Requesty | $0.025 | $0.20 | 400K | โœ… | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | โœ… | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | โœ… | + +## Largest Context Tool-Calling Models + +For agents that need to process large documents or long conversation histories: + +| Model | Context | Input $/1M | Reasoning | Providers | +| --------------------- | ------- | 
---------: | --------- | --------: | +| Llama 4 Scout | 10M | $0.08 | โŒ | 4 | +| Grok 4 Fast Reasoning | 2M | $0.20 | โœ… | 2 | +| GPT-5.4 | 1M | $2.50 | โœ… | 4 | +| Gemini 2.5 Pro | 1M | $1.25 | โœ… | 4 | +| Gemini 2.5 Flash | 1M | $0.15 | โœ… | 3 | +| DeepSeek-V4 Flash | 1M | $0.27 | โœ… | 2 | +| GPT-4.1 | 1M | $2.00 | โŒ | 4 | +| Llama 4 Maverick | 1M | $0.15 | โŒ | 3 | + +## Best Tool-Calling + Reasoning + Vision + +The "holy trinity" for advanced AI agents โ€” tool calling, reasoning, and vision in one model: + +| Model | Context | Input $/1M | Providers | +| ----------------------- | ------- | ---------: | --------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5 (open-weight) | 1M | varies | 2 | +| Kimi K2.6 (open-weight) | 262K | varies | 4 | + +## Free Tool-Calling Models + +45 free models support tool calling โ€” ideal for prototyping and testing: + +| Model | Provider | Context | Reasoning | Vision | +| ------------------------------ | -------- | ------- | --------- | ------ | +| gemini-2.0-flash | Google | 1M | โœ… | โœ… | +| gemini-2.5-flash-preview-05-20 | Google | 1M | โœ… | โœ… | +| llama-4-scout | Chutes | 10M | โŒ | โœ… | +| llama-4-maverick | Chutes | 1M | โŒ | โœ… | +| deepseek-r1 | Chutes | 128K | โœ… | โŒ | +| qwen3-235b-a22b | Chutes | 128K | โœ… | โœ… | +| gemma-3-27b-it | Chutes | 128K | โœ… | โœ… | + +## Key Takeaways + +- **2,350 tool-calling models** across 1,540 unique IDs โ€” the largest tool-calling model catalog +- **Gemini 2.5 Flash** is the best value: 1M context, tool calling, reasoning, and vision for $0.15/1M +- **Grok 4 Fast Reasoning** offers the largest context (2M) with all three capabilities +- **45 free models** support tool calling โ€” start building agents at zero cost +- **829 models** also support structured output โ€” perfect for reliable JSON responses +- 
Small models (Qwen 3.5 0.8B–4B) cost as little as $0.01–$0.03/1M input tokens with tool calling + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — decision framework for choosing models +- [Free AI Models](free-models.md) — 81 free models, many with tool calling +- [Structured Output](structured-output.md) — 829 JSON-mode models +- [Reasoning Models](reasoning-models.md) — 1,306 models with reasoning +- [Cached Pricing](cached-pricing.md) — 1,374 models with prompt caching +- [OpenAI Alternatives](openai-alternatives.md) — GPT-4/GPT-3.5 alternatives with tool calling +- [Agentic Models](agentic-models.md) — 1,080 models with tool_call + reasoning for agents + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) — structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/video-models.md b/docs/video-models.md new file mode 100644 index 00000000..2c34019f --- /dev/null +++ b/docs/video-models.md @@ -0,0 +1,210 @@ +# Video Models + +[中文](zh/video-models.md) + +AI models that support video input or output, sourced from the [AI Models Catalog](https://github.com/i-need-token/ai-models). 
+ +## Stats + +| Metric | Count | +| ------------------ | ----- | +| Total video models | 171 | +| Video input | 167 | +| Video output | 4 | +| Free | 0 | +| Open weights | 6 | +| Providers | 18 | + +## Providers + +`aihubmix`, `amazon`, `amazon-bedrock`, `bytedance`, `chutes`, `fastrouter`, `google`, `google-vertex`, `hpc-ai`, `inferencenet`, `minimax`, `novitaai`, `openrouter`, `tencent`, `tencent-tokenhub`, `voyage`, `vultr`, `xiaomi` + +## Models + +| Model | Provider | Context | Input Price | Capabilities | +| ---------------------------------------------------- | ---------------- | ------- | ----------- | -------------- | +| doubao-seed-1-6 | aihubmix | โ€” | $0.09 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-flash | aihubmix | โ€” | $0.022 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-lite | aihubmix | โ€” | $0.041 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-thinking | aihubmix | โ€” | $0.09 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-8 | aihubmix | โ€” | $0.054795 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.0-flash | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.0-flash-exp | aihubmix | โ€” | $0.01 | ๐Ÿ“น in | +| gemini-2.0-flash-lite | aihubmix | โ€” | $0.038 | ๐Ÿ“น in | +| gemini-2.0-flash-search | aihubmix | โ€” | $0.05 | ๐Ÿ“น in | +| gemini-2.0-flash-thinking-exp-01-21 | aihubmix | โ€” | $0.038 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.0-pro-exp-02-05 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in | +| gemini-2.0-pro-exp-02-05-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in | +| gemini-2.5-flash | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-nothink | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-preview-09-2025 | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-preview-09-2025-nothink | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-nothink | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-preview-05-20-nothink | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| 
gemini-2.5-flash-preview-05-20-search | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-preview-09-2025 | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-search | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-exp-03-25 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro-preview-03-25-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-preview-05-06 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.5-pro-preview-05-06-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.5-pro-preview-06-05 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-preview-06-05-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-3.1-flash-lite-preview-nothink | aihubmix | โ€” | $0.125 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| glm-4.5v | aihubmix | โ€” | $0.137 | ๐Ÿ“น in | +| glm-4.6v | aihubmix | โ€” | $0.0685 | ๐Ÿ“น in | +| gme-qwen2-vl-2b-instruct | aihubmix | โ€” | $0.069 | ๐Ÿ“น in | +| kimi-k2.5 | aihubmix | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| mimo-v2-omni | aihubmix | โ€” | $0.22 | ๐Ÿ“น in | +| mimo-v2-pro | aihubmix | โ€” | $0.55 | ๐Ÿ“น in | +| qwen--qwen2.5-vl-32b-instruct | aihubmix | โ€” | $0.12 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen2.5-vl-72b-instruct | aihubmix | โ€” | $0.25 | ๐Ÿ“น in | +| qwen2-vl-72b-instruct | aihubmix | โ€” | $1.09 | ๐Ÿ“น in | +| qwen2-vl-7b-instruct | aihubmix | โ€” | $0.14 | ๐Ÿ“น in | +| qwen3-vl-235b-a22b-instruct | aihubmix | โ€” | $0.137 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-235b-a22b-thinking | aihubmix | โ€” | $0.137 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen3-vl-30b-a3b-instruct | aihubmix | โ€” | $0.0514 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-30b-a3b-thinking | aihubmix | โ€” | $0.0514 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen3-vl-flash | aihubmix | โ€” | $0.0103 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-flash-2026-01-22 | aihubmix | โ€” | $0.0103 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-plus | 
aihubmix | โ€” | $0.0685 | ๐Ÿ“น in ๐Ÿ”ง | +| veo-2.0-generate-001 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.0-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-fast-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-lite-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo3 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| amazon-nova-2.0-lite | amazon | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-2.0-omni | amazon | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-2.0-pro | amazon | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-lite | amazon | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-premier | amazon | โ€” | $2.5 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-pro | amazon | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-2-lite | amazon-bedrock | โ€” | $0.33 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-lite | amazon-bedrock | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-premier | amazon-bedrock | โ€” | $2.5 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-pro | amazon-bedrock | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-pro-latency-optimized | amazon-bedrock | โ€” | $1 | ๐Ÿ“น in ๐Ÿ”ง | +| seed-1.6 | bytedance | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-1.6-flash | bytedance | โ€” | $0.07 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-2.0-lite | bytedance | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-2.0-mini | bytedance | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--Kimi-K2.5-TEE | chutes | โ€” | $0.44 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--Kimi-K2.6-TEE | chutes | โ€” | $0.74 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3-flash-preview | fastrouter | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite-preview | fastrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview | fastrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it | fastrouter | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-1.5-flash | google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-1.5-flash-8b | 
google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-1.5-pro | google | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.0-flash | google | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.0-flash-lite | google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash | google | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-flash-lite | google | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro | google | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemma-3n-E2B-it | google | โ€” | โ€” | ๐Ÿ“น in | +| gemma-3n-E4B-it | google | โ€” | โ€” | ๐Ÿ“น in | +| veo-2.0-generate | google | โ€” | โ€” | ๐Ÿ“น out | +| gemini-2-5-flash | google-vertex | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2-5-flash-lite | google-vertex | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2-5-pro | google-vertex | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-1-flash-lite | google-vertex | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-flash | google-vertex | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-pro | google-vertex | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง | +| xiaomi--mimo-v2.5 | hpc-ai | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  ๐Ÿ”“ | +| cliptagger-12b | inferencenet | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”“ | +| MiniMax-Hailuo-02 | minimax | โ€” | โ€” | ๐Ÿ“น out | +| MiniMax-Hailuo-2.3 | minimax | โ€” | โ€” | ๐Ÿ“น out | +| MiniMax-Hailuo-2.3-Fast | minimax | โ€” | โ€” | ๐Ÿ“น out | +| baidu--ernie-4.5-vl-28b-a3b-thinking | novitaai | โ€” | $0.39 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--kimi-k2.5 | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--kimi-k2.6 | novitaai | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen2.5-vl-72b-instruct | novitaai | โ€” | $0.8 | ๐Ÿ“น in | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3-vl-235b-a22b-instruct | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-vl-235b-a22b-thinking | novitaai | โ€” | $0.98 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3-vl-30b-a3b-instruct | novitaai | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง | +| 
qwen--qwen3-vl-30b-a3b-thinking | novitaai | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-vl-8b-instruct | novitaai | โ€” | $0.08 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3.5-122b-a10b | novitaai | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-27b | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-35b-a3b | novitaai | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-397b-a17b | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-27b | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-35b-a3b | novitaai | โ€” | $0.248 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| zai-org--glm-4.5v | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| zai-org--glm-4.6v | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon--nova-2-lite-v1 | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-1.6 | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-1.6-flash | openrouter | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-2.0-lite | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-2.0-mini | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.0-flash-001 | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| google--gemini-2.0-flash-lite-001 | openrouter | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| google--gemini-2.5-flash | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-flash-lite | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-flash-lite-preview-09-2025 | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-pro | openrouter | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-pro-preview-05-06 | openrouter | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3-flash-preview | openrouter | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite-preview | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview | openrouter | โ€” | $2 | ๐Ÿ“น in 
๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview-customtools | openrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.5-flash | openrouter | โ€” | $1.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-26b-a4b-it | openrouter | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-26b-a4b-it--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it | openrouter | โ€” | $0.12 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| nvidia--nemotron-nano-12b-v2-vl--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| perceptron--perceptron-mk1 | openrouter | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿง  | +| qwen--qwen3.5-122b-a10b | openrouter | โ€” | $0.26 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-27b | openrouter | โ€” | $0.195 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-35b-a3b | openrouter | โ€” | $0.139 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-397b-a17b | openrouter | โ€” | $0.39 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-9b | openrouter | โ€” | $0.04 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-flash-02-23 | openrouter | โ€” | $0.065 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-plus-02-15 | openrouter | โ€” | $0.26 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-plus-20260420 | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-27b | openrouter | โ€” | $0.32 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-35b-a3b | openrouter | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-flash | openrouter | โ€” | $0.1875 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-plus | openrouter | โ€” | $0.325 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| rekaai--reka-edge | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| xiaomi--mimo-v2-omni | openrouter | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| xiaomi--mimo-v2.5 | openrouter | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| z-ai--glm-4.6v | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| z-ai--glm-5v-turbo | openrouter | โ€” | $1.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| 
~google--gemini-flash-latest | openrouter | โ€” | $1.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| ~google--gemini-pro-latest | openrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| hunyuan-turbos-vision-video | tencent | โ€” | $3 | ๐Ÿ“น in | +| yt-vita | tencent-tokenhub | โ€” | $1.2 | ๐Ÿ“น in | +| voyage-multimodal-3 | voyage | โ€” | $0.12 | ๐Ÿ“น in | +| voyage-multimodal-3.5 | voyage | โ€” | $0.12 | ๐Ÿ“น in | +| gemma-4-26b-a4b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-31b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-e2b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-e4b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| mimo-v2-omni | xiaomi | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง | +| mimo-v2.5 | xiaomi | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง | + +> ๐Ÿ’ก Use the [interactive catalog](https://i-need-token.github.io/ai-models/) to search and filter models with more criteria. + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. + +## Related Documentation + +- [Audio Models](audio-models.md) โ€” 118 audio input + 34 audio output models +- [Vision Models](vision-models.md) โ€” 1,487 vision models +- [Image Generation](image-generation.md) โ€” 28 image generation models +- [Modality Matrix](modality-matrix.md) โ€” all modalities at a glance +- [Model Selection Guide](model-selection.md) โ€” decision framework diff --git a/docs/vision-models.md b/docs/vision-models.md new file mode 100644 index 00000000..7d43b4e9 --- /dev/null +++ b/docs/vision-models.md @@ -0,0 +1,101 @@ +**English** | [ไธญๆ–‡](./zh/vision-models.md) + +# AI Vision Models + +1,487 models in this catalog accept image input (vision). This page highlights the most capable and cost-effective vision models for image understanding, document analysis, and visual reasoning. + +> All data sourced from first-party APIs and documentation. 
"Vision" means the model accepts image input; image generation is a separate capability. + +## Quick Stats + +| Capability | Vision Models | +| ------------------- | ------------: | +| Total vision models | 1,487 | +| Unique model IDs | 930 | +| With tool calling | 1,063 | +| With reasoning | 697 | +| Open-weight | 104 | + +## Cheapest Vision Models + +Best value for image understanding: + +| Model | Provider | Input $/1M | Output $/1M | Context | Tool Call | Reasoning | +| --------------------- | ----------- | ---------: | ----------: | ------- | --------- | --------- | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | โœ… | โœ… | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | โœ… | โœ… | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | โœ… | โœ… | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | โœ… | โœ… | +| Qwen 3.5 4B | Auriko | $0.03 | $0.15 | 262K | โœ… | โœ… | +| Qwen 3.5 4B | DeepInfra | $0.03 | $0.15 | 262K | โœ… | โœ… | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | โœ… | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | โœ… | โœ… | +| Llama 4 Maverick | Together AI | $0.15 | $0.60 | 1M | โœ… | โŒ | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | โœ… | โœ… | + +## Largest Context Vision Models + +For analyzing large documents, multi-page PDFs, or long image sequences: + +| Model | Context | Input $/1M | Tool Call | Reasoning | Providers | +| --------------------- | ------- | ---------: | --------- | --------- | --------: | +| Llama 4 Scout | 10M | $0.08 | โœ… | โŒ | 4 | +| Grok 4 Fast Reasoning | 2M | $0.20 | โœ… | โœ… | 2 | +| GPT-5.4 | 1M | $2.50 | โœ… | โœ… | 4 | +| Gemini 2.5 Pro | 1M | $1.25 | โœ… | โœ… | 4 | +| Gemini 2.5 Flash | 1M | $0.15 | โœ… | โœ… | 3 | +| DeepSeek Reasoner | 1M | $0.43 | โœ… | โœ… | 1 | +| GPT-4.1 | 1M | $2.00 | โœ… | โŒ | 4 | +| Llama 4 Maverick | 1M | $0.15 | โœ… | โŒ | 3 | + +## Best Vision + Tool Calling + Reasoning + +The most capable vision models โ€” can see, reason, and act: + 
+| Model | Context | Input $/1M | Providers | +| ----------------------- | ------- | ---------: | --------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5 (open-weight) | 1M | varies | 2 | +| Kimi K2.6 (open-weight) | 262K | varies | 4 | + +## Open-Weight Vision Models + +104 open-weight models accept image input — run vision AI on your own hardware: + +| Model | Context | Tool Call | Reasoning | Providers | +| ------------------ | ------- | --------- | --------- | --------: | +| MiMo V2.5 | 1M | ✅ | ✅ | 2 | +| Llama 4 Maverick | 1M | ✅ | ❌ | 3 | +| Llama 4 Scout | 10M | ✅ | ❌ | 2 | +| Gemma 4 31B IT | 1M | ✅ | ❌ | 3 | +| Qwen3.5 Flash | 1M | ✅ | ❌ | 1 | +| Kimi K2.6 | 262K | ✅ | ✅ | 4 | +| Gemma 4 26B A4B IT | 262K | ✅ | ✅ | 3 | +| Llama 4 Scout 17B | 328K | ✅ | ❌ | 4 | + +## Key Takeaways + +- **1,487 vision models** across 930 unique IDs — the largest vision model catalog available +- **Gemini 2.5 Flash** is the best value: 1M context, vision, tool calling, and reasoning for $0.15/1M +- **Llama 4 Scout** has the largest vision context at 10M tokens +- **Grok 4 Fast Reasoning** is the only model combining 2M context, vision, tool calling, and reasoning +- **104 open-weight vision models** available — run vision AI on your own infrastructure +- Small vision models (Qwen 3.5 0.8B–4B) cost as little as $0.01–$0.03/1M tokens + +## Related Documentation + +- [Model Selection Guide](model-selection.md) — decision framework for choosing models +- [Image Generation](image-generation.md) — 28 image generation models +- [Video Models](video-models.md) — 171 video models (167 input, 4 output) +- [Modality Matrix](modality-matrix.md) — all modalities at a glance +- [Free AI Models](free-models.md) — 81 free models, some with vision +- [OpenAI 
Alternatives](openai-alternatives.md) โ€” GPT-4 class alternatives with vision +- [Audio Models](audio-models.md) โ€” 118 audio input + 34 audio output models + +--- + +Data sourced from [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” structured YAML with pricing, context windows, and capabilities for 4,587+ models across 95 providers. diff --git a/docs/zh/agentic-models.md b/docs/zh/agentic-models.md new file mode 100644 index 00000000..c83aa7c8 --- /dev/null +++ b/docs/zh/agentic-models.md @@ -0,0 +1,97 @@ +[English](../agentic-models.md) | **ไธญๆ–‡** + +# ๆ™บ่ƒฝไฝ“ AI ๆจกๅž‹ โ€” 1,080 ไธช็”จไบŽ AI ๆ™บ่ƒฝไฝ“็š„ๆจกๅž‹ + +ๅ…ทๅค‡ **ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็†** ่ƒฝๅŠ›็š„ๆจกๅž‹ โ€” AI ๆ™บ่ƒฝไฝ“ใ€่‡ชไธปๅทฅไฝœๆตๅ’ŒๅคšๆญฅไปปๅŠกๆ‰ง่กŒ็š„ๆ ธๅฟƒๆž„ๅปบๅ—ใ€‚ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) ไธ€ๆ‰‹ APIใ€‚ + +## ไป€ไนˆไฝฟๆจกๅž‹ๆˆไธบ"ๆ™บ่ƒฝไฝ“"๏ผŸ + +ๆ™บ่ƒฝไฝ“ๆจกๅž‹ๅฏไปฅ๏ผš + +- **่ฐƒ็”จๅทฅๅ…ท/ๅ‡ฝๆ•ฐ** โ€” ไธŽ APIใ€ๆ•ฐๆฎๅบ“ๅ’Œๅค–้ƒจ็ณป็ปŸไบคไบ’ +- **้€ๆญฅๆŽจ็†** โ€” ่ง„ๅˆ’ใ€ๅˆ†่งฃไปปๅŠกๅ’Œ้ชŒ่ฏ็ป“ๆžœ +- **่‡ชไธป่กŒๅŠจ** โ€” ๆ— ้œ€ไบบๅทฅๅนฒ้ข„ๅณๅฏๅšๅ‡บๅ†ณ็ญ–ๅ’Œ้‡‡ๅ–่กŒๅŠจ + +่ฟ™ไบ›่ƒฝๅŠ›ๆ˜ฏ่Šๅคฉๆœบๅ™จไบบๅ’Œ AI ๆ™บ่ƒฝไฝ“็š„ๅ…ณ้”ฎๅŒบๅˆซใ€‚ + +## ็ปŸ่ฎก + +| Metric | Count | +| ---------------------- | ----- | +| Agentic models | 1076 | +| Providers | 51 | +| With vision | 617 | +| With structured output | 453 | +| Free | 30 | +| Open weights | 64 | + +## ๆœ€ไพฟๅฎœ็š„ๆ™บ่ƒฝไฝ“ๆจกๅž‹๏ผˆ็›ด่ฟžๆไพ›ๅ•†๏ผ‰ + +| Model | Provider | Context | Input $/1M | Output $/1M | Vision | +| ------------------------------ | ------------ | ------- | ---------- | ----------- | ------ | +| qwen--qwen3-4b-fp8 | novitaai | 125K | $0.03 | $0.03 | | +| openai--gpt-oss-20b | neuralwatt | 0 | $0.03 | $0.16 | | +| openai--gpt-oss-120b | novitaai | 128K | $0.05 | $0.25 | โœ… | +| gpt-oss-120b | inferencenet | 128K | $0.05 | $0.45 | | +| Qwen--Qwen3.6-35B-A3B | neuralwatt | 0 | $0.05 | $0.1 | โœ… | +| qwen3-30b-a3b-fp8 | cloudflare 
| 40K | $0.051 | $0.335 | | +| glm-4.7-flash | cloudflare | 128K | $0.06 | $0.4 | | +| Nemotron-3-Nano-Omni | nebius | 125K | $0.06 | $0.24 | โœ… | +| hermes-4-llama-3.1-8b | nousresearch | 128K | $0.06 | $0.12 | | +| zai-org--glm-4.7-flash | novitaai | 195K | $0.07 | $0.4 | | +| ring-2.6-1t | inclusionai | 256K | $0.07 | $0.62 | | +| seed-1.6-flash | bytedance | 256K | $0.07 | $0.3 | โœ… | +| microsoft-phi-4-mini-reasoning | microsoft | 125K | $0.075 | $0.3 | | +| Qwen--Qwen3-32B-TEE | chutes | 40K | $0.08 | $0.24 | | +| qwen--qwen3-30b-a3b-fp8 | novitaai | 40K | $0.09 | $0.45 | | + +## ๅ…่ดนๆ™บ่ƒฝไฝ“ๆจกๅž‹ + +| Model | Provider | Context | Vision | Structured Output | +| --------------------------------- | -------- | ------- | ------ | ----------------- | +| glm-4.1v-thinking-flash | zhipuai | 62K | โœ… | โœ… | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | 64K | โœ… | โœ… | +| qwen--qwen3.5-4b-free | mixlayer | 128K | | | + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡ๆ™บ่ƒฝไฝ“ๆจกๅž‹ + +| Model | Provider | Context | Input $/1M | Output $/1M | +| --------------------------- | ----------- | ------- | ---------- | ----------- | +| deepseek-v4-flash | baidu | 1024K | $0.126 | $0.252 | +| deepseek-v4-pro | siliconflow | 1024K | $1.74 | $3.48 | +| deepseek-v4-flash | siliconflow | 1024K | $0.14 | $0.28 | +| deepseek--deepseek-v4-pro | novitaai | 1024K | $1.67 | $3.38 | +| xiaomimimo--mimo-v2.5-pro | novitaai | 1024K | $2 | $6 | +| deepseek--deepseek-v4-flash | novitaai | 1024K | $0.14 | $0.28 | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | +| gemini-2.5-pro | google | 1024K | $1.25 | $10 | +| deepseek-v4-pro | fireworks | 1024K | $1.74 | $3.48 | +| xiaomi--mimo-v2.5-pro | hpc-ai | 1024K | $1 | $3 | +| xiaomi--mimo-v2.5 | hpc-ai | 1024K | $0.4 | $2 | +| mimo-v2.5-pro | xiaomi | 1024K | $1 | $3 | +| mimo-v2-pro | xiaomi | 1024K | $1 | $3 | +| minimaxai--minimax-m1-80k | novitaai | 976K | $0.55 | $2.2 | +| qwen3.6-flash | alibaba | 976K | $1.2 | $7.2 | + +## ๆž„ๅปบ AI ๆ™บ่ƒฝไฝ“ + +| 
Agent Type | Recommended Models | Key Capabilities | +| ---------------- | --------------------------- | ------------------------------ | +| Code agents | Claude Sonnet 4, GPT-4.1 | Tool call + reasoning + code | +| Research agents | Gemini 2.5 Pro, DeepSeek R1 | Large context + reasoning | +| Data agents | Claude Sonnet 4, Qwen3 | Structured output + tool call | +| Vision agents | GPT-4o, Gemini 2.5 Flash | Vision + tool call + reasoning | +| Customer support | Llama 4 Scout, Qwen3 | Free/cheap + tool call | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [Structured Output](structured-output.md) โ€” 829 models with JSON mode +- [OpenAI Alternatives](openai-alternatives.md) โ€” GPT-4 alternatives with agent capabilities +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Free AI Models](free-models.md) โ€” 81 models at zero cost + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/ai-model-picker.md b/docs/zh/ai-model-picker.md new file mode 100644 index 00000000..f72287cd --- /dev/null +++ b/docs/zh/ai-model-picker.md @@ -0,0 +1,64 @@ +# AI ๆจกๅž‹้€‰ๆ‹ฉๅ™จ + +ๅ›ž็ญ” 4 ไธช็ฎ€ๅ•้—ฎ้ข˜๏ผŒๆ‰พๅˆฐๆœ€้€‚ๅˆไฝ ็”จไพ‹็š„ AI ๆจกๅž‹ใ€‚ + +**[่ฏ•็”จไบคไบ’ๅผ้€‰ๆ‹ฉๅ™จ โ†’](https://i-need-token.github.io/ai-models/ai-model-picker.html)** + +## ๅทฅไฝœๅŽŸ็† + +AI ๆจกๅž‹้€‰ๆ‹ฉๅ™จไผš้—ฎไฝ ๅ››ไธช้—ฎ้ข˜๏ผš + +1. **ไฝ ๅœจๆž„ๅปบไป€ไนˆ๏ผŸ** โ€” AI ไปฃ็†ใ€ไปฃ็ ็”Ÿๆˆใ€ๅฏน่ฏ/RAGใ€ๆ•ฐๅญฆๆŽจ็†ใ€่ง†่ง‰/ๅคšๆจกๆ€ใ€ๆˆ–ๅคง่ง„ๆจก็”Ÿไบง +2. **ไฝ ็š„้ข„็ฎ—ๆ˜ฏๅคšๅฐ‘๏ผŸ** โ€” ๅ…่ดนใ€ไฝŽไบŽ $0.10/M tokenใ€ไฝŽไบŽ $1/Mใ€ๆˆ–้ซ˜็ซฏ +3. **ไฝ ้œ€่ฆๅคšๅฐ‘ไธŠไธ‹ๆ–‡๏ผŸ** โ€” ไฝŽไบŽ 32Kใ€32Kโ€“128Kใ€128Kโ€“512Kใ€ๆˆ– 512K+ +4. 
**ไป€ไนˆๆœ€้‡่ฆ๏ผŸ** โ€” ๆœ€ไฝŽๆˆๆœฌใ€ๆœ€ไฝณ่ดจ้‡ใ€ๆœ€ไฝŽๅปถ่ฟŸใ€ๆˆ–้š็ง/ๆœฌๅœฐ้ƒจ็ฝฒ + +ๆ นๆฎไฝ ็š„ๅ›ž็ญ”๏ผŒ้€‰ๆ‹ฉๅ™จๅฏน 95 ไธชๆไพ›ๅ•†็š„ 4,587+ ๆจกๅž‹่ฟ›่กŒ่ฏ„ๅˆ†ๅ’ŒๆŽ’ๅ๏ผŒๆŒ‰้ข„็ฎ—ๅ’ŒไธŠไธ‹ๆ–‡้œ€ๆฑ‚่ฟ‡ๆปค๏ผŒ็„ถๅŽๆŒ‰็”จไพ‹ๅ’Œไผ˜ๅ…ˆ็บงๅŠ ๆƒใ€‚ + +## ่ฏ„ๅˆ†้€ป่พ‘ + +| ็”จไพ‹ | ๅ…ณ้”ฎ่ƒฝๅŠ› | ๆƒ้‡ | +| ----------- | ----------------------------------------- | ------------------ | +| AI ไปฃ็† | ๅทฅๅ…ท่ฐƒ็”จ (+10)ใ€ๆŽจ็† (+5) | ๆ˜‚่ดตๆจกๅž‹ๆœ‰ๆˆๆœฌๆƒฉ็ฝš | +| ไปฃ็ ็”Ÿๆˆ | ๅทฅๅ…ท่ฐƒ็”จ (+8)ใ€ๆŽจ็† (+5)ใ€็ป“ๆž„ๅŒ–่พ“ๅ‡บ (+3) | โ€” | +| ๅฏน่ฏ/RAG | ๅคงไธŠไธ‹ๆ–‡ (+5)ใ€ๅทฅๅ…ท่ฐƒ็”จ (+3) | โ€” | +| ๆ•ฐๅญฆๆŽจ็† | ๆŽจ็† (+10)ใ€ๅทฅๅ…ท่ฐƒ็”จ (+3) | โ€” | +| ่ง†่ง‰/ๅคšๆจกๆ€ | ๅ›พๅƒ่พ“ๅ…ฅ (+10)ใ€ๅทฅๅ…ท่ฐƒ็”จ (+3) | โ€” | +| ๅคง่ง„ๆจก็”Ÿไบง | ๅทฅๅ…ท่ฐƒ็”จ (+5) | ๆˆๆœฌๆƒฉ็ฝšๆ”พๅคง 5 ๅ€ | + +่šๅˆๆไพ›ๅ•†๏ผˆOpenRouterใ€Requesty ็ญ‰๏ผ‰่ขซๆŽ’้™คไปฅ้ฟๅ…้‡ๅคๆจกๅž‹ๆก็›ฎใ€‚ + +## ๅฟซ้€ŸๆŽจ่ + +### ๆŒ‰็”จไพ‹็š„ๆœ€ไฝณๅ…่ดนๆจกๅž‹ + +| ็”จไพ‹ | ้ฆ–้€‰ | ๅŽŸๅ›  | +| -------- | ------------------------ | ---------------------- | +| AI ไปฃ็† | DeepSeek V4 Flash (ๅ…่ดน) | ๅทฅๅ…ท่ฐƒ็”จ + 1M ไธŠไธ‹ๆ–‡ | +| ไปฃ็ ็”Ÿๆˆ | Qwen3 Coder (ๅ…่ดน) | ๅทฅๅ…ท่ฐƒ็”จ + 1M ไธŠไธ‹ๆ–‡ | +| ๅฏน่ฏ/RAG | DeepSeek V4 Flash (ๅ…่ดน) | 1M ไธŠไธ‹ๆ–‡็ช—ๅฃ | +| ๆŽจ็† | DeepSeek R1 (ๅ…่ดน) | 92% MATH-500๏ผŒๆŽจ็†่ƒฝๅŠ› | +| ่ง†่ง‰ | โ€” | ๅ…่ดน่ง†่ง‰้€‰้กนๆœ‰้™ | + +### ๆœ€ไฝณ้ข„็ฎ—ๆจกๅž‹๏ผˆไฝŽไบŽ $0.10/M๏ผ‰ + +| ็”จไพ‹ | ้ฆ–้€‰ | ไปทๆ ผ | +| -------- | -------------- | --------------- | +| AI ไปฃ็† | ling-2.6-flash | $0.01/$0.03/M | +| ไปฃ็ ็”Ÿๆˆ | bdc-coder | $0.01/$0.01/M | +| ๆŽจ็† | qwen3.5-0.8b | $0.01/$0.05/M | +| ้€š็”จ | Mistral Nemo | $0.008/$0.001/M | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅ…่ดนๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๅฎŒๆ•ดๅˆ—่กจ +- [ไปทๆ ผๆฏ”่พƒ](pricing-comparison.md) โ€” ่ทจๆ‰€ๆœ‰ๆไพ›ๅ•†ๆฏ”่พƒๆˆๆœฌ +- [ๅทฅๅ…ท่ฐƒ็”จ](tool-calling.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆŽจ็†ๆจกๅž‹ 
+- [ไธŠไธ‹ๆ–‡็ช—ๅฃ](context-windows.md) โ€” ๆฏ”่พƒไธŠไธ‹ๆ–‡็ช—ๅฃๅคงๅฐ +- [ๆจกๅž‹้€‰ๆ‹ฉ้€ŸๆŸฅ่กจ](model-selection-cheatsheet.md) โ€” ๅ†ณ็ญ–ๆ ‘ๅ’Œ้ข„็ฎ—่กจ +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” ๅผ€ๅง‹ไฝฟ็”จ็›ฎๅฝ• + +## ๆ•ฐๆฎๆฅๆบ + +ๆ‰€ๆœ‰ๆ•ฐๆฎๅ‡ๆฅ่‡ช็ฌฌไธ€ๆ–น API ๅ’Œๅฎ˜ๆ–นๆ–‡ๆกฃใ€‚่ฏฆ่ง[ๆ•ฐๆฎ่Žทๅ–](data-acquisition.md)ใ€‚ diff --git a/docs/zh/api.md b/docs/zh/api.md new file mode 100644 index 00000000..5d19645f --- /dev/null +++ b/docs/zh/api.md @@ -0,0 +1,222 @@ +[English](../api.md) | **ไธญๆ–‡** + +# API ไธŽ็ผ–็จ‹่ฎฟ้—ฎ + +ๅœจไฝ ็š„ๅบ”็”จไธญไฝฟ็”จ็›ฎๅฝ•ๆ•ฐๆฎใ€‚ + +## npm ๅŒ… + +ๅฐ†็›ฎๅฝ•ไฝœไธบ npm ไพ่ต–ๅฎ‰่ฃ…๏ผš + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 ไธชๆจกๅž‹ JSON +import type { Model } from "ai-models"; // TypeScript ็ฑปๅž‹ + +// ๆŸฅๆ‰พๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จไธ”่พ“ๅ…ฅไปทๆ ผไฝŽไบŽ $1/1M ็š„ๆจกๅž‹ +const affordable = catalog.models.filter((m) => m.tool_call && m.pricing.input < 1); +``` + +ๅŒ…ๅ†…ๅฎนๅŒ…ๆ‹ฌ๏ผš + +- `dist/models.json` โ€” ๅฎŒๆ•ด็›ฎๅฝ• JSON +- `dist/index.d.ts` โ€” TypeScript ็ฑปๅž‹ๅฎšไน‰ +- `types/` โ€” ๆบ็ฑปๅž‹ๅฎšไน‰๏ผˆModelใ€Snapshotใ€Providerใ€Pricing๏ผ‰ + +## CDN ่ฎฟ้—ฎ๏ผˆๆ— ้œ€ๅฎ‰่ฃ…๏ผ‰ + +็ผ–่ฏ‘ๅŽ็š„ JSON ๅฏ้€š่ฟ‡ [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models) ่ฎฟ้—ฎ โ€” ๆ— ้œ€ไธ‹่ฝฝๆˆ–ๅฎ‰่ฃ…ใ€‚CDN ่‡ชๅŠจๆไพ›ๆœ€ๆ–ฐ็š„ npm ๅ‘ๅธƒ็‰ˆๆœฌ๏ผš + +```html + + +``` + +```bash +# ็›ดๆŽฅ curl๏ผˆๅง‹็ปˆๆœ€ๆ–ฐ๏ผ‰ +curl -s https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' + +# ้”ๅฎš็‰นๅฎš็‰ˆๆœฌ +curl -s https://github.com/i-need-token/ai-models/releases/download/v0.1.0/models.json | jq '.stats' +``` + +```python +# Python โ€” ๆ— ้œ€ pip install +import urllib.request, json +catalog = json.loads(urllib.request.urlopen("https://github.com/i-need-token/ai-models/releases/latest/download/models.json").read()) +print(len(catalog["models"])) # 4587 +``` + +```go +// Go โ€” ๆ— ้œ€ไพ่ต– +resp, err := 
http.Get("https://github.com/i-need-token/ai-models/releases/latest/download/models.json") +``` + +### CDN ไธŽ GitHub Releases ๅฏนๆฏ” + +| ็‰นๆ€ง | jsDelivr CDN | GitHub Releases | +| ---------- | ------------------------------------------- | --------------------------------------------- | +| URL ็จณๅฎšๆ€ง | `cdn.jsdelivr.net/npm/ai-models@latest/...` | `github.com/.../releases/latest/download/...` | +| CORS | โœ… ๆ”ฏๆŒ โ€” ๅฏๅœจๆต่งˆๅ™จไธญไฝฟ็”จ | โŒ ไธๆ”ฏๆŒ โ€” ไป…ไธ‹่ฝฝ | +| ็ผ“ๅญ˜ | 7 ๅคฉ๏ผˆ็‰ˆๆœฌๅŒ–๏ผ‰๏ผŒ5 ๅˆ†้’Ÿ๏ผˆ`@latest`๏ผ‰ | ๆ— ็ผ“ๅญ˜ | +| ้€Ÿๅบฆ | ๅ…จ็ƒ CDN๏ผŒ300+ ่พน็ผ˜่Š‚็‚น | GitHub CDN | +| ้€‚็”จๅœบๆ™ฏ | Web ๅบ”็”จใ€ๆต่งˆๅ™จ่„šๆœฌใ€ๅฟซ้€ŸๅŽŸๅž‹ | CLI ๅทฅๅ…ทใ€CI/CDใ€ๆ‰นๅค„็† | + +## ็ผ–่ฏ‘ JSON + +ๆ‰€ๆœ‰ๆจกๅž‹ๆ•ฐๆฎๅฏไปฅไปŽ [GitHub Releases](https://github.com/i-need-token/ai-models/releases/latest) ไธ‹่ฝฝ๏ผŒๆไพ›ไธค็งๆ ผๅผ๏ผš + +| ๆ–‡ไปถ | ๆ ผๅผ | ๅคงๅฐ | ้€‚็”จๅœบๆ™ฏ | +| ------------- | ---- | ------- | ------------------------------ | +| `models.json` | JSON | ~2.3 MB | ็ผ–็จ‹่ฎฟ้—ฎใ€Web ๅบ”็”จใ€TypeScript | +| `models.csv` | CSV | ~560 KB | Excelใ€Google Sheetsใ€ๆ•ฐๆฎๅˆ†ๆž | +| `stats.json` | JSON | ~1 KB | ็›ฎๅฝ•็ปŸ่ฎกๆ‘˜่ฆ | + +ไนŸๅฏๅœจ [Hugging Face Datasets](https://huggingface.co/datasets/i-need-token/ai-models) ไธŠ่Žทๅ–๏ผŒๆ–นไพฟๆœบๅ™จๅญฆไน ็คพๅŒบไฝฟ็”จใ€‚ + +```bash +# ไธ‹่ฝฝ JSON๏ผˆๅฎŒๆ•ดๅ…ƒๆ•ฐๆฎ๏ผ‰ +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# ไธ‹่ฝฝ CSV๏ผˆ้€‚ๅˆ็”ตๅญ่กจๆ ผ๏ผ‰ +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv + +# ็‰นๅฎš็‰ˆๆœฌ +curl -LO https://github.com/i-need-token/ai-models/releases/download/v0.1.0/models.json +``` + +### ๆœฌๅœฐ็ผ–่ฏ‘ + +```bash +npm install +npx tsx scripts/compile.ts +# ่พ“ๅ‡บ๏ผšdist/models.json (2.3 MB) +``` + +### JSON ็ป“ๆž„ + +```json +{ + "generated_at": "2026-05-21T02:13:04.076Z", + "stats": { + "providers": 95, + "models": 4587, + "unique_model_ids": 2712, + "families": 441 + 
}, + "providers": { + "openai": { "name": "OpenAI", "model_count": 28 }, + "anthropic": { "name": "Anthropic", "model_count": 11 } + }, + "models": [ + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "family": "gpt-4.1", + "provider": "openai", + "tool_call": true, + "structured_output": true, + "pricing": { "currency": "USD", "input": 2, "output": 8, "cache_read": 0.5 }, + "limit": { "context": 1047576, "output": 32768 }, + "modalities": { "input": ["text", "image"], "output": ["text"] } + } + ] +} +``` + +### ไฝฟ็”จ็คบไพ‹ + +**JavaScript/TypeScript๏ผš** + +```javascript +const catalog = require("./models.json"); + +// ๆŸฅๆ‰พๆ‰€ๆœ‰ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จไธ”่พ“ๅ…ฅไปทๆ ผไฝŽไบŽ $1/1M token ็š„ๆจกๅž‹ +const cheap = catalog.models.filter( + (m) => m.tool_call && m.pricing?.input < 1 && m.pricing?.currency === "USD", +); + +// ๆŸฅๆ‰พๆฏไธชๆไพ›ๅ•†ๆœ€ไพฟๅฎœ็š„ๆจกๅž‹ +const byProvider = {}; +for (const m of catalog.models) { + if (!m.pricing?.input) continue; + if (!byProvider[m.provider] || m.pricing.input < byProvider[m.provider].pricing.input) { + byProvider[m.provider] = m; + } +} + +// ่Žทๅ–ๆ‰€ๆœ‰่ง†่ง‰ๆจกๅž‹ +const vision = catalog.models.filter((m) => m.modalities?.input?.includes("image")); +``` + +**Python๏ผš** + +```python +import json + +with open("models.json") as f: + catalog = json.load(f) + +# ๆŸฅๆ‰พๆ‰€ๆœ‰ๆŽจ็†ๆจกๅž‹ +reasoning = [m for m in catalog["models"] if m.get("reasoning")] + +# ๆŸฅๆ‰พไธŠไธ‹ๆ–‡็ช—ๅฃๆœ€ๅคง็š„ๆจกๅž‹ +by_context = sorted( + catalog["models"], + key=lambda m: (m.get("limit", {}) or {}).get("context", 0), + reverse=True, +)[:10] +``` + +## ๅ•ไธช YAML ๆ–‡ไปถ + +ๅฏนไบŽๅ•ไธชๆจกๅž‹็š„็ฑปๅž‹ๅฎ‰ๅ…จ่ฎฟ้—ฎ๏ผŒ็›ดๆŽฅไฝฟ็”จ YAML ๆ–‡ไปถ้…ๅˆ Zod ๆ ก้ชŒ๏ผš + +```typescript +import { ModelSchema } from "./types/schemas"; +import { parse } from "yaml"; +import { readFileSync } from "fs"; + +const raw = readFileSync("providers/openai/models/gpt-4.1.yaml", "utf-8"); +const model = ModelSchema.parse(parse(raw)); // ่ฟ่กŒๆ—ถๆ ก้ชŒ + 
+console.log(model.pricing); // { input: 2, output: 8, cache_read: 0.5 } +``` + +## CLI ๅทฅๅ…ท + +```bash +# ้ชŒ่ฏๆ‰€ๆœ‰ YAML ๆ•ฐๆฎ +npx tsx scripts/validate.ts + +# ่ฎก็ฎ—็›ฎๅฝ•็ปŸ่ฎก +npx tsx scripts/stats.ts # ่กจๆ ผๆ ผๅผ +npx tsx scripts/stats.ts json # JSON ๆ ผๅผ + +# ็ผ–่ฏ‘ไธบ models.json +npx tsx scripts/compile.ts + +# ไปŽๆไพ›ๅ•†ๅŒๆญฅๆ•ฐๆฎ +npx tsx scripts/sync.ts openai # ๅ•ไธชๆไพ›ๅ•† +npx tsx scripts/sync.ts # ๆ‰€ๆœ‰ๆไพ›ๅ•† +``` + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” 30 ็ง’ๅ†…ๆ‰พๅˆฐ้€‚ๅˆ็š„ๆจกๅž‹ +- [ไปฃ็ ็คบไพ‹](code-examples.md) โ€” TypeScriptใ€Pythonใ€Goใ€Rustใ€jq +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผๅ‚่€ƒ +- [ๅธธ่ง้—ฎ้ข˜](faq.md) โ€” ๅธธ่ง้—ฎ้ข˜ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅ†ณ็ญ–ๆก†ๆžถ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/audio-models.md b/docs/zh/audio-models.md new file mode 100644 index 00000000..24379b44 --- /dev/null +++ b/docs/zh/audio-models.md @@ -0,0 +1,83 @@ +[English](../audio-models.md) | **ไธญๆ–‡** + +# ้Ÿณ้ข‘ AI ๆจกๅž‹ โ€” ่ฏญ้Ÿณใ€ๅฃฐ้Ÿณๅ’Œ้Ÿณ้ข‘็†่งฃ + +ๅ…ทๅค‡ **้Ÿณ้ข‘่พ“ๅ…ฅ**๏ผˆ่ฏญ้Ÿณ่ฏ†ๅˆซใ€่ฏญ้Ÿณ็†่งฃ๏ผ‰ๅ’Œ **้Ÿณ้ข‘่พ“ๅ‡บ**๏ผˆๆ–‡ๆœฌ่ฝฌ่ฏญ้Ÿณใ€่ฏญ้Ÿณ็”Ÿๆˆ๏ผ‰่ƒฝๅŠ›็š„ๆจกๅž‹ใ€‚ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) ไธ€ๆ‰‹ APIใ€‚ + +## ็ปŸ่ฎก + +| Metric | Count | +| ------------------- | ----- | +| Audio input models | 115 | +| Audio output models | 34 | +| Total audio models | 133 | +| Providers | 20 | +| With tool calling | 69 | +| Free | 8 | + +## ้Ÿณ้ข‘่พ“ๅ…ฅๆจกๅž‹๏ผˆ่ฏญ้Ÿณ/ๅฃฐ้Ÿณ็†่งฃ๏ผ‰ + +ๅฏไปฅๅค„็†้Ÿณ้ข‘่พ“ๅ…ฅ็š„ๆจกๅž‹ โ€” ่ฝฌๅฝ•่ฏญ้Ÿณใ€ๅˆ†ๆž้Ÿณ้ข‘ใ€็†่งฃ่ฏญ้Ÿณๅ‘ฝไปค๏ผš + +| Model | Provider | Context | Input $/1M | Output $/1M | Tool Call | +| ------------------------------- | -------------- | ------- | ---------- | 
----------- | --------- | +| mistral-voxtral-mini | amazon-bedrock | 125K | $0.04 | $0.04 | | +| voxtral-mini | mistral | 125K | $0.04 | $0.04 | | +| gemini-2.0-flash-lite | google | 1024K | $0.075 | $0.3 | โœ… | +| gemini-2-0-flash-lite | google-vertex | 1024K | $0.075 | $0.3 | โœ… | +| microsoft-phi-4-mini-multimodal | microsoft | 125K | $0.08 | $0.32 | โœ… | +| gemini-2.0-flash | google | 1024K | $0.1 | $0.4 | โœ… | +| gemini-2.5-flash-lite | google | 1024K | $0.1 | $0.4 | โœ… | +| mistral-voxtral-small | amazon-bedrock | 125K | $0.1 | $0.3 | | +| voxtral-small | mistral | 125K | $0.1 | $0.3 | | +| amazon-nova-2.0-lite | amazon | 62K | $0.15 | $1.25 | โœ… | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | โœ… | +| gemini-2-0-flash | google-vertex | 1024K | $0.15 | $0.6 | โœ… | +| voxtral-small-24b-2507 | scaleway | 128K | $0.15 | $0.35 | | +| amazon-nova-2.0-omni | amazon | 62K | $0.2 | $1.3 | โœ… | +| xiaomi--mimo-v2.5 | hpc-ai | 1024K | $0.4 | $2 | โœ… | + +## ้Ÿณ้ข‘่พ“ๅ‡บๆจกๅž‹๏ผˆๆ–‡ๆœฌ่ฝฌ่ฏญ้Ÿณ/่ฏญ้Ÿณ็”Ÿๆˆ๏ผ‰ + +ๅฏไปฅ็”Ÿๆˆ้Ÿณ้ข‘่พ“ๅ‡บ็š„ๆจกๅž‹ โ€” ๆ–‡ๆœฌ่ฝฌ่ฏญ้Ÿณใ€่ฏญ้Ÿณๅˆๆˆ๏ผš + +| Model | Provider | Input $/1M | Output $/1M | +| ---------------------- | -------- | ---------- | ----------- | +| gpt-4o-audio | openai | $2.5 | $10 | +| gpt-4o-realtime | openai | $5 | $20 | +| step-audio-2 | stepfun | $10 | $70 | +| stepaudio-2.5-realtime | stepfun | $10 | $70 | +| o1-realtime | openai | $15 | $60 | +| step-1o-audio | stepfun | $25 | $60 | + +## ๅ…่ดน้Ÿณ้ข‘ๆจกๅž‹ + +| Model | Provider | Audio In | Audio Out | Context | +| --------------------------------- | -------- | -------- | --------- | ------- | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | โœ… | โœ… | 64K | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | โœ… | | 64K | +| gemma-3n-E2B-it | google | โœ… | | 128K | +| gemma-3n-E4B-it | google | โœ… | | 128K | +| step-audio-r1.1 | stepfun | โœ… | โœ… | 0 | + +## ้€‰ๆ‹ฉ้Ÿณ้ข‘ๆจกๅž‹ + +| Use Case | Recommended | Key Feature | +| 
------------------- | ------------------------- | ------------------------- | +| Voice assistants | GPT-4o-audio | Audio in/out + tool call | +| Transcription | Whisper, Gemini 2.5 Flash | Fast, cheap audio input | +| Voice agents | GPT-4o-realtime | Real-time audio streaming | +| Text-to-speech | OpenAI TTS, ElevenLabs | Natural voice output | +| Multilingual speech | Gemini 2.5 Pro | 100+ languages | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [Multimodal Models](multimodal-models.md) โ€” 1,519 models with image/audio/video +- [Vision Models](vision-models.md) โ€” 1,487 models with image understanding +- [Chat Models](chat-models.md) โ€” 2,350 models with tool calling +- [Tool Calling Models](tool-calling.md) โ€” function calling capabilities +- [Free AI Models](free-models.md) โ€” 81 models at zero cost + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/benchmarks.md b/docs/zh/benchmarks.md new file mode 100644 index 00000000..4c11dd1c --- /dev/null +++ b/docs/zh/benchmarks.md @@ -0,0 +1,109 @@ +# AI ๆจกๅž‹ๅŸบๅ‡†ๆต‹่ฏ•ไธŽๆŽ’่กŒๆฆœ + +[English](../benchmarks.md) + +AI ๆจกๅž‹ๅฆ‚ไฝ•่ขซ่ฏ„ไผฐ โ€” ๅ…ณ้”ฎๅŸบๅ‡†ๆต‹่ฏ•ใ€ๆŽ’่กŒๆฆœๆ ผๅฑ€๏ผŒไปฅๅŠ่ฟ™ไบ›ๆ•ฐๅญ—ๅฏนๆจกๅž‹้€‰ๆ‹ฉ็š„ๆ„ไน‰ใ€‚ + +ๆ•ฐๆฎๆฅๆบ๏ผš[AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆๅŸบๅ‡†ๆต‹่ฏ•ๅพˆ้‡่ฆ + +ๅŸบๅ‡†ๆต‹่ฏ•ๆไพ›ไบ†่ทจไปปๅŠกๆฏ”่พƒ AI ๆจกๅž‹็š„ๆ ‡ๅ‡†ๅŒ–ๆ–นๅผใ€‚็„ถ่€Œ๏ผŒๆฒกๆœ‰ไปปไฝ•ๅ•ไธ€ๅŸบๅ‡†ๆต‹่ฏ•่ƒฝ่ฏดๆ˜Žๅ…จ้ƒจ้—ฎ้ข˜ใ€‚ๆœฌๆŒ‡ๅ—ๆถต็›–ไธป่ฆๅŸบๅ‡†ๆต‹่ฏ•ใ€ๅฆ‚ไฝ•่งฃ่ฏปๅฎƒไปฌ๏ผŒไปฅๅŠๅฆ‚ไฝ•ๅฐ†ๅฎƒไปฌไธŽๆˆ‘ไปฌ็š„็›ฎๅฝ•ๆ•ฐๆฎ๏ผˆๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃใ€่ƒฝๅŠ›๏ผ‰็ป“ๅˆไฝฟ็”จ๏ผŒไปฅๅšๅ‡บๆ˜Žๆ™บ็š„ๆจกๅž‹้€‰ๆ‹ฉใ€‚ + +## ไธป่ฆๅŸบๅ‡†ๆต‹่ฏ• + +### ้€š็”จ่ฏญ่จ€็†่งฃ + +| ๅŸบๅ‡†ๆต‹่ฏ• | ๆต‹่ฏ•ๅ†…ๅฎน | ้กถ็บงๆจกๅž‹ | ๅค‡ๆณจ | +| --------- | ---------------------- | -------------------------------------- | 
-------------------------------- | +| MMLU | ๅคšไปปๅŠก็Ÿฅ่ฏ†๏ผˆ57ไธชๅญฆ็ง‘๏ผ‰ | GPT-4.1, Claude Opus 4, Gemini 2.5 Pro | ๆ ‡ๅ‡†ๅญฆๆœฏๅŸบๅ‡†๏ผ›ๅฏ่ƒฝไธๅๆ˜ ๅฎž้™…ไฝฟ็”จ | +| MMLU-Pro | ๆ›ด้šพ็š„ MMLU๏ผŒ้œ€่ฆๆŽจ็† | o3, Claude Sonnet 4, Gemini 2.5 Pro | ๆ›ดๅ…ทๆŒ‘ๆˆ˜ๆ€ง็š„็‰ˆๆœฌ | +| GPQA | ็ ”็ฉถ็”Ÿๆฐดๅนณ็ง‘ๅญฆ้—ฎ็ญ” | o3, Gemini 2.5 Pro | ไธ“ๅฎถ็บงๆŽจ็† | +| HellaSwag | ๅธธ่ฏ†ๆŽจ็† | ๅคงๅคšๆ•ฐๅ‰ๆฒฟๆจกๅž‹ๆŽฅ่ฟ‘ๆปกๅˆ† | ๆŽฅ่ฟ‘้ฅฑๅ’Œ | + +### ๆŽจ็†ไธŽๆ•ฐๅญฆ + +| ๅŸบๅ‡†ๆต‹่ฏ• | ๆต‹่ฏ•ๅ†…ๅฎน | ้กถ็บงๆจกๅž‹ | ๅค‡ๆณจ | +| ------------- | -------- | --------------------------- | ------------------ | +| MATH-500 | ็ซž่ต›ๆ•ฐๅญฆ | o3, DeepSeek R1, Qwen3-235B | ้‡ๅŒ–ไปปๅŠก็š„ๅ…ณ้”ฎๆŒ‡ๆ ‡ | +| AIME 2024 | ๆ•ฐๅญฆ็ซž่ต› | o3, DeepSeek R1 | ้žๅธธๆœ‰ๆŒ‘ๆˆ˜ๆ€ง | +| GSM8K | ๅฐๅญฆๆ•ฐๅญฆ | ๅคงๅคšๆ•ฐๆจกๅž‹ >90% | ๆŽฅ่ฟ‘้ฅฑๅ’Œ | +| ARC-Challenge | ็ง‘ๅญฆๆŽจ็† | ๅคงๅคšๆ•ฐๅ‰ๆฒฟๆจกๅž‹ | ๅฐๅญฆ็ง‘ๅญฆ | + +### ็ผ–็จ‹ + +| ๅŸบๅ‡†ๆต‹่ฏ• | ๆต‹่ฏ•ๅ†…ๅฎน | ้กถ็บงๆจกๅž‹ | ๅค‡ๆณจ | +| ------------- | -------------------- | ------------------------------------- | ------------------- | +| HumanEval | Python ไปฃ็ ็”Ÿๆˆ | Claude Sonnet 4, GPT-4.1, DeepSeek V3 | 164 ไธช Python ้—ฎ้ข˜ | +| SWE-bench | ็œŸๅฎž GitHub ้—ฎ้ข˜ไฟฎๅค | Claude Sonnet 4, o3 | ๆฏ” HumanEval ๆ›ด็œŸๅฎž | +| LiveCodeBench | ๆŒ็ปญๆ›ดๆ–ฐ็š„็ผ–็จ‹ๆต‹่ฏ• | ๅ„็ง | ้ฟๅ…ๆ•ฐๆฎๆฑกๆŸ“ | +| MBPP | ๅŸบ็ก€ Python ็ผ–็จ‹ | ๅคงๅคšๆ•ฐๆจกๅž‹ >80% | ๆŽฅ่ฟ‘้ฅฑๅ’Œ | + +### ๅคšๆจกๆ€ + +| ๅŸบๅ‡†ๆต‹่ฏ• | ๆต‹่ฏ•ๅ†…ๅฎน | ้กถ็บงๆจกๅž‹ | ๅค‡ๆณจ | +| --------- | ------------ | ------------------------------- | ------------ | +| MMMU | ๅคšๆจกๆ€็†่งฃ | Gemini 2.5 Pro, Claude Sonnet 4 | ๅ›พๅƒ + ๆ–‡ๆœฌ | +| MathVista | ่ง†่ง‰ๆ•ฐๅญฆๆŽจ็† | Gemini 2.5 Pro | ๅ›พ่กจ + ๆ•ฐๅญฆ | +| AI2D | ็ง‘ๅญฆๅ›พ่กจ | Gemini 2.5 Pro | ็ง‘ๅญฆๅ›พ่กจ็†่งฃ | +| DocVQA | ๆ–‡ๆกฃ็†่งฃ | Gemini 2.5 Pro | ๅ›พๅƒไธญ็š„ๆ–‡ๆœฌ | + +### ๅทฅๅ…ทไฝฟ็”จไธŽๆ™บ่ƒฝไฝ“ + +| ๅŸบๅ‡†ๆต‹่ฏ• | ๆต‹่ฏ•ๅ†…ๅฎน | ้กถ็บงๆจกๅž‹ | ๅค‡ๆณจ | +| -------- | -------------- | 
------------------------ | ----------------------- | +| BFCL v3 | ๅ‡ฝๆ•ฐ่ฐƒ็”จๅ‡†็กฎ็އ | GPT-4.1, Claude Sonnet 4 | Berkeley ๅ‡ฝๆ•ฐ่ฐƒ็”จๆŽ’่กŒๆฆœ | +| ฯ„-bench | ๆ™บ่ƒฝไฝ“ไปปๅŠกๅฎŒๆˆ | ๅ„็ง | ๅŸบไบŽ็ปˆ็ซฏ็š„ๆ™บ่ƒฝไฝ“ไปปๅŠก | +| WebArena | ็ฝ‘้กตไบคไบ’ | ๅ„็ง | ็œŸๅฎž็ฝ‘้กตไปปๅŠก | + +## ๅ…ณ้”ฎๆŽ’่กŒๆฆœ + +| ๆŽ’่กŒๆฆœ | ไพง้‡ | URL | +| -------------------- | ------------ | ----------------------------------------------------------------------- | +| LMSYS Chatbot Arena | ไบบ็ฑปๅๅฅฝๆŽ’ๅ | https://chat.lmsys.org/ | +| Open LLM Leaderboard | ๅผ€ๆบๆจกๅž‹ๆŽ’ๅ | https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard | +| AlpacaEval | ๆŒ‡ไปค้ตๅพช | https://tatsu-lab.github.io/alpaca_eval/ | +| MT-Bench | ๅคš่ฝฎๅฏน่ฏ | Chatbot Arena ็š„ไธ€้ƒจๅˆ† | +| BigBench | ่ถ…่ถŠๅŸบ็ก€ไปปๅŠก | https://github.com/google/BIG-bench | +| MTEB | ๅตŒๅ…ฅๆจกๅž‹ | https://huggingface.co/spaces/mteb/leaderboard | + +## ๅฆ‚ไฝ•ๅฐ†ๅŸบๅ‡†ๆต‹่ฏ•ไธŽๆˆ‘ไปฌ็š„็›ฎๅฝ•็ป“ๅˆไฝฟ็”จ + +ไป…้ ๅŸบๅ‡†ๆต‹่ฏ•ไธ่ถณไปฅ่ฟ›่กŒๆจกๅž‹้€‰ๆ‹ฉใ€‚ๅฐ†ๅฎƒไปฌไธŽๆˆ‘ไปฌ็š„็›ฎๅฝ•ๆ•ฐๆฎ็ป“ๅˆไฝฟ็”จ๏ผš + +1. **ไปŽไฝ ็š„็”จไพ‹ๅผ€ๅง‹** โ†’ ๅ‚่ง[ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) +2. **ๆŒ‰่ƒฝๅŠ›็ญ›้€‰** โ†’ ๅทฅๅ…ท่ฐƒ็”จใ€ๆŽจ็†ใ€่ง†่ง‰็ญ‰ +3. **ๆŸฅ็œ‹ๅŸบๅ‡†ๆต‹่ฏ•ๅˆ†ๆ•ฐ** โ†’ ้’ˆๅฏนไฝ ็š„็‰นๅฎšไปปๅŠก้ข†ๅŸŸ +4. **ๆฏ”่พƒๅฎšไปท** โ†’ ไฝฟ็”จๆˆ‘ไปฌ็š„[ๅฎšไปทๆฏ”่พƒ](pricing-comparison.md) +5. **่€ƒ่™‘ไธŠไธ‹ๆ–‡็ช—ๅฃ** โ†’ ๅ‚่ง[ไธŠไธ‹ๆ–‡็ช—ๅฃ](context-windows.md) +6. 
**็”จไฝ ็š„ๆ•ฐๆฎๆต‹่ฏ•** โ†’ ๅŸบๅ‡†ๆต‹่ฏ•ๆ˜ฏไปฃ็†๏ผ›ๅฎž้™…ๆ€ง่ƒฝๅฏ่ƒฝไธๅŒ + +## ๅŸบๅ‡†ๆต‹่ฏ•็š„ๅฑ€้™ๆ€ง + +- **ๆ•ฐๆฎๆฑกๆŸ“**๏ผšๆจกๅž‹ๅฏ่ƒฝๅœจ่ฎญ็ปƒๆœŸ้—ด่ง่ฟ‡ๅŸบๅ‡†ๆต‹่ฏ•ๆ•ฐๆฎ +- **ไปปๅŠก็‹ญ็ช„**๏ผšๅŸบๅ‡†ๆต‹่ฏ•ๆต‹่ฏ•็‰นๅฎšๆŠ€่ƒฝ๏ผŒ่€Œ้ž้€š็”จๅฎž็”จๆ€ง +- **ๆŽ’่กŒๆฆœๅšๅผˆ**๏ผšไธบๅŸบๅ‡†ๆต‹่ฏ•ไผ˜ๅŒ–ๅฏ่ƒฝๆŸๅฎณๅฎž้™…ๆ€ง่ƒฝ +- **ๆ—ถๆ•ˆๆ€ง**๏ผš้š็€ๆจกๅž‹ๆ”น่ฟ›๏ผŒๅŸบๅ‡†ๆต‹่ฏ•่€ๅŒ–๏ผ›้ฅฑๅ’Œ็š„ๅŸบๅ‡†ๆต‹่ฏ•ๅ˜ๅพ—ๆ— ไฟกๆฏ้‡ +- **ๆ–‡ๅŒ–ๅ่ง**๏ผšๅคงๅคšๆ•ฐๅŸบๅ‡†ๆต‹่ฏ•ไปฅ่‹ฑ่ฏญๅ’Œ่ฅฟๆ–นไธบไธญๅฟƒ +- **ๆˆๆœฌ็›ฒๅŒบ**๏ผšๅŸบๅ‡†ๆต‹่ฏ•ๅฟฝ็•ฅๅฎšไปทใ€ๅปถ่ฟŸๅ’Œๅฏ็”จๆ€ง + +## ๅฎž็”จๅปบ่ฎฎ + +- **็ผ–็จ‹**๏ผšไฝฟ็”จ SWE-bench ่€Œ้ž HumanEval๏ผˆๆ›ด็œŸๅฎž๏ผ‰ +- **ๆ™บ่ƒฝไฝ“**๏ผš็”จไฝ ๅฎž้™…็š„ๅทฅๅ…ทๅฅ—ไปถๆต‹่ฏ•๏ผ›BFCL ๆ˜ฏ่ตท็‚น +- **ๆŽจ็†**๏ผšMATH-500 ๅ’Œ GPQA ๆฏ” MMLU ๆ›ดๆœ‰ๅŒบๅˆ†ๅบฆ +- **่Šๅคฉ**๏ผšChatbot Arena ไธŽไบบ็ฑปๅๅฅฝๆœ€็›ธๅ…ณ +- **ๆˆๆœฌๆ•ๆ„Ÿ**๏ผšๅ…ˆไฝฟ็”จๆˆ‘ไปฌ็š„[ๅ…่ดนๆจกๅž‹](free-models.md)ๆŒ‡ๅ— + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅฎšไปทๆฏ”่พƒ](pricing-comparison.md) โ€” ่ทจๆไพ›ๅ•†ๆˆๆœฌๅˆ†ๆž +- [ๅ…่ดนๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๅŠๅ…ถ่ƒฝๅŠ› +- [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md) โ€” 2,350 ไธชๆ”ฏๆŒๅ‡ฝๆ•ฐ่ฐƒ็”จ็š„ๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆ”ฏๆŒๆ‰ฉๅฑ•ๆ€่€ƒ็š„ๆจกๅž‹ +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 ไธชๆ”ฏๆŒๅ›พๅƒ็†่งฃ็š„ๆจกๅž‹ +- [็ผ–็จ‹ๆจกๅž‹](code-models.md) โ€” ้’ˆๅฏน็ผ–็จ‹ไผ˜ๅŒ–็š„ๆจกๅž‹ +- [ๅผ€ๆ”พๆƒ้‡](open-weights.md) โ€” 527 ไธชๅผ€ๆ”พๆƒ้‡ๆจกๅž‹ +- [ไธŠไธ‹ๆ–‡็ช—ๅฃ](context-windows.md) โ€” ไธŠไธ‹ๆ–‡็ช—ๅฃๆฏ”่พƒ +- [ไบคไบ’ๅผ็›ฎๅฝ•](https://i-need-token.github.io/ai-models/) โ€” ๆต่งˆๅ’Œๆฏ”่พƒๆ‰€ๆœ‰ๆจกๅž‹ diff --git a/docs/zh/cached-pricing.md b/docs/zh/cached-pricing.md new file mode 100644 index 00000000..0b87ce23 --- /dev/null +++ b/docs/zh/cached-pricing.md @@ -0,0 +1,245 @@ +# ็ผ“ๅญ˜ๅฎšไปท + +[English](../cached-pricing.md) + +ๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ AI ๆจกๅž‹๏ผŒๅฑ•็คบๆ 
‡ๅ‡†ๅฎšไปทไธŽ็ผ“ๅญ˜ๅฎšไปทๅฏนๆฏ”ใ€‚็ผ“ๅญ˜่พ“ๅ…ฅๅฏๆฏ”ๆ ‡ๅ‡†่พ“ๅ…ฅ token **ไพฟๅฎœ 50-90%**ใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆ็ผ“ๅญ˜ๅฎšไปทๅพˆ้‡่ฆ + +ๆ็คบ็ผ“ๅญ˜ๅ…่ฎธไฝ ๅญ˜ๅ‚จ้‡ๅค็š„ๆ็คบๅ‰็ผ€๏ผˆ็ณป็ปŸๆ็คบใ€ๅฐ‘ๆ ทๆœฌ็คบไพ‹ใ€ๅทฅๅ…ทๅฎšไน‰๏ผ‰๏ผŒๅนถๅœจๅคšไธช่ฏทๆฑ‚ไธญๅค็”จใ€‚่ฟ™ๆ˜พ่‘—้™ไฝŽไบ†๏ผš + +- **ๆˆๆœฌ**๏ผš่พ“ๅ…ฅ token ่Š‚็œ 50-90% +- **ๅปถ่ฟŸ**๏ผš็ผ“ๅญ˜ๅ†…ๅฎน็š„้ฆ– token ๆ—ถ้—ดๆ›ดๅฟซ +- **ๅžๅ้‡**๏ผšๆ›ด้ซ˜ๆ•ˆๅœฐๅˆฉ็”จ้€Ÿ็އ้™ๅˆถ + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ------------------ | ---- | +| ๆ”ฏๆŒ็ผ“ๅญ˜ๅฎšไปท็š„ๆจกๅž‹ | 1374 | +| ๆไพ›ๅ•† | 39 | + +## ๆไพ›ๅ•† + +`aihubmix`, `aion`, `amazon-bedrock`, `auriko`, `baidu`, `baseten`, `chutes`, `clarifai`, `cloudflare`, `cortecs`, `databricks`, `deepinfra`, `deepseek`, `digitalocean`, `fastrouter`, `friendli`, `google`, `google-vertex`, `groq`, `hpc-ai`, `inception`, `jiekou`, `llmgateway`, `martian`, `minimax`, `moonshotai`, `nanogpt`, `openai`, `openrouter`, `ppio`, `privatemode`, `requesty`, `siliconflow`, `stepfun`, `tencent-tokenhub`, `togetherai`, `upstage`, `venice`, `wafer` + +## ๆจกๅž‹ๅฎšไปท + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ็ผ“ๅญ˜่ฏปๅ– $/M | ็ผ“ๅญ˜ๅ†™ๅ…ฅ $/M | ่Š‚็œ | +| --------------------------------------------- | -------------- | ------ | ------------------- | -------------------- | ------------ | ----- | +| aistudio_gemini-2.0-flash | aihubmix | โ€” | $0.05 | $0.125 | โ€” | -150% | +| aistudio_gpt-4.1-mini | aihubmix | โ€” | $0.2 | $0.05 | โ€” | 75% | +| anthropic-opus-4-6 | aihubmix | โ€” | $2.5 | $0.25 | $3.125 | 90% | +| claude-haiku-4-5 | aihubmix | โ€” | $0.55 | $0.055 | $0.6875 | 90% | +| claude-sonnet-4-0 | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| claude-sonnet-4-5 | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| claude-sonnet-4-5-think | aihubmix | โ€” | $1.65 | $0.165 | $2.0625 | 90% | +| codex-mini-latest | aihubmix | โ€” | $0.75 | $0.1875 | โ€” | 75% | +| 
deepseek-v3.2 | aihubmix | — | $0.151 | $0.0151 | — | 90% | +| deepseek-v3.2-exp | aihubmix | — | $0.137 | $0.0137 | — | 90% | +| deepseek-v3.2-exp-think | aihubmix | — | $0.137 | $0.0137 | — | 90% | +| deepseek-v3.2-think | aihubmix | — | $0.151 | $0.0151 | — | 90% | +| doubao-1.5-lite-32k | aihubmix | — | $0.025 | $0.005 | — | 80% | +| doubao-1.5-pro-32k | aihubmix | — | $0.067 | $0.0134 | — | 80% | +| doubao-lite-32k | aihubmix | — | $0.03 | $0.006 | — | 80% | +| doubao-pro-32k | aihubmix | — | $0.07 | $0.014 | — | 80% | +| doubao-seed-1-6 | aihubmix | — | $0.09 | $0.018 | — | 80% | +| doubao-seed-1-6-250615 | aihubmix | — | $0.09 | $0.018 | — | 80% | +| doubao-seed-1-6-flash | aihubmix | — | $0.022 | $0.0044 | — | 80% | +| doubao-seed-1-6-flash-250615 | aihubmix | — | $0.022 | $0.0044 | — | 80% | +| doubao-seed-1-6-lite | aihubmix | — | $0.041 | $0.0082 | — | 80% | +| doubao-seed-1-6-thinking | aihubmix | — | $0.09 | $0.018 | — | 80% | +| doubao-seed-1-6-thinking-250615 | aihubmix | — | $0.09 | $0.018 | — | 80% | +| doubao-seed-1-6-vision-250815 | aihubmix | — | $0.054795 | $0.010959 | — | 80% | +| doubao-seed-1-8 | aihubmix | — | $0.054795 | $0.010959 | — | 80% | +| gemini-2.0-flash | aihubmix | — | $0.05 | $0.0125 | — | 75% | +| gemini-2.0-flash-001 | aihubmix | — | $0.05 | $0.125 | — | -150% | +| gemini-2.0-flash-search | aihubmix | — | $0.05 | $0.0125 | — | 75% | +| gemini-2.5-flash | aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-flash-lite | aihubmix | — | $0.05 | $0.005 | — | 90% | +| gemini-2.5-flash-lite-nothink | aihubmix | — | $0.05 | $0.005 | — | 90% | +| gemini-2.5-flash-lite-preview-09-2025 | aihubmix | — | $0.05 | $0.005 | — | 90% | +| gemini-2.5-flash-lite-preview-09-2025-nothink | aihubmix | — | $0.05 | $0.005 | — | 90% | +| gemini-2.5-flash-nothink | aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-flash-preview-05-20-nothink
| aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-flash-preview-05-20-search | aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-flash-preview-09-2025 | aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-flash-search | aihubmix | — | $0.15 | $0.015 | — | 90% | +| gemini-2.5-pro | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-exp-03-25 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-03-25 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-03-25-search | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-05-06 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-05-06-search | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-06-05 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-preview-06-05-search | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gemini-2.5-pro-search | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| glm-4.5-airx | aihubmix | — | $0.55 | $0.11 | — | 80% | +| glm-4.5-x | aihubmix | — | $1.1 | $0.22 | — | 80% | +| glm-4.6 | aihubmix | — | $0.136987 | $0.027397 | — | 80% | +| glm-4.6v | aihubmix | — | $0.0685 | $0.0137 | — | 80% | +| glm-4.7 | aihubmix | — | $0.136987 | $0.027397 | — | 80% | +| gpt-4.1 | aihubmix | — | $1 | $0.25 | — | 75% | +| gpt-4.1-mini | aihubmix | — | $0.2 | $0.05 | — | 75% | +| gpt-4.1-nano | aihubmix | — | $0.05 | $0.0125 | — | 75% | +| gpt-4o | aihubmix | — | $1.25 | $0.625 | — | 50% | +| gpt-4o-2024-08-06 | aihubmix | — | $1.25 | $0.625 | — | 50% | +| gpt-4o-2024-08-06-global | aihubmix | — | $1.25 | $0.625 | — | 50% | +| gpt-4o-2024-11-20 | aihubmix | — | $1.25 | $0.625 | — | 50% | +| gpt-4o-mini | aihubmix | — | $0.075 | $0.0375 | — | 50% | +| gpt-4o-mini-2024-07-18 | aihubmix | — | $0.075 | $0.0375 | — | 50% | +| gpt-4o-mini-global | aihubmix | — | $0.075 | $0.0375
| — | 50% | +| gpt-4o-mini-search-preview | aihubmix | — | $0.075 | $0.0375 | — | 50% | +| gpt-4o-search-preview | aihubmix | — | $1.25 | $0.625 | — | 50% | +| gpt-5 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5-chat-latest | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5-codex | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5-mini | aihubmix | — | $0.125 | $0.0125 | — | 90% | +| gpt-5-nano | aihubmix | — | $0.025 | $0.0025 | — | 90% | +| gpt-5.1 | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5.1-chat-latest | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5.1-codex | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5.1-codex-max | aihubmix | — | $0.625 | $0.0625 | — | 90% | +| gpt-5.1-codex-mini | aihubmix | — | $0.125 | $0.0125 | — | 90% | +| gpt-5.2 | aihubmix | — | $0.875 | $0.0875 | — | 90% | +| gpt-5.2-chat-latest | aihubmix | — | $0.875 | $0.0875 | — | 90% | +| gpt-5.2-codex | aihubmix | — | $0.875 | $0.0875 | — | 90% | +| gpt-5.2-high | aihubmix | — | $0.875 | $0.0875 | — | 90% | +| gpt-5.2-low | aihubmix | — | $0.875 | $0.0875 | — | 90% | +| gpt-5.2-pro | aihubmix | — | $10.5 | $1.05 | — | 90% | +| grok-4 | aihubmix | — | $1.65 | $0.4125 | — | 75% | +| grok-4-1-fast-non-reasoning | aihubmix | — | $0.1 | $0.025 | — | 75% | +| grok-4-1-fast-reasoning | aihubmix | — | $0.1 | $0.025 | — | 75% | +| grok-4-fast-non-reasoning | aihubmix | — | $0.1 | $0.025 | — | 75% | +| grok-4-fast-reasoning | aihubmix | — | $0.1 | $0.025 | — | 75% | +| grok-4.20-beta-0309-non-reasoning | aihubmix | — | $1 | $0.1 | — | 90% | +| grok-4.20-beta-0309-reasoning | aihubmix | — | $1 | $0.1 | — | 90% | +| grok-4.20-multi-agent-0309 | aihubmix | — | $1 | $0.1 | — | 90% | +| grok-4.20-multi-agent-beta-0309 | aihubmix | — | $1 | $0.1 | — | 90% | +| grok-code-fast-1 | aihubmix | — | $0.1 | $0.025 | — | 75% | +| kimi-k2-thinking | aihubmix | — |
$0.274 | $0.0685 | — | 75% | +| kimi-k2-turbo-preview | aihubmix | — | $0.6 | $0.15 | — | 75% | +| kimi-k2.5 | aihubmix | — | $0.3 | $0.0525 | — | 82% | +| mimo-v2-flash | aihubmix | — | $0.0959 | $0.01918 | — | 80% | +| mimo-v2-omni | aihubmix | — | $0.22 | $0.044 | — | 80% | +| mimo-v2-pro | aihubmix | — | $0.55 | $0.11 | — | 80% | +| nvidia-nemotron-3-super-120b-a12b | aihubmix | — | $0.055 | $0.01375 | — | 75% | +| o1 | aihubmix | — | $7.5 | $3.75 | — | 50% | +| o1-2024-12-17 | aihubmix | — | $7.5 | $3.75 | — | 50% | +| o1-global | aihubmix | — | $7.5 | $3.75 | — | 50% | +| o1-mini | aihubmix | — | $1.5 | $0.75 | — | 50% | +| o1-mini-2024-09-12 | aihubmix | — | $1.5 | $0.75 | — | 50% | +| o1-preview | aihubmix | — | $7.5 | $3.75 | — | 50% | +| o1-preview-2024-09-12 | aihubmix | — | $7.5 | $3.75 | — | 50% | +| o3 | aihubmix | — | $1 | $0.25 | — | 75% | +| o3-deep-research | aihubmix | — | $5 | $1.25 | — | 75% | +| o3-global | aihubmix | — | $1 | $0.25 | — | 75% | +| o3-mini | aihubmix | — | $0.55 | $0.275 | — | 50% | +| o3-mini-global | aihubmix | — | $0.55 | $0.275 | — | 50% | +| o4-mini | aihubmix | — | $0.55 | $0.1375 | — | 75% | +| qwen-plus | aihubmix | — | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-2025-04-28 | aihubmix | — | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-2025-07-28 | aihubmix | — | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-plus-latest | aihubmix | — | $0.0563 | $0.01126 | $0.070375 | 80% | +| qwen-turbo | aihubmix | — | $0.023 | $0.0046 | — | 80% | +| qwen-turbo-latest | aihubmix | — | $0.023 | $0.0046 | — | 80% | +| qwen3-coder-plus | aihubmix | — | $0.27 | $0.054 | — | 80% | +| qwen3-max | aihubmix | — | $0.2254 | $0.04508 | $0.28175 | 80% | +| qwen3-max-2026-01-23 | aihubmix | — | $0.2254 | $0.04508 | $0.28175 | 80% | +| qwen3-max-preview | aihubmix | — | $0.423 | $0.0846 | — | 80% | +| qwen3-vl-flash | aihubmix
| โ€” | $0.0103 | $0.00206 | โ€” | 80% | +| qwen3-vl-plus | aihubmix | โ€” | $0.0685 | $0.0137 | โ€” | 80% | +| zai-glm-5-turbo | aihubmix | โ€” | $0.6 | $0.12 | โ€” | 80% | +| aion-2.0 | aion | โ€” | $0.7999999999999999 | $0.19999999999999998 | โ€” | 75% | +| aion-2.5 | aion | โ€” | $1 | $0.35 | โ€” | 65% | +| amazon-nova-2-lite | amazon-bedrock | โ€” | $0.33 | $0.0825 | โ€” | 75% | +| amazon-nova-lite | amazon-bedrock | โ€” | $0.06 | $0.015 | โ€” | 75% | +| amazon-nova-micro | amazon-bedrock | โ€” | $0.035 | $0.00875 | โ€” | 75% | +| amazon-nova-premier | amazon-bedrock | โ€” | $2.5 | $0.625 | โ€” | 75% | +| amazon-nova-pro | amazon-bedrock | โ€” | $0.8 | $0.2 | โ€” | 75% | +| claude-haiku-4-5-20251001 | auriko | โ€” | $1 | $0.1 | $1.25 | 90% | +| claude-opus-4-1-20250805 | auriko | โ€” | $15 | $1.5 | $18.75 | 90% | +| claude-opus-4-20250514 | auriko | โ€” | $15 | $1.5 | $18.75 | 90% | +| claude-opus-4-5-20251101 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-opus-4-6 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-opus-4-7 | auriko | โ€” | $5 | $0.5 | $6.25 | 90% | +| claude-sonnet-4-20250514 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| claude-sonnet-4-5-20250929 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| claude-sonnet-4-6 | auriko | โ€” | $3 | $0.3 | $3.75 | 90% | +| deepseek-r1-0528 | auriko | โ€” | $0.5 | $0.35 | โ€” | 30% | +| deepseek-v3-0324 | auriko | โ€” | $0.2 | $0.135 | โ€” | 32% | +| deepseek-v3.1 | auriko | โ€” | $0.21 | $0.13 | โ€” | 38% | +| deepseek-v3.1-terminus | auriko | โ€” | $0.27 | $0.13 | โ€” | 52% | +| deepseek-v3.2 | auriko | โ€” | $0.26 | $0.13 | โ€” | 50% | +| deepseek-v4-flash | auriko | โ€” | $0.14 | $0.0028 | โ€” | 98% | +| deepseek-v4-pro | auriko | โ€” | $0.435 | $0.003625 | โ€” | 99% | +| gemini-2.5-flash | auriko | โ€” | $0.3 | $0.03 | โ€” | 90% | +| gemini-2.5-flash-lite | auriko | โ€” | $0.1 | $0.01 | โ€” | 90% | +| gemini-2.5-pro | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gemini-3-flash-preview | auriko | 
โ€” | $0.5 | $0.05 | โ€” | 90% | +| gemini-3.1-flash-lite | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gemini-3.1-flash-lite-preview | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gemini-3.1-pro-preview | auriko | โ€” | $2 | $0.2 | โ€” | 90% | +| gemini-3.1-pro-preview-customtools | auriko | โ€” | $2 | $0.2 | โ€” | 90% | +| gemini-flash-latest | auriko | โ€” | $0.5 | $0.05 | โ€” | 90% | +| gemini-flash-lite-latest | auriko | โ€” | $0.1 | $0.01 | โ€” | 90% | +| gemini-pro-latest | auriko | โ€” | $2 | $0.2 | โ€” | 90% | +| glm-4.5 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.5-air | auriko | โ€” | $0.2 | $0.03 | โ€” | 85% | +| glm-4.5-airx | auriko | โ€” | $1.1 | $0.22 | โ€” | 80% | +| glm-4.5-x | auriko | โ€” | $2.2 | $0.45 | โ€” | 80% | +| glm-4.5v | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.6 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.6v | auriko | โ€” | $0.3 | $0.05 | โ€” | 83% | +| glm-4.6v-flashx | auriko | โ€” | $0.04 | $0.004 | โ€” | 90% | +| glm-4.7 | auriko | โ€” | $0.6 | $0.11 | โ€” | 82% | +| glm-4.7-flashx | auriko | โ€” | $0.07 | $0.01 | โ€” | 86% | +| glm-5 | auriko | โ€” | $1 | $0.2 | โ€” | 80% | +| glm-5-turbo | auriko | โ€” | $1.2 | $0.24 | โ€” | 80% | +| glm-5.1 | auriko | โ€” | $1.4 | $0.26 | โ€” | 81% | +| glm-5v-turbo | auriko | โ€” | $1.2 | $0.24 | โ€” | 80% | +| gpt-4.1-2025-04-14 | auriko | โ€” | $2 | $0.5 | โ€” | 75% | +| gpt-4.1-mini-2025-04-14 | auriko | โ€” | $0.4 | $0.1 | โ€” | 75% | +| gpt-4.1-nano-2025-04-14 | auriko | โ€” | $0.1 | $0.025 | โ€” | 75% | +| gpt-4o-2024-08-06 | auriko | โ€” | $2.5 | $1.25 | โ€” | 50% | +| gpt-4o-2024-11-20 | auriko | โ€” | $2.5 | $1.25 | โ€” | 50% | +| gpt-4o-mini-2024-07-18 | auriko | โ€” | $0.15 | $0.075 | โ€” | 50% | +| gpt-5-2025-08-07 | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5-chat-latest | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5-mini-2025-08-07 | auriko | โ€” | $0.25 | $0.025 | โ€” | 90% | +| gpt-5-nano-2025-08-07 | auriko | โ€” | $0.05 | 
$0.005 | โ€” | 90% | +| gpt-5.1-2025-11-13 | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5.1-chat-latest | auriko | โ€” | $1.25 | $0.125 | โ€” | 90% | +| gpt-5.2-2025-12-11 | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| gpt-5.2-chat-latest | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| gpt-5.3-chat-latest | auriko | โ€” | $1.75 | $0.175 | โ€” | 90% | +| gpt-5.4-2026-03-05 | auriko | โ€” | $2.5 | $0.25 | โ€” | 90% | +| gpt-5.4-mini-2026-03-17 | auriko | โ€” | $0.75 | $0.075 | โ€” | 90% | +| gpt-5.4-nano-2026-03-17 | auriko | โ€” | $0.2 | $0.02 | โ€” | 90% | +| gpt-5.5-2026-04-23 | auriko | โ€” | $5 | $0.5 | โ€” | 90% | +| gpt-oss-120b | auriko | โ€” | $0.15 | $0.01 | โ€” | 93% | +| gpt-oss-20b | auriko | โ€” | $0.07 | $0.04 | โ€” | 43% | +| grok-4.20-0309-non-reasoning | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| grok-4.20-0309-reasoning | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| grok-4.3 | auriko | โ€” | $1.25 | $0.2 | โ€” | 84% | +| hy3-preview | auriko | โ€” | $0.066 | $0.029 | โ€” | 56% | +| kimi-k2-0711-preview | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-0905-preview | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-thinking | auriko | โ€” | $0.6 | $0.15 | โ€” | 75% | +| kimi-k2-thinking-turbo | auriko | โ€” | $1.15 | $0.15 | โ€” | 87% | + +> ๐Ÿ“„ ๆ˜พ็คบๅ‰ 200 ไธช๏ผŒๅ…ฑ 1374 ไธชๆจกๅž‹ใ€‚ไฝฟ็”จ[ไบคไบ’ๅผ็›ฎๅฝ•](https://i-need-token.github.io/ai-models/)ๆต่งˆๅ…จ้ƒจใ€‚ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๆˆๆœฌไผ˜ๅŒ–ๆŠ€ๅทง +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ๅ„ๆไพ›ๅ•†ๅฎšไปทๅนถๆŽ’ๅฏนๆฏ” +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ +- [ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ”](context-windows.md) โ€” ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ +- [ๅผ€ๆบๆƒ้‡ๆจกๅž‹](open-weights.md) โ€” 527 ไธชๅฏ่‡ช่กŒ่ฟ่กŒ็š„ๆจกๅž‹ diff 
--git a/docs/zh/chat-models.md b/docs/zh/chat-models.md new file mode 100644 index 00000000..584b0ec6 --- /dev/null +++ b/docs/zh/chat-models.md @@ -0,0 +1,99 @@ +# ่Šๅคฉๆจกๅž‹ + +[English](../chat-models.md) + +ๆ”ฏๆŒ**ๅทฅๅ…ท่ฐƒ็”จ**็š„ AI ๆจกๅž‹ โ€” ๆž„ๅปบ่Šๅคฉๅบ”็”จใ€AI ๅŠฉๆ‰‹ๅ’Œๅฏน่ฏๆ™บ่ƒฝไฝ“็š„ๆ ธๅฟƒ่ƒฝๅŠ›ใ€‚่ฟ™ไบ›ๆจกๅž‹ๅฏไปฅ็†่งฃ่‡ช็„ถ่ฏญ่จ€ใ€็”Ÿๆˆๅ›žๅคๅนถ่ฐƒ็”จๅค–้ƒจๅทฅๅ…ทใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆ่Šๅคฉๆจกๅž‹ๅพˆ้‡่ฆ + +่Šๅคฉๆจกๅž‹ๆ˜ฏ็Žฐไปฃ AI ๅบ”็”จ็š„ๅŸบ็Ÿณ๏ผš + +- **ๅฏน่ฏๅผ AI** โ€” ๅธฆไธŠไธ‹ๆ–‡็š„่‡ช็„ถ่ฏญ่จ€ๅฏน่ฏ +- **AI ๅŠฉๆ‰‹** โ€” ้ขๅ‘ไปปๅŠก็š„่ŠๅคฉไธŽๅทฅๅ…ทไฝฟ็”จ +- **ๅฎขๆˆทๆ”ฏๆŒ** โ€” ๅธฆ็Ÿฅ่ฏ†ๅบ“่ฎฟ้—ฎ็š„่‡ชๅŠจๅŒ–ๆ”ฏๆŒ +- **ๅ†…ๅฎน็”Ÿๆˆ** โ€” ๅ†™ไฝœใ€ๆ‘˜่ฆใ€็ฟป่ฏ‘ +- **ๆ•ฐๆฎๅˆ†ๆž** โ€” ่‡ช็„ถ่ฏญ่จ€ๆŸฅ่ฏข็ป“ๆž„ๅŒ–ๆ•ฐๆฎ + +ๅทฅๅ…ท่ฐƒ็”จๆ˜ฏๅ…ณ้”ฎๅทฎๅผ‚ๅŒ–่ƒฝๅŠ› โ€” ๅฎƒๅ…่ฎธๆจกๅž‹่ถ…่ถŠๆ–‡ๆœฌ็”Ÿๆˆ๏ผŒๅœจ็Žฐๅฎžไธ–็•Œไธญ้‡‡ๅ–่กŒๅŠจใ€‚ + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ------------------------ | ---- | +| ่Šๅคฉๆจกๅž‹๏ผˆๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ๏ผ‰ | 2350 | +| ๆไพ›ๅ•† | 71 | +| ๅ…่ดน่Šๅคฉๆจกๅž‹ | 54 | +| ๅผ€ๆบๆƒ้‡่Šๅคฉๆจกๅž‹ | 278 | +| ๅธฆๆŽจ็†่ƒฝๅŠ› | 1080 | +| ๅธฆ็ป“ๆž„ๅŒ–่พ“ๅ‡บ | 758 | + +## ๆไพ›ๅ•† + +`01ai`, `302ai`, `aihubmix`, `aimlapi`, `alibaba`, `amazon`, `amazon-bedrock`, `anthropic`, `arcee`, `auriko`, `baidu`, `baseten`, `berget`, `bytedance`, `cerebras`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `cortecs`, `databricks`, `deepseek`, `digitalocean`, `dinference`, `evroc` ็ญ‰ 46 ไธช + +## ๅ…่ดน่Šๅคฉๆจกๅž‹ + +ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๅ…่ดนๆจกๅž‹ โ€” ้›ถๆˆๆœฌ่Šๅคฉๅบ”็”จใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ---------------------------------------------------- | ---------- | ------ | -------- | -------- | ----- | +| openrouter--owl-alpha | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| deepseek--deepseek-v4-flash--free | openrouter | 1M | Free | Free | ๐Ÿง  | +| 
qwen--qwen3-coder--free | openrouter | 1M | Free | Free | | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| arcee-ai--trinity-large-thinking--free | openrouter | 262K | Free | Free | ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-31b-it | auriko | 262K | Free | Free | ๐Ÿง  ๐Ÿ“‹ | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | ๐Ÿง  | + +## ๆœ€ไพฟๅฎœ่Šๅคฉๆจกๅž‹ + +็”Ÿไบง็Žฏๅขƒ่Šๅคฉ็š„ๆœ€ไฝณๆ€งไปทๆฏ”ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ------------------------------------------- | ------------ | ------ | -------- | -------- | ---- | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ“‹ | +| bdc-coder | inferencenet | 131K | $0.01 | $0.01 | ๐Ÿ”“ | +| inclusionai--ling-2.6-flash | openrouter | 262K | $0.01 | $0.03 | ๐Ÿ“‹ | +| ling-2.6-flash | inclusionai | 262K | $0.01 | $0.03 | | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | ๐Ÿง  | +| qwen3-vl-flash-2026-01-22 | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ“‹ | +| qwen3-vl-flash | aihubmix | 0 | $0.0103 | $0.103 | ๐Ÿ“‹ | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | 131K | $0.015 | $0.02 | | +| granite-4.0-h-micro | cloudflare | 131K | $0.017 | $0.112 | ๐Ÿ”“ | +| llama-3.1-8b-instruct | cortecs | 0 | $0.018 | $0.054 | ๐Ÿง  | + +## ๅคงไธŠไธ‹ๆ–‡่Šๅคฉๆจกๅž‹ + +ไธŠไธ‹ๆ–‡็ช—ๅฃๆœ€ๅคง็š„่Šๅคฉๆจกๅž‹ โ€” ้€‚็”จไบŽ้•ฟๅฏน่ฏๅ’Œๆ–‡ๆกฃๅˆ†ๆžใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ---------------------------- | ---------- | ------ | -------- | -------- | ---- | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | ๐Ÿ“‹ | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | ๐Ÿ“‹ | 
+| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 ไธชๅ…ทๅค‡ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็†่ƒฝๅŠ›็š„ๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆ”ฏๆŒๆŽจ็†็š„ๆจกๅž‹ +- [ไปฃ็ ๆจกๅž‹](code-models.md) โ€” 189 ไธชไปฃ็ ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑป +- [็ป“ๆž„ๅŒ–่พ“ๅ‡บ](structured-output.md) โ€” 829 ไธช JSON ๆจกๅผๆจกๅž‹ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/code-examples.md b/docs/zh/code-examples.md new file mode 100644 index 00000000..759b45c9 --- /dev/null +++ b/docs/zh/code-examples.md @@ -0,0 +1,367 @@ +# ไปฃ็ ็คบไพ‹ + +[English](../code-examples.md) | **ไธญๆ–‡** + +ๅคš็ง่ฏญ่จ€ไฝฟ็”จ AI Models Catalog ๆ•ฐๆฎ็š„ๅฎž็”จไปฃ็ ็คบไพ‹ใ€‚ + +## ไธ‹่ฝฝๆ•ฐๆฎ + +```bash +# JSON โ€” ๅฎŒๆ•ดๅ…ƒๆ•ฐๆฎ (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” ้€‚็”จไบŽ Excel/Google Sheets ็š„ๅนณ้ข่กจๆ ผ (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +ๆˆ–ไฝฟ็”จ [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models)๏ผˆๆ— ้œ€ไธ‹่ฝฝ๏ผŒๆ”ฏๆŒ CORS๏ผ‰๏ผš + +```bash +# ๅง‹็ปˆๆœ€ๆ–ฐ๏ผŒๅฏๅœจๆต่งˆๅ™จไธญไฝฟ็”จ +curl -s 
https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +``` + +## TypeScript / JavaScript + +### ๅฎ‰่ฃ… npm ๅŒ… + +```bash +npm install ai-models +``` + +### ๅŸบๆœฌ็”จๆณ• + +```typescript +import catalog from "ai-models"; +import type { Model } from "ai-models"; + +// ๆจกๅž‹ๆ€ปๆ•ฐ +console.log(`Total models: ${catalog.models.length}`); + +// ๆŒ‰ๆไพ›ๅ•†ๆŸฅๆ‰พๆจกๅž‹ +const openaiModels = catalog.models.filter((m) => m.provider === "openai"); +console.log(`OpenAI models: ${openaiModels.length}`); +``` + +### ๆŸฅๆ‰พๆœ€ไพฟๅฎœ็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +```typescript +import catalog from "ai-models"; + +const affordable = catalog.models + .filter((m) => m.tool_call && m.pricing?.input && m.pricing.input < 1) + .sort((a, b) => a.pricing.input - b.pricing.input) + .slice(0, 10); + +for (const m of affordable) { + console.log(`${m.name}: $${m.pricing.input}/1M input, $${m.pricing.output}/1M output`); +} +``` + +### ๆŸฅๆ‰พๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ็š„ๆจกๅž‹ + +```typescript +import catalog from "ai-models"; + +const largest = catalog.models + .filter((m) => m.limit?.context) + .sort((a, b) => b.limit.context - a.limit.context) + .slice(0, 10); + +for (const m of largest) { + console.log(`${m.name}: ${(m.limit.context / 1_000_000).toFixed(1)}M context`); +} +``` + +### ๆŸฅๆ‰พๆ”ฏๆŒ่ง†่ง‰็š„ๅ…่ดนๆจกๅž‹ + +```typescript +import catalog from "ai-models"; + +const freeVision = catalog.models.filter( + (m) => m.pricing?.unit === "free" && m.modalities?.input?.includes("image"), +); + +console.log(`Free vision models: ${freeVision.length}`); +for (const m of freeVision) { + console.log(`- ${m.name} (${m.provider})`); +} +``` + +## Python + +### ไฝฟ็”จ JSON ๆ•ฐๆฎ + +```python +import json +import urllib.request + +# ไธ‹่ฝฝๆœ€ๆ–ฐๆ•ฐๆฎ +url = "https://github.com/i-need-token/ai-models/releases/latest/download/models.json" +urllib.request.urlretrieve(url, "models.json") + +with open("models.json") as f: + catalog = json.load(f) + 
+print(f"Total models: {len(catalog['models'])}") +``` + +### ๆŸฅๆ‰พ่พ“ๅ‡บไปทๆ ผไฝŽไบŽ $5/1M ็š„ๆŽจ็†ๆจกๅž‹ + +```python +reasoning_cheap = [ + m for m in catalog["models"] + if m.get("reasoning") + and m.get("pricing", {}).get("output") + and m["pricing"]["output"] < 5 +] + +for m in sorted(reasoning_cheap, key=lambda x: x["pricing"]["output"]): + print(f"{m['name']}: ${m['pricing']['output']}/1M output") +``` + +### ไฝฟ็”จ pandas ๅค„็† CSV + +```python +import pandas as pd + +df = pd.read_csv("https://github.com/i-need-token/ai-models/releases/latest/download/models.csv") + +# ็ญ›้€‰ๅ’ŒๆŽ’ๅบ +tool_calling = df[df["tool_call"] == True].sort_values("pricing_input") +print(tool_calling[["name", "provider", "pricing_input", "pricing_output"]].head(10)) +``` + +### ๆŸฅๆ‰พๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๅผ€ๆบๆจกๅž‹ + +```python +open_tool = [ + m for m in catalog["models"] + if m.get("open_weights") and m.get("tool_call") +] + +print(f"Open-weight models with tool calling: {len(open_tool)}") +for m in open_tool[:10]: + print(f" - {m['name']} ({m['provider']})") +``` + +## Go + +```go +package main + +import ( + "encoding/json" + "fmt" + "net/http" +) + +type Catalog struct { + Models []Model `json:"models"` +} + +type Model struct { + ID string `json:"id"` + Name string `json:"name"` + Provider string `json:"provider"` + ToolCall bool `json:"tool_call"` + Pricing Pricing `json:"pricing"` +} + +type Pricing struct { + Input float64 `json:"input"` + Output float64 `json:"output"` +} + +func main() { + resp, err := http.Get("https://github.com/i-need-token/ai-models/releases/latest/download/models.json") + if err != nil { + panic(err) + } + defer resp.Body.Close() + + var catalog Catalog + json.NewDecoder(resp.Body).Decode(&catalog) + + fmt.Printf("Total models: %d\n", len(catalog.Models)) + + // ๆŸฅๆ‰พ่พ“ๅ…ฅไปทๆ ผไฝŽไบŽ $1/1M ็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + for _, m := range catalog.Models { + if m.ToolCall && m.Pricing.Input > 0 && m.Pricing.Input < 1 { + fmt.Printf("%s: $%.2f/1M 
input\n", m.Name, m.Pricing.Input) + } + } +} +``` + +## Rust + +```rust +use serde::Deserialize; + +#[derive(Deserialize)] +struct Catalog { + models: Vec<Model>, +} + +#[derive(Deserialize)] +struct Model { + id: String, + name: String, + provider: String, + #[serde(default)] + tool_call: bool, + pricing: Option<Pricing>, +} + +#[derive(Deserialize)] +struct Pricing { + input: f64, + output: f64, +} + +fn main() -> Result<(), Box<dyn std::error::Error>> { + let data = reqwest::blocking::get( + "https://github.com/i-need-token/ai-models/releases/latest/download/models.json" + )?.text()?; + + let catalog: Catalog = serde_json::from_str(&data)?; + println!("Total models: {}", catalog.models.len()); + + // 查找支持工具调用的模型 + let tool_calling: Vec<_> = catalog.models.iter() + .filter(|m| m.tool_call) + .collect(); + + println!("Tool-calling models: {}", tool_calling.len()); + Ok(()) +} +``` + +## Shell / jq + +```bash +# 下载数据 +curl -sLO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# 统计模型总数 +jq '.models | length' models.json + +# 查找所有 OpenAI 模型 +jq '.models[] | select(.provider == "openai") | .name' models.json + +# 查找最便宜的工具调用模型 +jq '[.models[] | select(.tool_call == true and .pricing.input != null)] | sort_by(.pricing.input) | .[:5] | .[] | {name, provider, input: .pricing.input}' models.json + +# 查找免费模型 +jq '[.models[] | select(.pricing.unit == "free")] | length' models.json + +# 列出所有提供商 +jq '.providers | keys' models.json +``` + +## Excel / Google Sheets + +1. 下载 CSV：`https://github.com/i-need-token/ai-models/releases/latest/download/models.csv` +2. 在 Excel 中打开或导入 Google Sheets +3. 
ไฝฟ็”จ็ญ›้€‰ๅ™จๆŒ‰ๆไพ›ๅ•†ใ€่ƒฝๅŠ›ๆˆ–ไปทๆ ผ่Œƒๅ›ดๆŸฅๆ‰พๆจกๅž‹ + +## ๅธธ่งๆŸฅ่ฏข + +### ๆŸฅๆ‰พๆœ€้€‚ๅˆ็ผ–็จ‹็š„ๆจกๅž‹ + +```typescript +import catalog from "ai-models"; + +const codingModels = catalog.models.filter( + (m) => + m.tool_call && + m.structured_output && + m.limit?.context >= 128000 && + m.pricing?.input && + m.pricing.input <= 5, +); + +// ๆŒ‰ไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผˆ้™ๅบ๏ผ‰ๆŽ’ๅบ๏ผŒ็„ถๅŽๆŒ‰ไปทๆ ผ๏ผˆๅ‡ๅบ๏ผ‰ๆŽ’ๅบ +codingModels.sort((a, b) => { + const ctxDiff = (b.limit?.context ?? 0) - (a.limit?.context ?? 0); + if (ctxDiff !== 0) return ctxDiff; + return (a.pricing?.input ?? 0) - (b.pricing?.input ?? 0); +}); +``` + +### ๆฏ”่พƒๅŒไธ€ๆจกๅž‹็ณปๅˆ—ๅœจไธๅŒๆไพ›ๅ•†็š„ไปทๆ ผ + +```typescript +import catalog from "ai-models"; + +// ๆŒ‰็ณปๅˆ—ๅˆ†็ป„ +const families = new Map(); +for (const m of catalog.models) { + if (!m.family) continue; + const list = families.get(m.family) ?? []; + list.push(m); + families.set(m.family, list); +} + +// ๆŸฅๆ‰พๅœจๅคšไธชๆไพ›ๅ•†ไธŠๅฏ็”จ็š„็ณปๅˆ— +for (const [family, models] of families) { + const providers = new Set(models.map((m) => m.provider)); + if (providers.size > 1) { + console.log(`\n${family}:`); + for (const m of models) { + console.log(` ${m.provider}: $${m.pricing?.input}/1M in, $${m.pricing?.output}/1M out`); + } + } +} +``` + +### ไธบไฝ ็š„ๅบ”็”จๆž„ๅปบๆจกๅž‹้€‰ๆ‹ฉๅ™จ + +```typescript +import catalog from "ai-models"; +import type { Model } from "ai-models"; + +interface ModelRequirements { + toolCall?: boolean; + vision?: boolean; + reasoning?: boolean; + structuredOutput?: boolean; + minContext?: number; + maxInputPrice?: number; + maxOutputPrice?: number; + openWeights?: boolean; + provider?: string; +} + +function findModels(req: ModelRequirements): Model[] { + return catalog.models.filter((m) => { + if (req.toolCall && !m.tool_call) return false; + if (req.vision && !m.modalities?.input?.includes("image")) return false; + if (req.reasoning && !m.reasoning) return false; + if (req.structuredOutput && 
!m.structured_output) return false; + if (req.minContext && (m.limit?.context ?? 0) < req.minContext) return false; + if (req.maxInputPrice && (m.pricing?.input ?? Infinity) > req.maxInputPrice) return false; + if (req.maxOutputPrice && (m.pricing?.output ?? Infinity) > req.maxOutputPrice) return false; + if (req.openWeights && !m.open_weights) return false; + if (req.provider && m.provider !== req.provider) return false; + return true; + }); +} + +// ็คบไพ‹๏ผšๆŸฅๆ‰พๆ”ฏๆŒ่ง†่ง‰ๅ’Œๅทฅๅ…ท่ฐƒ็”จ็š„ไพฟๅฎœๆจกๅž‹ +const results = findModels({ + vision: true, + toolCall: true, + maxInputPrice: 1, + maxOutputPrice: 5, +}); +``` + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [API ไธŽ็ผ–็จ‹่ฎฟ้—ฎ](api.md) โ€” npmใ€CDNใ€CSVใ€GitHub Action +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” 30 ็ง’ๅ†…ๆ‰พๅˆฐ้€‚ๅˆ็š„ๆจกๅž‹ +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผๅ‚่€ƒ +- [ๅธธ่ง้—ฎ้ข˜](faq.md) โ€” ๅธธ่ง้—ฎ้ข˜ +- [ๆœฏ่ฏญ่กจ](glossary.md) โ€” ๅ…ณ้”ฎๆœฏ่ฏญๅ’Œๅฎšไน‰ diff --git a/docs/zh/code-models.md b/docs/zh/code-models.md new file mode 100644 index 00000000..70c9b62c --- /dev/null +++ b/docs/zh/code-models.md @@ -0,0 +1,61 @@ +[English](../code-models.md) | **ไธญๆ–‡** + +# ไปฃ็  AI ๆจกๅž‹ โ€” 189 ไธช็”จไบŽไปฃ็ ็”Ÿๆˆๅ’Œ็†่งฃ็š„ๆจกๅž‹ + +ไธ“ไธบ **ไปฃ็ ็”Ÿๆˆใ€ไปฃ็ ๅฎกๆŸฅใ€่ฐƒ่ฏ•ๅ’Œ่ฝฏไปถๅทฅ็จ‹** ไปปๅŠกไผ˜ๅŒ–็š„ๆจกๅž‹ใ€‚ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) ไธ€ๆ‰‹ APIใ€‚ + +## ็ปŸ่ฎก + +| Metric | Count | +| ------------------- | ----- | +| Code-focused models | 0 | +| Providers | 0 | +| With tool calling | 0 | +| With reasoning | 0 | +| With vision | 0 | +| Free | 0 | +| Open weights | 0 | + +## ๆœ€ไพฟๅฎœ็š„ไปฃ็ ๆจกๅž‹๏ผˆ็›ด่ฟžๆไพ›ๅ•†๏ผ‰ + +| Model | Provider | Context | Input $/1M | Output $/1M | Reasoning | +| ----- | -------- | ------- | ---------- | ----------- | --------- | + +## ๅธฆๆŽจ็†็š„ไปฃ็ ๆจกๅž‹๏ผˆ้€‚ๅˆๅคๆ‚ไปปๅŠก๏ผ‰ + +| Model | Provider | Context | Input $/1M | Output $/1M | Tool Call | +| ----- | -------- | ------- | 
---------- | ----------- | --------- | + +## ๅ…่ดนไปฃ็ ๆจกๅž‹ + +| Model | Provider | Context | Reasoning | Tool Call | +| ----- | -------- | ------- | --------- | --------- | + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡ไปฃ็ ๆจกๅž‹ + +| Model | Provider | Context | Input $/1M | Output $/1M | +| ----- | -------- | ------- | ---------- | ----------- | + +## ้€‰ๆ‹ฉไปฃ็ ๆจกๅž‹ + +| Use Case | Recommended | Why | +| ------------ | -------------------------- | --------------------- | +| Autocomplete | Qwen2.5-Coder, DeepSeek V3 | Fast, cheap | +| Code review | Claude Sonnet 4, GPT-4.1 | Reasoning + tool call | +| Bug fixing | DeepSeek R1, Claude Opus 4 | Deep reasoning | +| Refactoring | Gemini 2.5 Pro | Large context | +| Code agents | Claude Sonnet 4, GPT-4.1 | Tool call + reasoning | +| Self-hosted | Qwen2.5-Coder, Llama 4 | Open weights | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [Reasoning Models](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [Tool Calling Models](tool-calling.md) โ€” 2,350 models with function calling +- [Agentic Models](agentic-models.md) โ€” 1,080 models for AI agents +- [OpenAI Alternatives](openai-alternatives.md) โ€” GPT-4 alternatives +- [Free AI Models](free-models.md) โ€” 81 models at zero cost +- [Open-Weight Models](open-weights.md) โ€” 527 models with open weights + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/context-windows.md b/docs/zh/context-windows.md new file mode 100644 index 00000000..7b0877a2 --- /dev/null +++ b/docs/zh/context-windows.md @@ -0,0 +1,77 @@ +[English](../context-windows.md) | **ไธญๆ–‡** + +# ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ” + +ๅ“ชไบ›ๆจกๅž‹ๆ‹ฅๆœ‰ๆœ€ๅคง็š„ไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผŸๆœฌ้กตๆŒ‰ไธŠไธ‹ๆ–‡็ช—ๅฃๅคงๅฐๅ’Œๅฎšไปทๅˆ—ๅ‡บๆจกๅž‹ใ€‚ + +> ๅฎŒๆ•ดๅˆ—่กจ่ฏทไธ‹่ฝฝ [models.json](https://github.com/i-need-token/ai-models/releases/latest) ๆˆ–ๆต่งˆ `providers/`ใ€‚ + +## ไธŠไธ‹ๆ–‡็ช—ๅฃๅˆ†ๅธƒ + +| 
ๅฑ‚็บง | ๆจกๅž‹ๆ•ฐ | ๆ่ฟฐ | +| ---------------- | -----: | -------------------------------- | +| 1M+ tokens | 391 | ๅฏๅค„็†ๆ•ดๆœฌไนฆใ€ๆ•ดไธชไปฃ็ ๅบ“ๆˆ–้•ฟๅฏน่ฏ | +| 256Kโ€“1M tokens | 459 | ๅคงๅž‹ๆ–‡ๆกฃใ€ๅคš่ฝฎๅฏน่ฏ | +| 128Kโ€“256K tokens | 1,310 | ๆ ‡ๅ‡†้•ฟไธŠไธ‹ๆ–‡๏ผŒๅคงๅคšๆ•ฐ็Žฐไปฃๆจกๅž‹ | +| 32Kโ€“128K tokens | 194 | ไธญ็ญ‰้•ฟๅบฆๆ–‡ๆกฃ | +| 8Kโ€“32K tokens | 97 | ็Ÿญๆ–‡ๆกฃใ€ๅ•่ฝฎๆŸฅ่ฏข | +| <8K tokens | 19 | ๆ—งๆจกๅž‹๏ผŒๆž็Ÿญ่พ“ๅ…ฅ | + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผˆ1M+ tokens๏ผ‰ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| ----------------------------- | ---------- | ------ | --------: | --------: | -------- | ---- | +| Llama 4 Scout | Meta | 10M | โ€” | โ€” | โœ… | โŒ | +| Llama 4 Scout | OpenRouter | 10M | $0.08 | $0.30 | โœ… | โŒ | +| Gemini 3 Pro Preview | Google | 2M | $2.00 | $12.00 | โœ… | โŒ | +| Gemini 3.1 Flash Lite Preview | Google | 2M | $0.25 | $1.50 | โœ… | โŒ | +| Gemini 3.1 Pro Preview | Google | 2M | $2.00 | $12.00 | โœ… | โŒ | +| Grok 4 Fast Reasoning | xAI | 2M | $0.20 | $0.50 | โœ… | โœ… | +| GPT-4.1 | OpenAI | ~1M | $2.00 | $8.00 | โœ… | โŒ | +| Gemini 2.5 Pro | Google | 1M | $1.25 | $10.00 | โœ… | โœ… | +| Gemini 2.5 Flash | Google | 1M | $0.15 | $0.60 | โœ… | โœ… | +| Llama 4 Maverick | Meta | 1M | โ€” | โ€” | โœ… | โŒ | +| Qwen3-235B-A22B | ้˜ฟ้‡Œไบ‘ | 128K\* | ยฅ1.00 | ยฅ4.00 | โœ… | โœ… | +| DeepSeek-V3 | DeepSeek | 128K | $0.27 | $1.10 | โœ… | โŒ | + +\*ๆณจ๏ผš้ƒจๅˆ†ๆจกๅž‹ๅœจไธๅŒๅนณๅฐไธŠ็š„ไธŠไธ‹ๆ–‡้™ๅˆถไธๅŒใ€‚่ฏทๆŸฅ็œ‹็‰นๅฎšๆไพ›ๅ•†็š„ YAML ๆ–‡ไปถ่Žทๅ–ๅ‡†็กฎๅ€ผใ€‚ + +## ๅ„ไธŠไธ‹ๆ–‡ๅฑ‚็บง็š„ๆœ€ไฝณๆ€งไปทๆฏ” + +### 1M+ tokens๏ผˆๆœ€ไพฟๅฎœ๏ผ‰ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | +| ---------------- | ----------- | ---------------: | --------: | +| Llama 4 Scout | OpenRouter | $0.08 | $0.30 | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | +| Llama 4 Scout | Together AI | $0.15 | $0.60 | +| Llama 4 Scout | Meta | ๅ…่ดน๏ผˆๅผ€ๆบๆƒ้‡๏ผ‰ | โ€” | + 
+### 128Kโ€“256K tokens๏ผˆๆœ€ไพฟๅฎœ๏ผ‰ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | +| ------------- | --------- | --------: | --------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-30B-A3B | ้˜ฟ้‡Œไบ‘ | ยฅ0.10 | ยฅ0.30 | +| Phi-4 | Microsoft | $0.10 | $0.40 | +| Gemma 3 27B | Google | $0.20 | $0.80 | + +## ่ฆ็‚นๆ€ป็ป“ + +- **Llama 4 Scout** ๆ‹ฅๆœ‰ๆœ€ๅคง็š„ไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผŒ่พพ **10M tokens** โ€” ๆ˜ฏๅ…ถไป–ๆจกๅž‹็š„ 10 ๅ€ +- **1M+ ไธŠไธ‹ๆ–‡**็Žฐๅทฒๅœจ 6+ ไธชๆไพ›ๅ•†ไธญๅฏ็”จ๏ผŒๅŒ…ๆ‹ฌๅ…่ดนๅผ€ๆบๆƒ้‡ๆจกๅž‹ +- **128K ไธŠไธ‹ๆ–‡**ๆ˜ฏๆœ€ๅธธ่ง็š„ๅฑ‚็บง๏ผˆ1,310 ไธชๆจกๅž‹๏ผ‰โ€” ่ถณไปฅๆปก่ถณๅคงๅคšๆ•ฐ็”จไพ‹ +- **ๆˆๆœฌ้šไธŠไธ‹ๆ–‡ๅขž้•ฟ**๏ผš1M+ ไธŠไธ‹ๆ–‡ๆจกๅž‹็š„ๆฏ token ๆˆๆœฌๆ˜ฏ 128K ๆจกๅž‹็š„ 2โ€“10 ๅ€ +- **็ผ“ๅญ˜่ฏปๅ–ๅฎšไปท**ๅฏๆ˜พ่‘—้™ไฝŽ้‡ๅคๆŸฅ่ฏข็š„ๆˆๆœฌ๏ผˆๆœ€้ซ˜ 90% ๆŠ˜ๆ‰ฃ๏ผ‰ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ๆŽจ่ +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ๅ„ๆไพ›ๅ•†ๅฎšไปทๅนถๆŽ’ๅฏนๆฏ” +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰ไธŠไธ‹ๆ–‡็ช—ๅฃๅˆ†็ฑป +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 ไธช่ง†่ง‰ๆจกๅž‹ๅซไธŠไธ‹ๆ–‡ไฟกๆฏ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/data-acquisition.md b/docs/zh/data-acquisition.md index 83578930..936a65f3 100644 --- a/docs/zh/data-acquisition.md +++ b/docs/zh/data-acquisition.md @@ -256,3 +256,15 @@ parseModality | toLowerCase | toUpperCase | trim | removeCommas | identity 2. ็›ดๆŽฅๆ›ดๆ–ฐ YAML ๆ–‡ไปถ 3. ๅฐ† `last_updated` ่ฎพไธบๅฝ“ๅ‰ๆ—ฅๆœŸ 4. 
用 `npm run validate` 验证 + +## 相关文档 + +- [数据模式](data-schema.md) — 完整 YAML 模式参考 +- [设计原则](lessons-learned.md) — 经验教训 +- [提供商概览](providers.md) — 95 个提供商 +- [常见问题](faq.md) — 常见问题 +- [贡献指南](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) — 如何贡献 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML，包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/data-schema.md b/docs/zh/data-schema.md new file mode 100644 index 00000000..ded0ab32 --- /dev/null +++ b/docs/zh/data-schema.md @@ -0,0 +1,221 @@ +[English](../data-schema.md) | **中文** + +# 数据 Schema 参考 + +本目录使用的 YAML 数据 Schema 完整参考。所有模型数据文件遵循 [`types/`](../../types/) 中的 TypeScript 类型定义，并在运行时由 [`types/schemas.ts`](../../types/schemas.ts) 中的 Zod schema 校验。 + +## 模型 Schema + +每个模型是 `providers/<provider>/models/<model-id>.yaml` 下的单个 YAML 文件。 + +### 必填字段 + +| 字段 | 类型 | 描述 | 示例 | +| -------------- | ------- | ---------------------------------------- | ------------------------------------------ | +| `id` | string | 稳定的模型 ID（无日期后缀） | `gpt-4o`, `claude-sonnet-4-5` | +| `name` | string | 显示名称 | `GPT-4o`, `Claude Sonnet 4.5` | +| `family` | string | 模型家族（广泛谱系） | `gpt-4o`, `claude-sonnet` | +| `pricing` | Pricing | 模型定价（见下文） | — | +| `modalities` | object | 输入/输出模态 | `{ input: [text, image], output: [text] }` | +| `last_updated` | string | 最后数据更新日期 (YYYY-MM-DD 或 YYYY-MM) | `2024-08-06` | + +### 可选字段 + +| 字段 | 类型 | 默认值 | 描述 | 示例 | +| ------------------- | ------- | ------- | ------------------------ | ------------------------------------ | +| 
`reasoning` | boolean | `false` | ๆ”ฏๆŒๆŽจ็†/ๆ€่€ƒๆจกๅผ | `true` | +| `temperature` | boolean | `true` | ๆ”ฏๆŒ temperature ๅ‚ๆ•ฐ | `false` | +| `tool_call` | boolean | `false` | ๆ”ฏๆŒๅทฅๅ…ท/ๅ‡ฝๆ•ฐ่ฐƒ็”จ | `true` | +| `attachment` | boolean | `false` | ๆ”ฏๆŒๆ–‡ไปถ้™„ไปถ | `true` | +| `structured_output` | boolean | `false` | ๆ”ฏๆŒ็ป“ๆž„ๅŒ–/JSON ่พ“ๅ‡บ | `true` | +| `open_weights` | boolean | `false` | ๅผ€ๆบๆƒ้‡ๆจกๅž‹ | `true` | +| `deprecated` | boolean | `false` | ๅทฒๅผƒ็”จไฝ†ไปๅฏ่ฎฟ้—ฎ | `true` | +| `limit` | object | โ€” | Token ้™ๅˆถ | `{ context: 128000, output: 16384 }` | +| `limit.context` | number | โ€” | ไธŠไธ‹ๆ–‡็ช—ๅฃๅคงๅฐ๏ผˆtokens๏ผ‰ | `128000` | +| `limit.output` | number | โ€” | ๆœ€ๅคง่พ“ๅ‡บ tokens | `16384` | +| `knowledge` | string | โ€” | ่ฎญ็ปƒๆ•ฐๆฎๆˆชๆญขๆ—ฅๆœŸ | `2023-10` | +| `release_date` | string | โ€” | ๆจกๅž‹ๅ‘ๅธƒๆ—ฅๆœŸ | `2024-05-13` | +| `snapshots` | array | โ€” | ๅธฆๆ—ฅๆœŸ็š„ๆจกๅž‹็‰ˆๆœฌ | ่งไธ‹ๆ–‡ | + +### ๆจกๆ€็ฑปๅž‹ + +| ๆจกๆ€ | ๆ่ฟฐ | +| ------- | -------------- | +| `text` | ๆ–‡ๆœฌ่พ“ๅ…ฅๆˆ–่พ“ๅ‡บ | +| `image` | ๅ›พๅƒ่พ“ๅ…ฅๆˆ–่พ“ๅ‡บ | +| `video` | ่ง†้ข‘่พ“ๅ…ฅ | +| `audio` | ้Ÿณ้ข‘่พ“ๅ…ฅๆˆ–่พ“ๅ‡บ | +| `pdf` | PDF ๆ–‡ๆกฃ่พ“ๅ…ฅ | + +## ๅฎšไปท Schema + +ๅฎšไปทๆ˜ฏๅ››็ง็ฑปๅž‹็š„่”ๅˆไฝ“ใ€‚ๆฏไธชๆจกๅž‹ๅชไฝฟ็”จไธ€็งใ€‚ + +### TokenPricing๏ผˆๆœ€ๅธธ่ง๏ผ‰ + +ๆŒ‰็™พไธ‡ token ่ฎก่ดนใ€‚่ดงๅธ้ป˜่ฎค USD๏ผŒๅ•ไฝ้ป˜่ฎค `per_mtok`ใ€‚ + +```yaml +pricing: + currency: USD # ๅฏ้€‰๏ผŒ้ป˜่ฎค USD + unit: per_mtok # ๅฏ้€‰๏ผŒ้ป˜่ฎค per_mtok + input: 2.5 # $/็™พไธ‡ ่พ“ๅ…ฅ token + output: 10 # $/็™พไธ‡ ่พ“ๅ‡บ token + cache_write: 1.25 # ๅฏ้€‰๏ผŒ$/็™พไธ‡ ็ผ“ๅญ˜ๅ†™ๅ…ฅ + cache_read: 0.625 # ๅฏ้€‰๏ผŒ$/็™พไธ‡ ็ผ“ๅญ˜่ฏปๅ– +``` + +**่ฟ›้˜ถ๏ผšๆŒ‰ไธŠไธ‹ๆ–‡้•ฟๅบฆๅˆ†ๅฑ‚ๅฎšไปท** + +```yaml +pricing: + input: + - up_to: 128000 # โ‰ค 128K ไธŠไธ‹ๆ–‡ + price: 2.5 + - price: 5.0 # > 128K ไธŠไธ‹ๆ–‡๏ผˆๆ—  up_to = ๆœ€็ปˆๅฑ‚็บง๏ผ‰ + output: 10 +``` + +**่ฟ›้˜ถ๏ผšๆŒ‰ๆจกๆ€ๅฎšไปท** + +```yaml +pricing: + input: + text: 1.25 + image: 2.5 + audio: 
5.0 + output: + text: 5.0 + audio: 10.0 +``` + +### VideoPricing + +按秒计费，可选按分辨率分层。 + +```yaml +pricing: + currency: USD + unit: per_second + price: 0.03 # 固定每秒价格 +``` + +```yaml +pricing: + unit: per_second + price: # 按分辨率定价 + 720p: 0.02 + 1080p: 0.03 + 4k: 0.05 +``` + +### UnitPricing + +按图像或按请求计费。 + +```yaml +pricing: + unit: per_image + price: 0.04 +``` + +```yaml +pricing: + unit: per_request + price: 0.005 +``` + +### FreePricing + +免费。 + +```yaml +pricing: + unit: free +``` + +## 快照 Schema + +快照代表模型的带日期版本。它们继承父级的所有字段，只覆盖不同的部分。 + +```yaml +id: gpt-4o +name: GPT-4o +# ... 父级字段 ... +snapshots: + - id: gpt-4o-2024-08-06 # 最新的在前 + last_updated: "2024-08-06" + - id: gpt-4o-2024-05-13 + deprecated: true # 此快照已弃用 + last_updated: "2024-05-13" +``` + +快照可以覆盖父级的任何可选字段： + +```yaml +snapshots: + - id: gemini-2.0-flash-exp + limit: + context: 1048576 # 不同的上下文窗口 + output: 8192 + pricing: + unit: free # 实验版 = 免费 +``` + +## 提供商 Schema + +每个提供商在 `providers/<provider>/provider.yaml` 有一个 `provider.yaml` 文件。 + +| 字段 | 类型 | 必填 | 描述 | 示例 | +| ---------------- | ------ | ---- | ------------------------- | ---------------------------------- | +| `id` | string | ✅ | 提供商 ID（与目录名匹配） | `openai` | +| `name` | string | ✅ | 显示名称 | `OpenAI` | +| `url` | string | ✅ | 官方网站 URL | `https://openai.com` | +| `api_docs` | string | ❌ | API 文档 URL | `https://platform.openai.com/docs` | +| `apis` | object | ✅ | 按格式分类的 API 端点 | 见下文 | +| `apis.openai` | string | ❌ | OpenAI 兼容 API 端点 | `https://api.openai.com/v1` | +| `apis.anthropic` | string | ❌ | Anthropic API 端点 | — | +| `apis.google` | string | ❌ | Google AI API 端点 | — | +| 
`currency` | string | โŒ | ้ป˜่ฎค่ดงๅธ (USD/CNY/EUR) | `USD` | + +### API ๆ ผๅผ + +| ๆ ผๅผ | ๆ่ฟฐ | ไฝฟ็”จ่€… | +| ----------- | ---------------------------------- | ----------------- | +| `openai` | OpenAI ๅ…ผๅฎน็š„ Chat Completions API | ๅคงๅคšๆ•ฐๆไพ›ๅ•† | +| `anthropic` | Anthropic Messages API | Anthropic | +| `google` | Google Generative AI API | Google, Vertex AI | + +## ่ดงๅธๅ‚่€ƒ + +| ่ดงๅธ | ไปฃ็  | ไฝฟ็”จ่€… | +| ------ | ----- | ----------------------------------------- | +| ็พŽๅ…ƒ | `USD` | ๅคงๅคšๆ•ฐๆไพ›ๅ•†๏ผˆ้ป˜่ฎค๏ผ‰ | +| ไบบๆฐ‘ๅธ | `CNY` | ้˜ฟ้‡Œไบ‘ใ€302.AIใ€AIHubMixใ€PPIO ็ญ‰ | +| ๆฌงๅ…ƒ | `EUR` | Bergetใ€CloudFerroใ€OVHcloudใ€Scaleway ็ญ‰ | + +## ๆ ก้ชŒ + +ๆ‰€ๆœ‰ YAML ๆ–‡ไปถๅœจ่ฟ่กŒๆ—ถ็”ฑ Zod schema ๆ ก้ชŒ๏ผš + +```bash +# ๆ ก้ชŒๆ‰€ๆœ‰ๆจกๅž‹ๆ•ฐๆฎ +npx tsx scripts/validate.ts + +# ๆ ก้ชŒ็‰นๅฎšๆไพ›ๅ•† +npx tsx scripts/validate.ts openai +``` + +ๆ ก้ชŒไฝฟ็”จ [`types/schemas.ts`](../../types/schemas.ts) ไธญ็š„ `ModelSchema`๏ผŒไธŽ TypeScript ็ฑปๅž‹ๅฎŒๅ…จๅฏนๅบ”ใ€‚ไปปไฝ•ไธ็ฌฆๅˆ schema ็š„ YAML ๆ–‡ไปถๅฐ†ไบง็”Ÿๆ ก้ชŒ้”™่ฏฏ๏ผŒๅŒ…ๅซๅ…ทไฝ“็š„ๅญ—ๆฎต่ทฏๅพ„ๅ’Œ้—ฎ้ข˜ใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆ•ฐๆฎ่Žทๅ–](data-acquisition.md) โ€” ๅฆ‚ไฝ•่Žทๅ–ๅ’Œๆ›ดๆ–ฐๆ•ฐๆฎ +- [API ไธŽ็ผ–็จ‹่ฎฟ้—ฎ](api.md) โ€” npmใ€CDNใ€CSV ่ฎฟ้—ฎ +- [ไปฃ็ ็คบไพ‹](code-examples.md) โ€” ๅฎž็”จไปฃ็ ็คบไพ‹ +- [่ฎพ่ฎกๅŽŸๅˆ™](lessons-learned.md) โ€” ็ป้ชŒๆ•™่ฎญ +- [ๅธธ่ง้—ฎ้ข˜](faq.md) โ€” ๅธธ่ง้—ฎ้ข˜ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/embedding-models.md b/docs/zh/embedding-models.md new file mode 100644 index 00000000..6fbf69c3 --- /dev/null +++ b/docs/zh/embedding-models.md @@ -0,0 +1,71 @@ +# ๅตŒๅ…ฅๆจกๅž‹ + +[English](../embedding-models.md) + +็”Ÿๆˆ**ๅ‘้‡ๅตŒๅ…ฅ**็š„ AI ๆจกๅž‹ โ€” 
ๆ–‡ๆœฌใ€ๅ›พๅƒๅ’Œๅ…ถไป–ๆ•ฐๆฎ็š„ๆ•ฐๅ€ผ่กจ็คบใ€‚่ฏญไน‰ๆœ็ดขใ€RAG๏ผˆๆฃ€็ดขๅขžๅผบ็”Ÿๆˆ๏ผ‰ใ€่š็ฑปๅ’Œ็›ธไผผๅบฆไปปๅŠก็š„ๅŸบ็ก€ใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆๅตŒๅ…ฅๆจกๅž‹ๅพˆ้‡่ฆ + +ๅตŒๅ…ฅๆจกๅž‹ๆ˜ฏ่ฎธๅคš AI ็ณป็ปŸ็š„ๅŸบ็ก€๏ผš + +- **่ฏญไน‰ๆœ็ดข** โ€” ๆŒ‰ๅซไน‰่€Œ้žๅ…ณ้”ฎ่ฏๆŸฅๆ‰พ็›ธๅ…ณๆ–‡ๆกฃ +- **RAG** โ€” ไธบ LLM ๆฃ€็ดขไธŠไธ‹ๆ–‡ไปฅ็”Ÿๆˆๆœ‰ไพๆฎ็š„็ญ”ๆกˆ +- **่š็ฑป** โ€” ๅฐ†็›ธไผผ้กน็›ฎๅˆ†็ป„ +- **็›ธไผผๅบฆ** โ€” ๆŸฅๆ‰พ้‡ๅค้กนใ€ๆŽจ่ๅ’Œ็›ธๅ…ณๅ†…ๅฎน +- **ๅˆ†็ฑป** โ€” ้€š่ฟ‡ๅตŒๅ…ฅ่ฟ›่กŒ้›ถๆ ทๆœฌๅ’Œๅฐ‘ๆ ทๆœฌๅˆ†็ฑป + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ---------------- | ---- | +| ๅตŒๅ…ฅๆจกๅž‹ | 5 | +| ๆไพ›ๅ•† | 3 | +| ๅ…่ดนๅตŒๅ…ฅๆจกๅž‹ | 0 | +| ๅผ€ๆบๆƒ้‡ๅตŒๅ…ฅๆจกๅž‹ | 1 | + +## ๆไพ›ๅ•† + +`openai`ใ€`tencent`ใ€`upstage` + +## ๅ…่ดนๅตŒๅ…ฅๆจกๅž‹ + +ๅ…่ดนๅตŒๅ…ฅๆจกๅž‹ โ€” ้›ถๆˆๆœฌ่ฏญไน‰ๆœ็ดขๅ’Œ RAGใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | +| ---- | ------ | ------ | -------- | + +## ๆœ€ไพฟๅฎœๅตŒๅ…ฅๆจกๅž‹ + +็”Ÿไบง็ŽฏๅขƒๅตŒๅ…ฅ็š„ๆœ€ไฝณๆ€งไปทๆฏ”ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | +| ----------------------- | ------- | ------ | -------- | --- | +| text-embedding-3-small | openai | 8K | $0.02 | | +| solar-embedding-1-large | upstage | 0 | $0.1 | ๐Ÿ”“ | +| text-embedding-ada-002 | openai | 8K | $0.1 | | +| text-embedding-3-large | openai | 8K | $0.13 | | +| hunyuan-embedding | tencent | 0 | $0.7 | | + +## ๅคงไธŠไธ‹ๆ–‡ๅตŒๅ…ฅๆจกๅž‹ + +ไธŠไธ‹ๆ–‡็ช—ๅฃๆœ€ๅคง็š„ๅตŒๅ…ฅๆจกๅž‹ โ€” ้€‚็”จไบŽๅตŒๅ…ฅ้•ฟๆ–‡ๆกฃใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | +| ---------------------- | ------ | ------ | -------- | --- | +| text-embedding-ada-002 | openai | 8K | $0.1 | | +| text-embedding-3-small | openai | 8K | $0.02 | | +| text-embedding-3-large | openai | 8K | $0.13 | | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑป +- [ๅผ€ๆบๆƒ้‡](open-weights.md) โ€” 527 ไธชๅผ€ๆบๆƒ้‡ๆจกๅž‹ +- 
[ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [API ๅ‚่€ƒ](api.md) โ€” ็ผ–็จ‹่ฎฟ้—ฎ +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” 5 ๅˆ†้’ŸไธŠๆ‰‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/faq.md b/docs/zh/faq.md new file mode 100644 index 00000000..34a39187 --- /dev/null +++ b/docs/zh/faq.md @@ -0,0 +1,114 @@ +# ๅธธ่ง้—ฎ้ข˜ + +[English](../faq.md) + +## ้€š็”จ + +### ไป€ไนˆๆ˜ฏ AI Models Catalog๏ผŸ + +AI Models Catalog ๆ˜ฏไธ€ไธช็ป“ๆž„ๅŒ–็š„ YAML ็›ฎๅฝ•๏ผŒๆ”ถๅฝ•ไบ† 95+ ไธช AI ๆไพ›ๅ•†็š„ๆจกๅž‹ๅ…ƒๆ•ฐๆฎใ€‚ๅŒ…ๆ‹ฌๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃใ€ๆจกๆ€ใ€่ƒฝๅŠ›็ญ‰ไฟกๆฏโ€”โ€”ๆ‰€ๆœ‰ๆ•ฐๆฎๅ‡ๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๅฎ˜ๆ–นๆ–‡ๆกฃใ€‚ + +### ไธŽๅ…ถไป–ๆจกๅž‹็›ฎๅฝ•ๆœ‰ไฝ•ไธๅŒ๏ผŸ + +- **ไป…ไฝฟ็”จไธ€ๆ‰‹ๆ•ฐๆฎ** โ€” ๆ‰€ๆœ‰ๆ•ฐๆฎ็›ดๆŽฅๆฅ่‡ชๆไพ›ๅ•† API ๅ’Œๅฎ˜ๆ–นๆ–‡ๆกฃ๏ผŒ่€Œ้ž็ฌฌไธ‰ๆ–น่šๅˆๅ™จ +- **็ป“ๆž„ๅŒ– YAML** โ€” ๆœบๅ™จๅฏ่ฏป๏ผŒๆ”ฏๆŒ TypeScript ็ฑปๅž‹ๅ’Œ Zod ๆ ก้ชŒ +- **ๅ…จ้ข็š„ๅ…ƒๆ•ฐๆฎ** โ€” ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃใ€ๆจกๆ€ใ€่ƒฝๅŠ›ใ€ๅฟซ็…ง +- **็ผ–็จ‹่ฎฟ้—ฎ** โ€” npm ๅŒ…ใ€CDNใ€GitHub Actionใ€CSV ๅฏผๅ‡บ +- **ๅผ€ๆบ** โ€” ็คพๅŒบ้ฉฑๅŠจ๏ผŒ่‡ชๅŠจๅŒ–ๆŠ“ๅ– + +### ๆ•ฐๆฎๅคšไน…ๆ›ดๆ–ฐไธ€ๆฌก๏ผŸ + +ๆ•ฐๆฎ้€š่ฟ‡่‡ชๅŠจๅŒ– CI ๅทฅไฝœๆตๆฏๅ‘จๅŒๆญฅใ€‚ๆไพ›ๅ•† API ๅœจๅ‘จไธ€ๅฎšๆ—ถๆŠ“ๅ–๏ผŒnpm ๅŒ…ๅœจๆ–ฐ็‰ˆๆœฌๅ‘ๅธƒๆ—ถ่‡ชๅŠจๅ‘ๅธƒใ€‚ + +## ่ฎฟ้—ฎไธŽไฝฟ็”จ + +### ๅฆ‚ไฝ•่Žทๅ–ๆ•ฐๆฎ๏ผŸ + +ๆœ‰ๅคš็งๆ–นๅผ๏ผš + +| ๆ–นๅผ | ้€‚็”จๅœบๆ™ฏ | +| ------------------------------------------------------------------------------------- | -------------------------- | +| `npm install ai-models` | TypeScript/JavaScript ้กน็›ฎ | +| `curl https://github.com/i-need-token/ai-models/releases/latest/download/models.json` | ไปปไฝ•่ฏญ่จ€็š„ๅฟซ้€Ÿ่ฎฟ้—ฎ | +| GitHub Action | CI/CD ๆตๆฐด็บฟ | +| CSV ไธ‹่ฝฝ | Excelใ€ๆ•ฐๆฎๅˆ†ๆž | +| Hugging Face ๆ•ฐๆฎ้›† | ML ๅทฅไฝœๆต | + +่ฏฆ่ง[ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md)ใ€‚ + +### 
ๆ•ฐๆฎๅ…่ดนไฝฟ็”จๅ—๏ผŸ + +ๆ˜ฏ็š„๏ผ็›ฎๅฝ•ๆ•ฐๆฎ้‡‡็”จ MIT ่ฎธๅฏ่ฏๅ‘ๅธƒ๏ผŒๅฏๅœจๅ•†ไธšๅ’Œ้žๅ•†ไธš้กน็›ฎไธญๆ— ้™ๅˆถไฝฟ็”จใ€‚ + +### ๅฎšไปทๆ•ฐๆฎๅ‡†็กฎๅ—๏ผŸ + +ๅฎšไปทๆ•ฐๆฎ็›ดๆŽฅๆฅ่‡ชๆฏไธชๆไพ›ๅ•†็š„ๅฎ˜ๆ–น API ๅ’Œๆ–‡ๆกฃใ€‚ไฝ†ๆไพ›ๅ•†ๅฏ่ƒฝๅœจไธ้€š็Ÿฅ็š„ๆƒ…ๅ†ตไธ‹ๆ›ดๆ”นๅฎšไปทใ€‚ๅœจๅšๅ‡บๅ…ณ้”ฎๅฎšไปทๅ†ณ็ญ–ๆ—ถ๏ผŒ่ฏทๅŠกๅฟ…ๅฏน็…งๆไพ›ๅ•†่‡ชๅทฑ็š„็ฝ‘็ซ™่ฟ›่กŒๆ ธๅฎžใ€‚ + +## ๆŠ€ๆœฏ + +### ไธบไป€ไนˆ็”จ YAML ่€Œไธๆ˜ฏ JSON๏ผŸ + +YAML ๆ”ฏๆŒๆณจ้‡Š๏ผŒๆ›ด้€‚ๅˆๆ‰‹ๅŠจ็ผ–่พ‘๏ผŒๅนถๅ…่ฎธๆจกๅž‹ๆ–‡ไปถๅ†…็š„ๅฟซ็…ง็ปงๆ‰ฟใ€‚ๆ•ฐๆฎไผš็ผ–่ฏ‘ไธบ JSON ไปฅไพ›็ผ–็จ‹ไฝฟ็”จใ€‚ + +### ไป€ไนˆๆ˜ฏๅฟซ็…ง็ปงๆ‰ฟ๏ผŸ + +ๅœจๅ•ไธชๆจกๅž‹ๆ–‡ไปถๅ†…๏ผŒๅฟซ็…งไปŽ็ˆถๆจกๅž‹็ปงๆ‰ฟๅญ—ๆฎต๏ผŒๅช่ฆ†็›–ไธๅŒ็š„้ƒจๅˆ†ใ€‚่ฟ™ไฝฟๆจกๅž‹ๆ–‡ไปถไฟๆŒ DRY๏ผŒๆ— ้œ€่ทจๆจกๅž‹็ปงๆ‰ฟใ€‚ + +### ๅฆ‚ไฝ•ๆ ก้ชŒ YAML ๆ–‡ไปถ๏ผŸ + +```bash +# ไฝฟ็”จๅ†…็ฝฎๆ ก้ชŒๅ™จ +npx tsx scripts/validate.ts + +# ไฝฟ็”จ JSON Schema +npx ajv validate -s schema.json -d providers/openai/models/gpt-4o.yaml +``` + +### ๅฏไปฅๅœจ CI/CD ๆตๆฐด็บฟไธญไฝฟ็”จๅ—๏ผŸ + +ๅฏไปฅ๏ผไฝฟ็”จๅฏๅค็”จ็š„ GitHub Action๏ผš + +```yaml +- uses: i-need-token/ai-models@v1 + with: + format: json + filter: "[?tool_call && open_weights]" +``` + +่ฏฆ่ง [API ๆ–‡ๆกฃ](api.md#github-action)ใ€‚ + +## ่ดก็Œฎ + +### ๅฆ‚ไฝ•ๆทปๅŠ ๆ–ฐ็š„ๆไพ›ๅ•†๏ผŸ + +ๅ‚่ง[่ดก็ŒฎๆŒ‡ๅ—](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md)็š„ๅˆ†ๆญฅ่ฏดๆ˜Žใ€‚็ฎ€่ฆๆญฅ้ชค๏ผš + +1. ๅˆ›ๅปบ `providers//provider.yaml` +2. ๅˆ›ๅปบ `providers//scrape.ts`๏ผŒๅŒ…ๅซ `scrape()` ๅ‡ฝๆ•ฐ +3. 
่ฟ่กŒ `npx tsx scripts/validate.ts` ๆ ก้ชŒ + +### ๅฆ‚ไฝ•ๆŠฅๅ‘Šๆ•ฐๆฎ้”™่ฏฏ๏ผŸ + +ๆไบค[ๆ•ฐๆฎๆ›ดๆ–ฐ issue](https://github.com/i-need-token/ai-models/issues/new?template=data_update.md)๏ผŒๆณจๆ˜Žๆไพ›ๅ•†ๅ็งฐใ€ๆจกๅž‹ ID ๅ’Œ้œ€่ฆๆ›ดๆญฃ็š„ๅ†…ๅฎนใ€‚ + +### ไธๅ†™ไปฃ็ ไนŸ่ƒฝ่ดก็Œฎๅ—๏ผŸ + +ๅฝ“็„ถๅฏไปฅ๏ผไฝ ๅฏไปฅ๏ผš + +- โญ ็ป™ไป“ๅบ“ๅŠ ๆ˜Ÿ๏ผŒๅธฎๅŠฉๆ›ดๅคšไบบๅ‘็Žฐ +- ๐Ÿ“ข ๅˆ†ไบซ็ป™ไฝ ็š„็ฝ‘็ปœ +- ๐Ÿ› ๆŠฅๅ‘Šๆ•ฐๆฎ้—ฎ้ข˜ๆˆ– bug +- ๐Ÿ“– ๆ”น่ฟ›ๆ–‡ๆกฃ +- ๐Ÿท๏ธ ๅปบ่ฎฎๆทปๅŠ ๆ–ฐ็š„ๆไพ›ๅ•† + +--- + +ๆ›ดๅคš้—ฎ้ข˜๏ผŸ[ๆไบค issue](https://github.com/i-need-token/ai-models/issues/new) ๆˆ–ๅ‘่ตท[่ฎจ่ฎบ](https://github.com/i-need-token/ai-models/discussions)ใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” 30 ็ง’ๅ†…ๆ‰พๅˆฐ้€‚ๅˆ็š„ๆจกๅž‹ +- [API ไธŽ็ผ–็จ‹่ฎฟ้—ฎ](api.md) โ€” npmใ€CDNใ€CSV ่ฎฟ้—ฎ +- [ๆœฏ่ฏญ่กจ](glossary.md) โ€” ๅ…ณ้”ฎๆœฏ่ฏญๅ’Œๅฎšไน‰ +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅ†ณ็ญ–ๆก†ๆžถ diff --git a/docs/zh/free-models.md b/docs/zh/free-models.md new file mode 100644 index 00000000..c85e0fc4 --- /dev/null +++ b/docs/zh/free-models.md @@ -0,0 +1,124 @@ +[English](../free-models.md) | **ไธญๆ–‡** + +# ๅ…่ดน AI ๆจกๅž‹ + +ๆœฌ็›ฎๅฝ•ไธญๆœ‰ 81 ไธชๆจกๅž‹ๅฏๅ…่ดนไฝฟ็”จใ€‚ๆœฌ้กตๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑปๅˆ—ๅ‡บ๏ผŒๅธฎๅŠฉไฝ ๆ‰พๅˆฐ้€‚ๅˆ้กน็›ฎ็š„ๅ…่ดนๆจกๅž‹ใ€‚ + +> ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๆ–‡ๆกฃใ€‚ๅ…่ดนๅฑ‚ๅฏ่ƒฝๆœ‰้€Ÿ็އ้™ๅˆถ โ€” ่ฏทๆŸฅ็œ‹ๆไพ›ๅ•†็ฝ‘็ซ™ไบ†่งฃ่ฏฆๆƒ…ใ€‚ + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ่ƒฝๅŠ› | ๅ…่ดนๆจกๅž‹ๆ•ฐ | +| -------------------- | ---------: | +| ๆ€ปๅ…่ดนๆจกๅž‹ | 81 | +| ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ | 45 | +| ๆ”ฏๆŒๆŽจ็† | 11 | +| ๆ”ฏๆŒ่ง†่ง‰๏ผˆๅ›พๅƒ่พ“ๅ…ฅ๏ผ‰ | 17 | + +## ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๅ…่ดนๆจกๅž‹ + +่ฟ™ไบ›ๆจกๅž‹ๆ”ฏๆŒๅ‡ฝๆ•ฐ/ๅทฅๅ…ท่ฐƒ็”จไธ”้›ถๆˆๆœฌ โ€” ้€‚ๅˆๆž„ๅปบ AI ไปฃ็†ๅ’Œ่‡ชๅŠจๅŒ–๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่ง†่ง‰ | +| ------------------------------ | ------ | ------ | ---- | +| gemini-2.0-flash | Google | 1M | โœ… | +| gemini-2.5-flash-preview-05-20 | Google 
| 1M | โœ… | +| gemma-3-27b-it | Chutes | 128K | โœ… | +| qwen3-235b-a22b | Chutes | 128K | โœ… | +| qwen3-30b-a3b | Chutes | 128K | โœ… | +| qwen3-4b | Chutes | 128K | โœ… | +| deepseek-r1 | Chutes | 128K | โŒ | +| deepseek-v3-0324 | Chutes | 128K | โŒ | +| llama-4-maverick | Chutes | 1M | โœ… | +| llama-4-scout | Chutes | 10M | โœ… | +| llama-3.3-70b-instruct | Chutes | 128K | โŒ | +| qwen2.5-72b-instruct | Chutes | 128K | โŒ | +| mistral-small-3.1-24b-instruct | Chutes | 128K | โœ… | +| phi-4 | Chutes | 16K | โŒ | +| command-r | Chutes | 128K | โŒ | + +## ๆ”ฏๆŒๆŽจ็†็š„ๅ…่ดนๆจกๅž‹ + +่ฟ™ไบ›ๆจกๅž‹ๆ”ฏๆŒ้“พๅผๆ€็ปดๆŽจ็†ไธ”้›ถๆˆๆœฌ๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | +| ------------------------------ | ------ | ------ | +| gemini-2.5-flash-preview-05-20 | Google | 1M | +| deepseek-r1 | Chutes | 128K | +| deepseek-r1-0528 | Chutes | 128K | +| qwen3-235b-a22b | Chutes | 128K | +| qwen3-30b-a3b | Chutes | 128K | +| qwen3-4b | Chutes | 128K | +| gemma-3-27b-it | Chutes | 128K | +| phi-4-reasoning | Chutes | 32K | + +## ๆ”ฏๆŒ่ง†่ง‰็š„ๅ…่ดนๆจกๅž‹ + +่ฟ™ไบ›ๆจกๅž‹ๆŽฅๅ—ๅ›พๅƒ่พ“ๅ…ฅไธ”้›ถๆˆๆœฌ๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | +| ------------------------------ | ------ | ------ | +| gemini-2.0-flash | Google | 1M | +| gemini-2.5-flash-preview-05-20 | Google | 1M | +| gemma-3-27b-it | Chutes | 128K | +| qwen3-235b-a22b | Chutes | 128K | +| llama-4-maverick | Chutes | 1M | +| llama-4-scout | Chutes | 10M | +| mistral-small-3.1-24b-instruct | Chutes | 128K | + +## ๆŒ‰ๆไพ›ๅ•†ๅˆ†็ฑป + +### Google๏ผˆ้€š่ฟ‡ AI Studio๏ผ‰ + +Google ้€š่ฟ‡ AI Studio ๆไพ›ๅ…่ดน Gemini ๆจกๅž‹่ฎฟ้—ฎ๏ผˆๆœ‰้€Ÿ็އ้™ๅˆถ๏ผ‰๏ผš + +- gemini-2.0-flash โ€” 1M ไธŠไธ‹ๆ–‡๏ผŒๅทฅๅ…ท่ฐƒ็”จ๏ผŒ่ง†่ง‰๏ผŒๆŽจ็† +- gemini-2.5-flash-preview-05-20 โ€” 1M ไธŠไธ‹ๆ–‡๏ผŒๅทฅๅ…ท่ฐƒ็”จ๏ผŒ่ง†่ง‰๏ผŒๆŽจ็† + +### Chutes + +Chutes ๆไพ›ๅ…่ดน็คพๅŒบๆ‰˜็ฎกๆŽจ็†๏ผŒๆ”ฏๆŒๅผ€ๆบๆƒ้‡ๆจกๅž‹๏ผš + +- 70+ ไธชๅ…่ดนๆจกๅž‹๏ผŒๅŒ…ๆ‹ฌ Llama 4ใ€Qwen3ใ€DeepSeek-R1ใ€Gemma 3ใ€Mistralใ€Phi-4 +- 
ๆœ€ๅคงๅ…่ดนๆจกๅž‹๏ผšLlama 4 Scout๏ผˆ10M ไธŠไธ‹ๆ–‡๏ผ‰ +- ๆœ€ไฝณๅ…่ดนๆŽจ็†๏ผšDeepSeek-R1ใ€Qwen3-235B-A22B + +### Cloudflare Workers AI + +Cloudflare ๆไพ›ๅ…่ดน่พน็ผ˜ๆŽจ็†๏ผš + +- ๅ„็งๅฐๅž‹ๅ’Œไธญๅž‹ๆจกๅž‹๏ผˆๆœ‰้€Ÿ็އ้™ๅˆถ๏ผ‰ +- ่พน็ผ˜้ƒจ็ฝฒ๏ผŒไฝŽๅปถ่ฟŸ + +### Cerebras + +Cerebras ไธบ้ƒจๅˆ†ๆจกๅž‹ๆไพ›ๅ…่ดนๅฑ‚๏ผš + +- ไฝฟ็”จ CS-3 ๆ™ถๅœ†็บงๅผ•ๆ“Ž็š„ๅฟซ้€ŸๆŽจ็† + +### Groq + +Groq ไธบ้ƒจๅˆ†ๆจกๅž‹ๆไพ›ๅ…่ดนๅฑ‚๏ผš + +- ไฝฟ็”จ LPU ๅŠ ้€Ÿ็š„่ถ…ๅฟซๆŽจ็† + +## ่ฆ็‚นๆ€ป็ป“ + +- **Google AI Studio** ๆไพ›ๆ•ดไฝ“ๆœ€ไฝณ็š„ๅ…่ดนๆจกๅž‹ โ€” 1M ไธŠไธ‹ๆ–‡ใ€ๅทฅๅ…ท่ฐƒ็”จใ€่ง†่ง‰ๅ’ŒๆŽจ็† +- **Chutes** ๆ‹ฅๆœ‰ๆœ€ๅคš็š„ๅ…่ดนๆจกๅž‹้€‰ๆ‹ฉ โ€” 70+ ไธช๏ผŒๅŒ…ๆ‹ฌๆ‰€ๆœ‰ไธป่ฆๅผ€ๆบๆƒ้‡ๆจกๅž‹ +- **Llama 4 Scout** ๅœจ Chutes ไธŠๆไพ›ๆœ€ๅคง็š„ๅ…่ดนไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผˆ10M tokens๏ผ‰ +- ๅ…่ดนๅฑ‚้€šๅธธๆœ‰้€Ÿ็އ้™ๅˆถ๏ผˆๆฏๅˆ†้’Ÿ่ฏทๆฑ‚ๆ•ฐ๏ผ‰โ€” ่ฏทๆŸฅ็œ‹ๆไพ›ๅ•†ๆ–‡ๆกฃไบ†่งฃๅ…ทไฝ“้™ๅˆถ +- ็”Ÿไบง็Žฏๅขƒๅปบ่ฎฎๅ‡็บงๅˆฐไป˜่ดนๅฑ‚ไปฅ่Žทๅพ—ๅฏ้ ๆ€งๅ’Œๆ›ด้ซ˜็š„้€Ÿ็އ้™ๅˆถ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅผ€ๆบๆƒ้‡ๆจกๅž‹](open-weights.md) โ€” 527 ไธชๅฏ่‡ช่กŒ่ฟ่กŒ็š„ๆจกๅž‹ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ +- [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆ”ฏๆŒๆŽจ็†็š„ๆจกๅž‹ +- [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](openai-alternatives.md) โ€” ๅ…่ดน GPT-4 ๆ›ฟไปฃ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/glossary.md b/docs/zh/glossary.md new file mode 100644 index 00000000..c040f22d --- /dev/null +++ b/docs/zh/glossary.md @@ -0,0 +1,79 @@ +# ๆœฏ่ฏญ่กจ + +[English](../glossary.md) + +AI Models Catalog ไธญไฝฟ็”จ็š„ๆœฏ่ฏญๅฟซ้€Ÿๅ‚่€ƒใ€‚ + +## ๆจกๅž‹ๅฑžๆ€ง + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| ------------------------ | 
--------------------------------------------------------------------------------------------------- | +| **ๆจกๅž‹ ID** | ๆจกๅž‹็š„็จณๅฎšๅ”ฏไธ€ๆ ‡่ฏ†็ฌฆ๏ผˆๅฆ‚ `gpt-4.1`ใ€`claude-sonnet-4`๏ผ‰ใ€‚ๆ— ๆ—ฅๆœŸๅŽ็ผ€๏ผŒๆ— ๅˆซๅใ€‚ | +| **็ณปๅˆ—๏ผˆFamily๏ผ‰** | ๅ…ฑไบซ็›ธๅŒๆžถๆž„ๆˆ–ๅ“็‰Œ็š„็›ธๅ…ณๆจกๅž‹็ป„๏ผˆๅฆ‚ `gpt-4.1` ็ณปๅˆ—ๅŒ…ๆ‹ฌ `gpt-4.1`ใ€`gpt-4.1-mini`ใ€`gpt-4.1-nano`๏ผ‰ใ€‚ | +| **ๅฟซ็…ง๏ผˆSnapshot๏ผ‰** | ๆจกๅž‹็š„ๆ—ฅๆœŸ็‰ˆๆœฌ๏ผŒๅตŒๅฅ—ๅœจ็ˆถๆจกๅž‹ๆ–‡ไปถไธญใ€‚็ปงๆ‰ฟๆ‰€ๆœ‰็ˆถๅญ—ๆฎต๏ผŒๅช่ฆ†็›–ไธๅŒ็š„้ƒจๅˆ†ใ€‚ | +| **ๅทฒๅผƒ็”จ๏ผˆDeprecated๏ผ‰** | ๆไพ›ๅ•† API ไธญไปๅˆ—ๅ‡บไฝ†ไธๆŽจ่็”จไบŽๆ–ฐ้กน็›ฎ็š„ๆจกๅž‹ใ€‚ๆ ‡่ฎฐไธบ `deprecated: true`ใ€‚ | +| **ๅทฒ้€€ๅฝน๏ผˆRetired๏ผ‰** | ๅฎŒๅ…จไปŽๆไพ›ๅ•† API ไธญ็งป้™ค็š„ๆจกๅž‹ใ€‚ไธๅœจ็›ฎๅฝ•ไธญๆ”ถๅฝ•ใ€‚ | + +## ่ƒฝๅŠ› + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| ----------------------------------- | -------------------------------------------------------------------------------------------------- | +| **ๅทฅๅ…ท่ฐƒ็”จ๏ผˆTool calling๏ผ‰** | ๆจกๅž‹ๅœจ็”Ÿๆˆ่ฟ‡็จ‹ไธญๅฏไปฅ่ฐƒ็”จๅค–้ƒจๅทฅๅ…ท/ๅ‡ฝๆ•ฐ๏ผˆๅฆ‚็ฝ‘้กตๆœ็ดขใ€่ฎก็ฎ—ๅ™จใ€API ่ฐƒ็”จ๏ผ‰ใ€‚ไนŸ็งฐ"ๅ‡ฝๆ•ฐ่ฐƒ็”จ"ใ€‚ | +| **็ป“ๆž„ๅŒ–่พ“ๅ‡บ๏ผˆStructured output๏ผ‰** | ๆจกๅž‹ๅฏไปฅๆŒ‰ๆŒ‡ๅฎšๆ ผๅผ๏ผˆ้€šๅธธไธบ JSON๏ผ‰็”Ÿๆˆๅ“ๅบ”๏ผŒ็ฌฆๅˆๆไพ›็š„ schemaใ€‚ไนŸ็งฐ"JSON ๆจกๅผ"ใ€‚ | +| **ๆŽจ็†๏ผˆReasoning๏ผ‰** | ๆจกๅž‹ไฝฟ็”จ้“พๅผๆ€็ปดๆˆ–ๆ‰ฉๅฑ•ๆ€่€ƒ้€ๆญฅ่งฃๅ†ณๅคๆ‚้—ฎ้ข˜๏ผŒ็„ถๅŽ็”Ÿๆˆๆœ€็ปˆ็ญ”ๆกˆใ€‚ | +| **ๅผ€ๆบๆƒ้‡๏ผˆOpen weights๏ผ‰** | ๆจกๅž‹ๆƒ้‡ๅ…ฌๅผ€ๅฏ็”จ๏ผŒๅ…่ฎธๅœจ่‡ชๅทฑ็š„ๅŸบ็ก€่ฎพๆ–ฝไธŠ่ฟ่กŒใ€‚ๅนถ้žๆ‰€ๆœ‰ๅผ€ๆบๆƒ้‡ๆจกๅž‹้ƒฝๆ˜ฏ็œŸๆญฃ็š„"ๅผ€ๆบ"โ€”โ€”่ฏทๆฃ€ๆŸฅ่ฎธๅฏ่ฏใ€‚ | + +## ๆจกๆ€ + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| -------------------- | ------------------------------------------------------------------ | +| **ๆ–‡ๆœฌ่พ“ๅ…ฅ** | ๆจกๅž‹ๆŽฅๅ—ๆ–‡ๆœฌๆ็คบไฝœไธบ่พ“ๅ…ฅใ€‚ | +| **ๆ–‡ๆœฌ่พ“ๅ‡บ** | ๆจกๅž‹็”Ÿๆˆๆ–‡ๆœฌไฝœไธบ่พ“ๅ‡บใ€‚ | +| **ๅ›พๅƒ่พ“ๅ…ฅ๏ผˆ่ง†่ง‰๏ผ‰** | ๆจกๅž‹ๅฏไปฅๅฐ†ๅ›พๅƒไฝœไธบ่พ“ๅ…ฅ็š„ไธ€้ƒจๅˆ†่ฟ›่กŒๅค„็†ใ€‚ไนŸ็งฐ"่ง†่ง‰"ๆˆ–"ๅคšๆจกๆ€่พ“ๅ…ฅ"ใ€‚ | +| **ๅ›พๅƒ่พ“ๅ‡บ** | 
ๆจกๅž‹ๅฏไปฅ็”Ÿๆˆๅ›พๅƒ๏ผˆๅฆ‚ DALLยทEใ€Imagen๏ผ‰ใ€‚ไนŸ็งฐ"ๅ›พๅƒ็”Ÿๆˆ"ใ€‚ | +| **้Ÿณ้ข‘่พ“ๅ…ฅ** | ๆจกๅž‹ๅฏไปฅๅฐ†้Ÿณ้ข‘ๆ–‡ไปถๆˆ–่ฏญ้Ÿณไฝœไธบ่พ“ๅ…ฅ่ฟ›่กŒๅค„็†ใ€‚ | +| **้Ÿณ้ข‘่พ“ๅ‡บ** | ๆจกๅž‹ๅฏไปฅ็”Ÿๆˆ้Ÿณ้ข‘ๆˆ–่ฏญ้Ÿณไฝœไธบ่พ“ๅ‡บ๏ผˆๅฆ‚ TTS ๆจกๅž‹๏ผ‰ใ€‚ | +| **่ง†้ข‘่พ“ๅ…ฅ** | ๆจกๅž‹ๅฏไปฅๅฐ†่ง†้ข‘ๆ–‡ไปถไฝœไธบ่พ“ๅ…ฅ่ฟ›่กŒๅค„็†ใ€‚ | +| **่ง†้ข‘่พ“ๅ‡บ** | ๆจกๅž‹ๅฏไปฅ็”Ÿๆˆ่ง†้ข‘ไฝœไธบ่พ“ๅ‡บใ€‚ | +| **ๅตŒๅ…ฅ่พ“ๅ‡บ** | ๆจกๅž‹็”Ÿๆˆๅ‘้‡ๅตŒๅ…ฅ่€Œ้žๆ–‡ๆœฌ๏ผŒ็”จไบŽ็›ธไผผๆ€งๆœ็ดขๅ’Œๆฃ€็ดขใ€‚ | + +## ๅฎšไปท + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| ---------------- | --------------------------------------------------------------- | +| **่พ“ๅ…ฅไปทๆ ผ** | ๆฏ็™พไธ‡่พ“ๅ…ฅ token ็š„ๆˆๆœฌ๏ผŒไปฅ USD ่ฎก๏ผˆ้ƒจๅˆ†ๆไพ›ๅ•†ไปฅ CNY/EUR ่ฎก๏ผ‰ใ€‚ | +| **่พ“ๅ‡บไปทๆ ผ** | ๆฏ็™พไธ‡่พ“ๅ‡บ token ็š„ๆˆๆœฌ๏ผŒไปฅ USD ่ฎก๏ผˆ้ƒจๅˆ†ๆไพ›ๅ•†ไปฅ CNY/EUR ่ฎก๏ผ‰ใ€‚ | +| **็ผ“ๅญ˜่ฏปๅ–ไปทๆ ผ** | ไปŽๅ…ˆๅ‰็ผ“ๅญ˜็š„ๆ็คบ่ฏปๅ–็š„ๆŠ˜ๆ‰ฃไปทๆ ผใ€‚้€šๅธธๆฏ”ๅธธ่ง„่พ“ๅ…ฅไพฟๅฎœ 50-90%ใ€‚ | +| **็ผ“ๅญ˜ๅ†™ๅ…ฅไปทๆ ผ** | ๅฐ†ๆ็คบๅ†™ๅ…ฅๆไพ›ๅ•†็ผ“ๅญ˜็š„ไปทๆ ผใ€‚้ƒจๅˆ†ๆไพ›ๅ•†ๅ•็‹ฌๆ”ถๅ–ๆญค่ดน็”จใ€‚ | +| **ๅ…่ดน** | ๆจกๅž‹็š„่พ“ๅ…ฅๅ’Œ่พ“ๅ‡บ token ๆˆๆœฌไธบ้›ถใ€‚ๅฏ่ƒฝๆœ‰้€Ÿ็އ้™ๅˆถใ€‚ | +| **Token** | ๆ–‡ๆœฌๅค„็†็š„ๅ•ไฝใ€‚ๅœจ่‹ฑ่ฏญไธญ็บฆ็ญ‰ไบŽ 4 ไธชๅญ—็ฌฆๆˆ– 0.75 ไธช่ฏใ€‚ | + +## ไธŠไธ‹ๆ–‡ไธŽ้™ๅˆถ + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| -------------- | ---------------------------------------------------------------------------------- | +| **ไธŠไธ‹ๆ–‡็ช—ๅฃ** | ๆจกๅž‹ๅœจๅ•ไธช่ฏทๆฑ‚ไธญๅฏๅค„็†็š„ๆœ€ๅคง token ๆ•ฐ๏ผˆ้ƒจๅˆ†ๆไพ›ๅ•†ไธบ่พ“ๅ…ฅ+่พ“ๅ‡บๅˆ่ฎก๏ผŒ้ƒจๅˆ†ไป…่พ“ๅ…ฅ๏ผ‰ใ€‚ | +| **่พ“ๅ‡บ้™ๅˆถ** | ๆจกๅž‹ๅœจๅ•ไธชๅ“ๅบ”ไธญๅฏ็”Ÿๆˆ็š„ๆœ€ๅคง token ๆ•ฐใ€‚ | +| **้€Ÿ็އ้™ๅˆถ** | ๆไพ›ๅ•†่ฎพ็ฝฎ็š„ๆฏๅˆ†้’Ÿ/ๅฐๆ—ถๆœ€ๅคง่ฏทๆฑ‚ๆ•ฐๆˆ– token ๆ•ฐใ€‚ไธๅœจ็›ฎๅฝ•ไธญๆ”ถๅฝ•๏ผˆ่ฏทๆŸฅ็œ‹ๆไพ›ๅ•†ๆ–‡ๆกฃ๏ผ‰ใ€‚ | + +## ๆ•ฐๆฎไธŽๆžถๆž„ + +| ๆœฏ่ฏญ | ๅฎšไน‰ | +| --------------- | --------------------------------------------------------------------------------------- | +| **YAML** | ๆ‰€ๆœ‰ๆจกๅž‹ๆ•ฐๆฎ็š„ๆบๆ 
ผๅผใ€‚ไบบ็ฑปๅฏ่ฏป๏ผŒๆ”ฏๆŒๆณจ้‡Š๏ผŒๅ…่ฎธๅฟซ็…ง็ปงๆ‰ฟใ€‚ | +| **ๅฟซ็…ง็ปงๆ‰ฟ** | ๅœจๆจกๅž‹ๆ–‡ไปถๅ†…๏ผŒๅฟซ็…ง็ปงๆ‰ฟ็ˆถๆจกๅž‹็š„ๆ‰€ๆœ‰ๅญ—ๆฎต๏ผŒๅช่ฆ†็›–ไธๅŒ็š„้ƒจๅˆ†ใ€‚ๆ— ่ทจๆจกๅž‹็ปงๆ‰ฟใ€‚ | +| **ไธ€ๆ‰‹ๆ•ฐๆฎ** | ็›ดๆŽฅๆฅ่‡ชๆไพ›ๅ•†่‡ช่บซ API ๆˆ–ๅฎ˜ๆ–นๆ–‡ๆกฃ็š„ๆ•ฐๆฎ๏ผŒ่€Œ้ž็ฌฌไธ‰ๆ–น่šๅˆๅ™จใ€‚ | +| **Zod schema** | ่ฟ่กŒๆ—ถๆ ก้ชŒ schema๏ผŒ็กฎไฟๆ‰€ๆœ‰ YAML ๆจกๅž‹ๆ–‡ไปถ็ฌฆๅˆ้ข„ๆœŸ็ป“ๆž„ใ€‚ | +| **models.json** | ไปŽ YAML ๆบๆ–‡ไปถ็ผ–่ฏ‘็š„ JSON ่พ“ๅ‡บ๏ผŒๅŒ…ๅซๆ‰€ๆœ‰ๆจกๅž‹ใ€‚ๅฏ้€š่ฟ‡ npmใ€CDN ๅ’Œ GitHub Releases ่Žทๅ–ใ€‚ | + +--- + +่ฏฆ่ง[ๆ•ฐๆฎ Schema ๅ‚่€ƒ](data-schema.md)่Žทๅ–ๅฎŒๆ•ด็š„ YAML ๅญ—ๆฎต่ง„่Œƒใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅธธ่ง้—ฎ้ข˜](faq.md) โ€” ๅธธ่ง้—ฎ้ข˜ +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผๅ‚่€ƒ +- [ๅฟซ้€Ÿๅ…ฅ้—จ](quick-start.md) โ€” 30 ็ง’ๅ†…ๆ‰พๅˆฐ้€‚ๅˆ็š„ๆจกๅž‹ +- [ๆจกๅž‹ๅฏนๆฏ”](model-comparison.md) โ€” ๆจกๅž‹ๅฏนๆฏ” +- [ๆจกๆ€็Ÿฉ้˜ต](modality-matrix.md) โ€” ๆ‰€ๆœ‰ๆจกๆ€ไธ€่งˆ diff --git a/docs/zh/image-generation.md b/docs/zh/image-generation.md new file mode 100644 index 00000000..23d9374d --- /dev/null +++ b/docs/zh/image-generation.md @@ -0,0 +1,70 @@ +[English](../image-generation.md) | **ไธญๆ–‡** + +# AI ๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ + +ๆœฌ็›ฎๅฝ•ไธญๆœ‰ 28 ไธชๆจกๅž‹ๅฏไปฅ็”Ÿๆˆๅ›พๅƒ๏ผˆๅ›พๅƒ่พ“ๅ‡บๆจกๆ€๏ผ‰ใ€‚ๆœฌ้กตๆถต็›–ๆ–‡ๆœฌ็”Ÿๆˆๅ›พๅƒใ€ๅ›พๅƒ็ผ–่พ‘ๅ’Œๅคšๆจกๆ€็”Ÿๆˆๆจกๅž‹ใ€‚ + +> ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๆ–‡ๆกฃใ€‚"ๅ›พๅƒ่พ“ๅ‡บ"่กจ็คบๆจกๅž‹ๅœจๅ›žๅคไธญ็”Ÿๆˆๅ›พๅƒใ€‚ + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ่ƒฝๅŠ› | ๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ๆ•ฐ | +| -------------- | -------------: | +| ๆ€ปๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ | 28 | +| ๅ”ฏไธ€ๆจกๅž‹ ID | 19 | +| ๆ”ฏๆŒๆŽจ็† | 5 | +| ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ | 1 | +| ๅ…่ดนไฝฟ็”จ | 9 | + +## ๆ‰€ๆœ‰ๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ + +| ๆจกๅž‹ | ่พ“ๅ…ฅ | ่พ“ๅ‡บ $/1M | ไธŠไธ‹ๆ–‡ | ๆŽจ็† | ๅ…่ดน | +| ------------------------------ | ------------------------- | --------: | ------ | ---- | ---- | +| DALLยทE 3 | text | โ€” | โ€” | โŒ | โœ… | +| Imagen 4.0 Fast | text, image | โ€” | โ€” | โŒ | โœ… | +| Imagen 4.0 | text, 
image | โ€” | โ€” | โŒ | โœ… | +| Image 01 | text, image | โ€” | โ€” | โŒ | โœ… | +| Image 01 Live | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 1X Edit | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 1X Medium | text, image | โ€” | โ€” | โŒ | โœ… | +| Step 2X Large | text, image | โ€” | โ€” | โŒ | โœ… | +| Step Image Edit 2 | text, image | โ€” | โ€” | โŒ | โœ… | +| Gemini 2.5 Flash Image | text, image | $0.039 | 33K | โŒ | โŒ | +| Gemini 3.1 Flash Image Preview | text, image | $1.50 | 66K | โœ… | โŒ | +| Gemini 3 Pro Image Preview | text, image | $12.00 | 131K | โœ… | โŒ | +| GPT-5 Image Mini | text, image, PDF | $2.00 | 400K | โœ… | โŒ | +| GPT-5 Image | text, image, PDF | $10.00 | 400K | โœ… | โŒ | +| GPT-5.4 Image 2 | text, image, PDF | $15.00 | 272K | โœ… | โŒ | +| Amazon Nova 2.0 Omni | text, image, audio, video | $1.30 | 64K | โœ… | โŒ | + +## ๆœ€ไฝณๆ€งไปทๆฏ”ๅ›พๅƒ็”Ÿๆˆ + +| ็”จ้€” | ๆœ€ไฝณๆจกๅž‹ | ๅŽŸๅ›  | +| ---------------------------- | ----------------------------------- | -------------------------------- | +| **ๅ…่ดนๆ–‡ๆœฌ็”Ÿๆˆๅ›พๅƒ** | DALLยทE 3, Imagen 4.0 | ้›ถๆˆๆœฌ๏ผŒ้ซ˜่ดจ้‡ | +| **ๅ…่ดนๅ›พๅƒ็ผ–่พ‘** | Step 1X Edit, Step Image Edit 2 | ๅ…่ดน็ผ–่พ‘็Žฐๆœ‰ๅ›พๅƒ | +| **ๆœ€ไพฟๅฎœ API** | Gemini 2.5 Flash Image | $0.039/1M ่พ“ๅ‡บ tokens | +| **ๆœ€ไฝณ่ดจ้‡** | GPT-5.4 Image 2, Gemini 3 Pro Image | ๆœ€ๅ…ˆ่ฟ›็š„็”Ÿๆˆ่ƒฝๅŠ› | +| **ๅคšๆจกๆ€๏ผˆ้Ÿณ้ข‘+่ง†้ข‘+ๅ›พๅƒ๏ผ‰** | Amazon Nova 2.0 Omni | ๅ”ฏไธ€ๆ”ฏๆŒๆ‰€ๆœ‰ๆจกๆ€็š„ๆจกๅž‹ | +| **ๅคงไธŠไธ‹ๆ–‡** | GPT-5 Image Mini | 400K ไธŠไธ‹ๆ–‡้€‚ๅˆๅคๆ‚ๆ็คบ | +| **ๆŽจ็† + ็”Ÿๆˆ** | GPT-5 Image Mini | $2.50/1M ่พ“ๅ…ฅ๏ผŒ400K ไธŠไธ‹ๆ–‡๏ผŒๆŽจ็† | + +## ่ฆ็‚นๆ€ป็ป“ + +- **9 ไธชๅ…่ดนๅ›พๅƒ็”Ÿๆˆๆจกๅž‹** โ€” DALLยทE 3ใ€Imagen 4.0ใ€Step ็ณปๅˆ—็ญ‰ +- **Gemini 2.5 Flash Image** ๆ˜ฏๆœ€ไพฟๅฎœ็š„ API ้€‰้กน๏ผŒไป… $0.039/1M ่พ“ๅ‡บ tokens +- **GPT-5 Image Mini** ๆไพ›ๆŽจ็† + ็”Ÿๆˆ + ๅคงไธŠไธ‹ๆ–‡็š„ๆœ€ไฝณ็ป„ๅˆ +- **Amazon Nova 2.0 Omni** 
ๆ˜ฏๅ”ฏไธ€ๅฏไปฅไปŽ้Ÿณ้ข‘ๅ’Œ่ง†้ข‘่พ“ๅ…ฅ็”Ÿๆˆๅ›พๅƒ็š„ๆจกๅž‹ +- ๅคงๅคšๆ•ฐๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ๅŒๆ—ถๆŽฅๅ—ๆ–‡ๆœฌๅ’Œๅ›พๅƒ่พ“ๅ…ฅ๏ผˆ็”จไบŽ็ผ–่พ‘/ๅ‚่€ƒ๏ผ‰ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 ไธช่ง†่ง‰ๆจกๅž‹ +- [่ง†้ข‘ๆจกๅž‹](video-models.md) โ€” 167 ไธช่ง†้ข‘่พ“ๅ…ฅ/่พ“ๅ‡บๆจกๅž‹ +- [ๆจกๆ€็Ÿฉ้˜ต](modality-matrix.md) โ€” ๆ‰€ๆœ‰ๆจกๆ€ไธ€่งˆ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/large-context-models.md b/docs/zh/large-context-models.md new file mode 100644 index 00000000..5267e125 --- /dev/null +++ b/docs/zh/large-context-models.md @@ -0,0 +1,112 @@ +# ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ + +[English](../large-context-models.md) + +ๅ…ทๆœ‰ **128K+ token ไธŠไธ‹ๆ–‡็ช—ๅฃ**็š„ AI ๆจกๅž‹ โ€” ๅœจๅ•ไธช่ฏทๆฑ‚ไธญๅค„็†ๆ•ดไธชไปฃ็ ๅบ“ใ€้•ฟๆ–‡ๆกฃๅ’Œๅคšๅฐๆ—ถๅฏน่ฏใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆๅคงไธŠไธ‹ๆ–‡ๅพˆ้‡่ฆ + +ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ่งฃ้”ไบ†ๅฐๆจกๅž‹ๆ— ๆณ•ๅฎž็Žฐ็š„่ƒฝๅŠ›๏ผš + +- **ๅฎŒๆ•ดไปฃ็ ๅบ“ๅˆ†ๆž** โ€” ๅœจไธ€ไธชๆ็คบไธญ็†่งฃๆ•ดไธชไป“ๅบ“ +- **ๆ–‡ๆกฃๅค„็†** โ€” ๆ— ้œ€ๅˆ†ๅ—ๅณๅฏๅˆ†ๆž 100+ ้กต PDF +- **ๅคš่ฝฎๅฏน่ฏ** โ€” ๅœจ้•ฟ่Šๅคฉไผš่ฏไธญไฟๆŒไธŠไธ‹ๆ–‡ +- **ๆ•ฐๆฎๅˆ†ๆž** โ€” ๅœจๅ•ไธช่ฏทๆฑ‚ไธญๅค„็†ๅคงๅž‹ๆ•ฐๆฎ้›† +- **ๆณ•ๅพ‹/ๅŒป็–—ๅฎกๆŸฅ** โ€” ๅฎกๆŸฅๅ†—้•ฟ็š„ๅˆๅŒๅ’ŒๅŒป็–—่ฎฐๅฝ• +- **ๅ†…ๅฎนๅˆ›ไฝœ** โ€” ๅœจ้•ฟ็ฏ‡ๅ†™ไฝœไธญไฟๆŒไธ€่‡ดๆ€ง + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| -------------------- | ---- | +| ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ (128K+) | 2195 | +| 256K+ ไธŠไธ‹ๆ–‡ | 861 | +| 1M+ ไธŠไธ‹ๆ–‡ | 397 | +| ๆไพ›ๅ•† | 78 | +| ๅ…่ดนๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ | 51 | +| ๅธฆๅทฅๅ…ท่ฐƒ็”จ | 1637 | + +## ๆไพ›ๅ•† + 
+`302ai`ใ€`ai21`ใ€`aimlapi`ใ€`aion`ใ€`alibaba`ใ€`amazon`ใ€`amazon-bedrock`ใ€`anthropic`ใ€`arcee`ใ€`auriko`ใ€`baichuan`ใ€`baidu`ใ€`baseten`ใ€`bytedance`ใ€`cerebras`ใ€`chutes`ใ€`clarifai`ใ€`cloudferro-sherlock`ใ€`cloudflare`ใ€`databricks`ใ€`deepinfra`ใ€`deepseek`ใ€`digitalocean`ใ€`dinference`ใ€`evroc` ็ญ‰ 53 ไธช + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ + +ๅฏ็”จไธŠไธ‹ๆ–‡็ช—ๅฃๆœ€ๅคง็š„ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ------------------------------ | ---------- | ------ | -------- | -------- | -------- | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | ๐Ÿ”ง | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | ๐Ÿ”ง ๐Ÿ“‹ | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ”ง | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | ๐Ÿ”ง | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | ๐Ÿ”ง | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | ๐Ÿ”ง | +| x-ai--grok-4.1-fast | fastrouter | 2M | $0.2 | $0.5 | ๐Ÿ”ง | +| xai--grok-4-fast-reasoning | aimlapi | 2M | $0.52 | $1.3 | ๐Ÿ”ง | +| xai--grok-4-fast-non-reasoning | aimlapi | 2M | $0.52 | $1.3 | ๐Ÿ”ง | +| grok-4-20-multi-agent | venice | 2M | $1.42 | $2.83 | ๐Ÿง  ๐Ÿ“‹ | +| grok-4-20 | venice | 2M | $1.42 | $2.83 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | + +## ๆœ€ไพฟๅฎœ็š„ 1M+ ไธŠไธ‹ๆ–‡ๆจกๅž‹ + +1M+ token ไธŠไธ‹ๆ–‡็š„ๆœ€ไฝณๆ€งไปทๆฏ”ๆจกๅž‹ โ€” ๅค„็†่ถ…้•ฟ่พ“ๅ…ฅใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| --------------------------------- | ------------- | ------ | -------- | -------- | -------- | +| gemini-1.5-flash-8b | deepinfra | 1M | $0.0375 | $0.15 | | +| gpt-5-nano | meganova | 1M | $0.04 | $0.32 | ๐Ÿ”ง | +| qwen--qwen3.5-flash-02-23 | openrouter | 1M | $0.065 | 
$0.26 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemini-2.0-flash-lite-001 | openrouter | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| google--gemini-2.0-flash-lite-001 | fastrouter | 1M | $0.075 | $0.3 | ๐Ÿ”ง | +| gemini-1.5-flash | deepinfra | 1M | $0.075 | $0.3 | | +| gemini-2.0-flash-lite | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-1.5-flash | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-1.5-flash-8b | google | 1M | $0.075 | $0.3 | ๐Ÿ”ง ๐Ÿ“‹ | +| gemini-2-0-flash-lite | google-vertex | 1M | $0.075 | $0.3 | ๐Ÿ”ง | + +## ๅ…่ดนๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹ + +128K+ ไธŠไธ‹ๆ–‡็š„ๅ…่ดนๆจกๅž‹ โ€” ้›ถๆˆๆœฌ้•ฟๆ–‡ๆกฃๅค„็†ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ---------------------------------------- | ---------- | ------ | -------- | -------- | -------- | +| openrouter--owl-alpha | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿ“‹ | +| deepseek--deepseek-v4-flash--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| google--lyria-3-clip-preview | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| google--lyria-3-pro-preview | openrouter | 1M | Free | Free | ๐Ÿ“‹ | +| qwen--qwen3-coder--free | openrouter | 1M | Free | Free | ๐Ÿ”ง | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| arcee-ai--trinity-large-thinking--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | + +## ไธŠไธ‹ๆ–‡็ช—ๅฃๅฑ‚็บง + +| ๅฑ‚็บง | ไธŠไธ‹ๆ–‡ | ็”จไพ‹ | ็คบไพ‹ๆจกๅž‹ | +| ---- | ------ | ------------------ | ------------------------- | +| ๆ ‡ๅ‡† | 128K | ้•ฟๆ–‡ๆกฃใ€ไปฃ็ ๆ–‡ไปถ | gpt-4.1, claude-sonnet-4 | +| ๆ‰ฉๅฑ• | 256K | ไปฃ็ ๅบ“ใ€ๅคšๆ–‡ไปถๅˆ†ๆž | claude-opus-4, o3 | +| ่ถ…ๅคง | 1M | ๅฎŒๆ•ดไป“ๅบ“ใ€ไนฆ็ฑ | gemini-2.5-flash, gpt-4.1 | +| ๅทจๅž‹ | 10M | ๆ•ดไธชๆ•ฐๆฎ้›†ใ€่ง†้ข‘ | 
llama-4-scout | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ไธŠไธ‹ๆ–‡็ช—ๅฃ](context-windows.md) โ€” ่ฏฆ็ป†็š„ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ” +- [่Šๅคฉๆจกๅž‹](chat-models.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„่Šๅคฉๆจกๅž‹ +- [ไปฃ็ ๆจกๅž‹](code-models.md) โ€” 189 ไธชไปฃ็ ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑป +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [่ฟ็งปๆŒ‡ๅ—](migration-guide.md) โ€” ๅˆ‡ๆขๆไพ›ๅ•† +- [ๆไพ›ๅ•†ๅฏนๆฏ”](provider-comparison.md) โ€” ๅ‰ 30 ไธชๆไพ›ๅ•† + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/lessons-learned.md b/docs/zh/lessons-learned.md index 16c05433..6d8ede7e 100644 --- a/docs/zh/lessons-learned.md +++ b/docs/zh/lessons-learned.md @@ -290,3 +290,15 @@ - **nano-gpt**๏ผšๅ…ฌๅผ€ API ่Žทๅ–ๆจกๅž‹ๅˆ—่กจ + JS ๅŒ…่Žทๅ–ๆŒ‰ token USD ๅฎšไปท๏ผˆ555 ไธชๆจกๅž‹๏ผ‰ใ€‚ ่ฟ™ไบ›ๅนณๅฐ่ขซ่ง†ไธบๆŽจ็†ๅนณๅฐ๏ผŒ่€Œ้ž่ขซๆ‹’็ปไธบโ€œๅชๆ˜ฏ่ทฏ็”ฑๅ™จโ€๏ผŒๅ› ไธบๅฎƒไปฌๆไพ›ๅฏ้ชŒ่ฏ็š„็ฌฌไธ€ๆ–นๆŒ‰ token ๅฎšไปทๆ•ฐๆฎใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆ•ฐๆฎ่Žทๅ–](data-acquisition.md) โ€” ๅฆ‚ไฝ•่Žทๅ–ๅ’Œๆ›ดๆ–ฐๆ•ฐๆฎ +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผๅ‚่€ƒ +- [ๆไพ›ๅ•†ๆฆ‚่งˆ](providers.md) โ€” 95 ไธชๆไพ›ๅ•† +- [ๅธธ่ง้—ฎ้ข˜](faq.md) โ€” ๅธธ่ง้—ฎ้ข˜ +- [่ดก็ŒฎๆŒ‡ๅ—](https://github.com/i-need-token/ai-models/blob/main/CONTRIBUTING.md) โ€” ๅฆ‚ไฝ•่ดก็Œฎ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/migration-guide.md b/docs/zh/migration-guide.md new file mode 100644 index 00000000..84d45516 --- /dev/null +++ b/docs/zh/migration-guide.md @@ -0,0 +1,100 @@ +# ่ฟ็งปๆŒ‡ๅ—๏ผšๅˆ‡ๆข AI ๆจกๅž‹ๆไพ›ๅ•† + +[English](../migration-guide.md) + +ๅˆ‡ๆข AI 
ๆจกๅž‹ๆไพ›ๅ•†็š„ๅฎž็”จๆŒ‡ๅ— โ€” ๆฏ”่พƒๅฎšไปทใ€่ƒฝๅŠ›ๅ’ŒไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผŒๆ‰พๅˆฐๆœ€้€‚ๅˆๆ‚จ็”จไพ‹็š„ๆ›ฟไปฃๆ–นๆกˆใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆ่ฆๅˆ‡ๆขๆไพ›ๅ•†๏ผŸ + +- **่Š‚็œๆˆๆœฌ** โ€” ๆŸไบ›ๆไพ›ๅ•†ไปฅไฝŽ 2-10 ๅ€็š„ไปทๆ ผๆไพ›็›ธๅŒๆจกๅž‹ +- **ๆ›ดๅฅฝ็š„่ƒฝๅŠ›** โ€” ๆ–ฐๆจกๅž‹ๅฏ่ƒฝๆไพ›ๅทฅๅ…ท่ฐƒ็”จใ€ๆŽจ็†ๆˆ–่ง†่ง‰่ƒฝๅŠ› +- **ๆ›ดๅคง็š„ไธŠไธ‹ๆ–‡** โ€” ๅœจๅ•ไธช่ฏทๆฑ‚ไธญๅค„็†ๆ›ดๅคšๆ•ฐๆฎ +- **ๅฏ้ ๆ€ง** โ€” ๅ‡ๅฐ‘ๅฏนๅ•ไธ€ๆไพ›ๅ•†็š„ไพ่ต– +- **ๅˆ่ง„ๆ€ง** โ€” ๆ•ฐๆฎ้ฉป็•™่ฆๆฑ‚ๅฏ่ƒฝ้œ€่ฆ็‰นๅฎšๆไพ›ๅ•† + +## ไธป่ฆๆไพ›ๅ•†ๅฏนๆฏ” + +| ๆไพ›ๅ•† | ๆจกๅž‹ๆ•ฐ | ๆœ€ไฝŽ่พ“ๅ…ฅ $/M | ๆœ€ๅคงไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| --------- | ------ | -----------: | ---------- | -------- | ---- | +| openai | 28 | $0.02 | 1047576 | 18 | 8 | +| anthropic | 11 | $1 | 1000000 | 11 | 11 | +| google | 21 | $0.075 | 2097152 | 8 | 2 | +| deepseek | 4 | $0.14 | 1000000 | 4 | 3 | +| meta | 12 | $0.1 | 10000000 | 9 | 0 | +| mistral | 16 | $0.04 | 256000 | 12 | 1 | +| xai | 6 | $0.2 | 131072 | 6 | 5 | +| alibaba | 62 | $0.15 | 1000000 | 62 | 52 | + +## ๅธธ่ง่ฟ็งป่ทฏๅพ„ + +### OpenAI โ†’ ๆ›ดไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ + +| OpenAI ๆจกๅž‹ | ๆœ€ไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/M | ่Š‚็œ | +| -------------------- | ---------------- | --------- | -------- | ---- | +| gpt-4.1 ($2) | gpt-4.1-mini | openai | $0.40 | 80% | +| gpt-4.1-mini ($0.40) | gpt-4.1-nano | openai | $0.10 | 75% | +| o4-mini ($1.10) | deepseek-r1 | deepseek | $0.55 | 50% | +| gpt-4.1 ($2) | claude-haiku-4 | anthropic | $1 | 50% | +| gpt-4.1 ($2) | gemini-2.5-flash | google | $0.15 | 93% | + +### Anthropic โ†’ ๆ›ดไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ + +| Anthropic ๆจกๅž‹ | ๆœ€ไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/M | ่Š‚็œ | +| -------------------- | ---------------- | -------- | -------- | ---- | +| claude-opus-4 ($15) | o4-mini | openai | $1.10 | 93% | +| claude-sonnet-4 ($3) | gemini-2.5-flash | google | $0.15 | 95% | +| 
claude-sonnet-4 ($3) | deepseek-chat | deepseek | $0.14 | 95% | +| claude-haiku-4 ($1) | gemini-2.5-flash | google | $0.15 | 85% | + +### Google โ†’ ๆ›ดไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ + +| Google ๆจกๅž‹ | ๆœ€ไพฟๅฎœ็š„ๆ›ฟไปฃๆ–นๆกˆ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/M | ่Š‚็œ | +| ---------------------- | ---------------- | -------- | -------- | ---- | +| gemini-2.5-pro ($1.25) | gemini-2.5-flash | google | $0.15 | 88% | +| gemini-2.5-pro ($1.25) | deepseek-chat | deepseek | $0.14 | 89% | + +## ่ฟ็งปๆฃ€ๆŸฅๆธ…ๅ• + +ๅˆ‡ๆขๆไพ›ๅ•†ๆ—ถ๏ผŒ่ฏท้ชŒ่ฏไปฅไธ‹ๅ…ผๅฎนๆ€ง่ฆ็‚น๏ผš + +- [ ] **API ๆ ผๅผ** โ€” OpenAI ๅ…ผๅฎน vs ไธ“ๆœ‰ API +- [ ] **ๆจกๅž‹ๅ็งฐ** โ€” ไธๅŒๆไพ›ๅ•†ไฝฟ็”จไธๅŒ็š„ๆจกๅž‹ ID +- [ ] **ๅทฅๅ…ท่ฐƒ็”จๆ ผๅผ** โ€” ๅ‡ฝๆ•ฐ่ฐƒ็”จ่ฏญๆณ•ไธๅŒ +- [ ] **ๆตๅผไผ ่พ“** โ€” SSE vs WebSocket vs HTTP ๆตๅผไผ ่พ“ +- [ ] **้€Ÿ็އ้™ๅˆถ** โ€” ๆฏๅˆ†้’Ÿ่ฏทๆฑ‚ๆ•ฐใ€ๆฏๅˆ†้’Ÿ token ๆ•ฐ +- [ ] **ไธŠไธ‹ๆ–‡็ช—ๅฃ** โ€” ๅฏ่ƒฝไธŽๅŽŸๆไพ›ๅ•†ไธๅŒ +- [ ] **ๆจกๆ€** โ€” ่ง†่ง‰ใ€้Ÿณ้ข‘ใ€่ง†้ข‘ๆ”ฏๆŒไธๅŒ +- [ ] **็ป“ๆž„ๅŒ–่พ“ๅ‡บ** โ€” JSON ๆจกๅผๅฏ็”จๆ€ง +- [ ] **ๆ็คบ็ผ“ๅญ˜** โ€” ๅฏ้™ไฝŽ 50-90% ๆˆๆœฌ +- [ ] **ๆ•ฐๆฎ้ฉป็•™** โ€” ๆ•ฐๆฎๅœจๅ“ช้‡Œๅค„็†ๅ’Œๅญ˜ๅ‚จ + +## OpenAI ๅ…ผๅฎนๆไพ›ๅ•† + +่ฟ™ไบ›ๆไพ›ๅ•†ๆไพ› OpenAI ๅ…ผๅฎน API โ€” ๅช้œ€ๆœ€ๅฐ‘็š„ไปฃ็ ๆ›ดๆ”น๏ผš + +| ๆไพ›ๅ•† | Base URL | ๅค‡ๆณจ | +| ----------- | ------------------------------- | ----------------- | +| openrouter | `openrouter.ai/api/v1` | ่šๅˆๅ™จ๏ผŒ356+ ๆจกๅž‹ | +| deepinfra | `api.deepinfra.com/v1` | ไธ“ๆณจๅผ€ๆบๆจกๅž‹ | +| togetherai | `api.together.xyz/v1` | ๅผ€ๆบๆจกๅž‹ๆ‰˜็ฎก | +| groq | `api.groq.com/openai/v1` | ่ถ…ๅฟซๆŽจ็† | +| cerebras | `api.cerebras.ai/v1` | ๆœ€ๅฟซๆŽจ็†้€Ÿๅบฆ | +| fireworks | `api.fireworks.ai/inference/v1` | ๆ— ๆœๅŠกๅ™จๆจกๅž‹ๆ‰˜็ฎก | +| siliconflow | `api.siliconflow.cn/v1` | ไธญๅ›ฝๅธ‚ๅœบๆไพ›ๅ•† | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ่ทจๆไพ›ๅ•†ๅฎšไปทๅฏนๆฏ” +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅ…่ดน AI 
模型](free-models.md) — 81 个免费模型按能力分类 +- [缓存定价](cached-pricing.md) — 1,374 个支持提示缓存的模型 +- [聊天模型](chat-models.md) — 2,350 个支持工具调用的聊天模型 +- [智能体模型](agentic-models.md) — 1,080 个具备工具调用 + 推理能力的模型 +- [API 参考](api.md) — 编程访问模型数据 +- [OpenAI 替代方案](openai-alternatives.md) — GPT-4/GPT-3.5 定价替代 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML,包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/modality-matrix.md b/docs/zh/modality-matrix.md new file mode 100644 index 00000000..5cfc4d31 --- /dev/null +++ b/docs/zh/modality-matrix.md @@ -0,0 +1,106 @@ +[English](../modality-matrix.md) | **中文** + +# 模态矩阵 + +哪些模型支持视觉、音频、图像生成和视频?本页列出各模态的顶级模型。 + +> 完整列表请浏览 `providers/` 目录或下载 [models.json](https://github.com/i-need-token/ai-models/releases/latest)。 + +## 视觉(图像输入) + +1,487 个模型接受图像输入。以下是最强大的旗舰模型: + +| 模型 | 提供商 | 上下文 | 输入 $/1M | 输出 $/1M | +| ---------------- | --------- | ------ | --------: | --------: | +| GPT-4.1 | OpenAI | 1M | $2.00 | $8.00 | +| Claude Opus 4 | Anthropic | 200K | $15.00 | $75.00 | +| Gemini 2.5 Pro | Google | 1M | $1.25 | $10.00 | +| Qwen3-235B-A22B | 阿里云 | 128K | ¥1.00 | ¥4.00 | +| DeepSeek-V3 | DeepSeek | 128K | $0.27 | $1.10 | +| Llama 4 Maverick | Meta | 1M | — | — | +| Mistral Large | Mistral | 128K | $2.00 | $6.00 | +| Grok 3 | xAI | 131K | $3.00 | $15.00 | + +**最便宜的视觉模型(USD):** + +| 模型 | 提供商 | 输入 $/1M | 输出 $/1M | +| ------------- | ----------- | --------: | --------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-30B-A3B | 阿里云 | ¥0.10 | 
¥0.30 | +| Llama 4 Scout | Together AI | $0.15 | $0.60 | +| Gemma 3 27B | Google | $0.20 | $0.80 | +| Phi-4 | Microsoft | $0.10 | $0.40 | + +## 图像输出(图像生成) + +28 个模型可以生成图像: + +| 模型 | 提供商 | 类型 | +| -------------------- | ----------------- | ------------ | +| GPT-Image-1 | OpenAI | 原生图像生成 | +| DALL-E 3 | OpenAI | 原生图像生成 | +| Gemini 2.0 Flash | Google | 多模态输出 | +| Flux Pro | Black Forest Labs | 图像生成 | +| Flux Dev | Black Forest Labs | 图像生成 | +| Ideogram 3 | Ideogram | 图像生成 | +| Stable Diffusion 3.5 | Stability AI | 图像生成 | +| Midjourney v7 | Midjourney | 图像生成 | + +## 音频输入(语音识别) + +118 个模型接受音频输入: + +| 模型 | 提供商 | 能力 | +| --------------- | --------- | --------------- | +| GPT-4o-audio | OpenAI | 音频理解 + 生成 | +| Gemini 2.5 Pro | Google | 音频理解 | +| Claude Sonnet 4 | Anthropic | 音频理解 | +| Qwen2-Audio | 阿里云 | 音频理解 | +| Whisper | OpenAI | 语音识别 | + +## 音频输出(语音生成) + +34 个模型可以生成音频: + +| 模型 | 提供商 | 类型 | +| -------------- | ------ | ---------- | +| GPT-4o-audio | OpenAI | 音频输出 | +| Gemini 2.5 Pro | Google | 音频输出 | +| Qwen2-Audio | 阿里云 | 音频输出 | +| TTS-1 | OpenAI | 文本转语音 | +| TTS-1-HD | OpenAI | 文本转语音 | + +## 视频输入 + +167 个模型接受视频输入: + +| 模型 | 提供商 | 上下文 | +| ---------------- | --------- | ----------- | +| Gemini 2.5 Pro | Google | 1M tokens | +| GPT-4.1 | OpenAI | 1M tokens | +| Claude Opus 4 | Anthropic | 200K tokens | +| Qwen3-235B-A22B | 阿里云 | 128K tokens | +| Llama 4 Maverick | Meta | 1M tokens | + +## 多模态模型(3+ 输入模态) + +接受文本 + 至少 2 种额外输入模态的模型: + +| 模型 | 提供商 | 输入模态 | +| -------------- | --------- | ---------------------- | +| 
GPT-4o-audio | OpenAI | ๆ–‡ๆœฌใ€ๅ›พๅƒใ€้Ÿณ้ข‘ | +| Gemini 2.5 Pro | Google | ๆ–‡ๆœฌใ€ๅ›พๅƒใ€้Ÿณ้ข‘ใ€่ง†้ข‘ | +| Claude Opus 4 | Anthropic | ๆ–‡ๆœฌใ€ๅ›พๅƒใ€้Ÿณ้ข‘ | +| Qwen2-Audio | ้˜ฟ้‡Œไบ‘ | ๆ–‡ๆœฌใ€ๅ›พๅƒใ€้Ÿณ้ข‘ | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 ไธช่ง†่ง‰ๆจกๅž‹ +- [้Ÿณ้ข‘ๆจกๅž‹](audio-models.md) โ€” 118 ไธช้Ÿณ้ข‘่พ“ๅ…ฅ + 34 ไธช้Ÿณ้ข‘่พ“ๅ‡บๆจกๅž‹ +- [่ง†้ข‘ๆจกๅž‹](video-models.md) โ€” 167 ไธช่ง†้ข‘่พ“ๅ…ฅ/่พ“ๅ‡บๆจกๅž‹ +- [ๅ›พๅƒ็”Ÿๆˆ](image-generation.md) โ€” 28 ไธชๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅ†ณ็ญ–ๆก†ๆžถ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/model-comparison.md b/docs/zh/model-comparison.md new file mode 100644 index 00000000..418aa9cf --- /dev/null +++ b/docs/zh/model-comparison.md @@ -0,0 +1,109 @@ +[English](../model-comparison.md) | **ไธญๆ–‡** + +# ๆจกๅž‹ๅฏนๆฏ” + +็ƒญ้—จ AI ๆจกๅž‹็ฑปๅˆซ็š„ๅฟซ้€Ÿๅ‚่€ƒๅฏนๆฏ”ใ€‚ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ช็ฌฌไธ€ๆ–นๆไพ›ๅ•† API ๅ’Œๆ–‡ๆกฃใ€‚ + +## ้กถ็บงๆ——่ˆฐๆจกๅž‹ + +ๅ„ไธป่ฆๆไพ›ๅ•†ๆœ€ๅผบๅคง็š„ๆจกๅž‹ใ€‚ๅฎšไปทไธบ็›ดๆŽฅๆไพ›ๅ•† API ไปทๆ ผใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ๆŽจ็† | ๅทฅๅ…ท่ฐƒ็”จ | ่ง†่ง‰ | +| ---------------- | --------- | -----: | ---------------: | ---------------: | :--: | :------: | :--: | +| o3 | OpenAI | 200K | 10.00 | 40.00 | โœ… | โœ… | โœ… | +| Claude Opus 4.7 | Anthropic | 1M | 5.00 | 25.00 | โœ… | โœ… | โœ… | +| Gemini 2.5 Pro | Google | 1M | 1.25 | 10.00 | โœ… | โœ… | โœ… | +| DeepSeek-V4-Pro | DeepSeek | 1M | 0.435 | 0.87 | โœ… | โœ… | โŒ | +| Grok 4 | xAI | 131K | 3.00 | 15.00 | โœ… | โœ… | โœ… | +| Llama 4 Maverick | Meta | 1M | 0.24 | 0.97 | โŒ | โœ… | โœ… | +| Qwen3-235B | ้˜ฟ้‡Œไบ‘ | โ€” | 2.00 | 8.00 | โœ… | โœ… | โŒ | +| Mistral Large | Mistral | 128K | 2.00 | 6.00 | โŒ | โœ… | โœ… | + 
+## ้ซ˜ๆ€งไปทๆฏ”ๆจกๅž‹ + +้€‚ๅˆ้ซ˜ๅžๅ้‡ๅทฅไฝœ่ดŸ่ฝฝ็š„ๆœ€ไฝณๆ€งไปทๆฏ”ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ๆŽจ็† | ๅทฅๅ…ท่ฐƒ็”จ | +| ----------------- | --------- | -----: | ---------------: | ---------------: | :--: | :------: | +| GPT-4.1 Nano | OpenAI | 1M | 0.10 | 0.40 | โŒ | โœ… | +| o4-mini | OpenAI | 200K | 1.10 | 4.40 | โœ… | โœ… | +| Claude Haiku 4.5 | Anthropic | 200K | 1.00 | 5.00 | โœ… | โœ… | +| Gemini 2.5 Flash | Google | 1M | 0.15 | 3.50 | โœ… | โœ… | +| DeepSeek-V4-Flash | DeepSeek | 1M | 0.14 | 0.28 | โœ… | โœ… | +| Llama 4 Scout | Meta | 10M | 0.17 | 0.66 | โŒ | โœ… | +| Qwen3-30B | ้˜ฟ้‡Œไบ‘ | โ€” | 0.75 | 3.00 | โœ… | โœ… | +| Mistral Small | Mistral | 128K | 0.20 | 0.60 | โŒ | โœ… | +| Grok 3 Mini | xAI | 131K | 0.25 | 1.27 | โœ… | โœ… | + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ + +้€‚ๅˆ้•ฟๆ–‡ๆกฃๅค„็†็š„ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ (tokens) | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | +| ----------------- | --------- | --------------: | ---------------: | ---------------: | +| Llama 4 Scout | Meta | 10,000,000 | 0.17 | 0.66 | +| Claude Opus 4.7 | Anthropic | 1,000,000 | 5.00 | 25.00 | +| Claude Sonnet 4.6 | Anthropic | 1,000,000 | 3.00 | 15.00 | +| GPT-4.1 | OpenAI | 1,048,576 | 2.00 | 8.00 | +| Gemini 2.5 Pro | Google | 1,048,576 | 1.25 | 10.00 | +| Gemini 2.5 Flash | Google | 1,048,576 | 0.15 | 3.50 | +| Llama 4 Maverick | Meta | 1,000,000 | 0.24 | 0.97 | +| DeepSeek-V4-Pro | DeepSeek | 1,000,000 | 0.435 | 0.87 | + +## ๅ…่ดนๆจกๅž‹ + +ๆ•ฐๆฎ้‡‡้›†ๆ—ถๅ…่ดนๅฏ็”จ็š„ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ๆŽจ็† | ๅทฅๅ…ท่ฐƒ็”จ | +| -------------------------- | -------- | -----: | :--: | :------: | +| DeepSeek-V4-Flash (ๅ…่ดนๅฑ‚) | DeepSeek | 1M | โœ… | โœ… | +| Gemini 2.5 Flash (ๅ…่ดนๅฑ‚) | Google | 1M | โœ… | โœ… | +| Llama 4 Scout (่‡ชๆ‰˜็ฎก) | Meta | 10M | โŒ | โœ… | +| Qwen3-30B (่‡ชๆ‰˜็ฎก) | ้˜ฟ้‡Œไบ‘ | โ€” | โœ… | โœ… | +| Mistral 
Small (่‡ชๆ‰˜็ฎก) | Mistral | 128K | โŒ | โœ… | + +> ๅ…่ดนๅฑ‚้€šๅธธๆœ‰้€Ÿ็އ้™ๅˆถใ€‚่‡ชๆ‰˜็ฎกๆจกๅž‹้œ€่ฆ่‡ชๅทฑ็š„ๅŸบ็ก€่ฎพๆ–ฝใ€‚ + +## ่ง†่ง‰ๆจกๅž‹ + +ๆ”ฏๆŒๅ›พๅƒ่พ“ๅ…ฅ็š„ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ๅ›พๅƒ่พ“ๅ…ฅ | ๅ›พๅƒ่พ“ๅ‡บ | ่ง†้ข‘่พ“ๅ…ฅ | +| ---------------- | --------- | :------: | :------: | :------: | +| o3 | OpenAI | โœ… | โŒ | โŒ | +| Claude Opus 4.7 | Anthropic | โœ… | โŒ | โŒ | +| Gemini 2.5 Pro | Google | โœ… | โŒ | โŒ | +| GPT-4.1 | OpenAI | โœ… | โŒ | โŒ | +| Llama 4 Maverick | Meta | โœ… | โŒ | โŒ | +| Grok 3 | xAI | โœ… | โŒ | โŒ | + +## ๅผ€ๆบๆƒ้‡ๆจกๅž‹ + +ๆƒ้‡ๅ…ฌๅผ€ๅฏ็”จ็š„่‡ชๆ‰˜็ฎกๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ๆŽจ็† | +| ----------------- | --------- | -----: | ---------------: | ---------------: | :--: | +| Llama 4 Maverick | Meta | 1M | 0.24 | 0.97 | โŒ | +| Llama 4 Scout | Meta | 10M | 0.17 | 0.66 | โŒ | +| Qwen3-235B | ้˜ฟ้‡Œไบ‘ | โ€” | 2.00 | 8.00 | โœ… | +| Qwen3-30B | ้˜ฟ้‡Œไบ‘ | โ€” | 0.75 | 3.00 | โœ… | +| Mistral Small 3.2 | Mistral | 128K | 0.20 | 0.60 | โŒ | +| Phi-4 | Microsoft | 16K | 0.125 | 0.50 | โŒ | + +> ๅฎšไปทไธบๆ‰˜็ฎกๆŽจ็†ไปทๆ ผใ€‚่‡ชๆ‰˜็ฎกๆจกๅž‹ๆ— ๆŒ‰ token ่ฎก่ดน๏ผŒไฝ†้œ€่ฆๅŸบ็ก€่ฎพๆ–ฝใ€‚ + +--- + +**ๆณจๆ„**๏ผšๆ‰€ๆœ‰ๅฎšไปทๅ’Œ่ƒฝๅŠ›ๆ•ฐๆฎๆฅ่‡ช็ฌฌไธ€ๆ–นๆฅๆบใ€‚ๆŽจ็†ๅนณๅฐไปทๆ ผๅฏ่ƒฝไธๅŒใ€‚ๆŸฅ็œ‹ `providers//models/` ่Žทๅ–ๆœ€ๆ–ฐๆ•ฐๆฎใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ๅ„ๆไพ›ๅ•†ๅฎšไปทๅนถๆŽ’ๅฏนๆฏ” +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ +- [ๅผ€ๆบๆƒ้‡ๆจกๅž‹](open-weights.md) โ€” 527 ไธชๅฏ่‡ช่กŒ่ฟ่กŒ็š„ๆจกๅž‹ +- [ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ”](context-windows.md) โ€” ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git 
a/docs/zh/model-selection-cheatsheet.md b/docs/zh/model-selection-cheatsheet.md new file mode 100644 index 00000000..407cf496 --- /dev/null +++ b/docs/zh/model-selection-cheatsheet.md @@ -0,0 +1,105 @@ +# AI 模型选择速查表 + +> 按使用场景快速选择 AI 模型的参考指南。数据来自 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 95 个提供商、4,587+ 模型。 + +## 🎯 决策树 + +``` +你需要什么? +├── 最便宜的工具调用模型 → ling-2.6-flash ($0.01/$0.03/M) +├── 最佳免费推理模型 → DeepSeek R1 (92% MATH-500) +├── 最大上下文窗口 → Gemini 2.5 Pro (1M tokens) +├── 最佳编程助手 → Claude Sonnet 4 / GPT-4.1 +├── 开源工具调用模型 → Qwen3 4B ($0.03/$0.15/M) +├── 免费视觉模型 → Gemma 4 27B IT +└── 最低生产成本 → bdc-coder ($0.01/$0.01/M) +``` + +## 💰 按预算选择 + +| 预算 | 最佳选择 | 输入/输出 $/M | 理由 | +| ------------- | --------------- | ------------- | ---------------------- | +| **免费** | DeepSeek R1 | $0/$0 | 免费模型中推理能力最强 | +| **免费** | Gemma 4 27B IT | $0/$0 | 免费视觉 + 工具调用 | +| **< $0.05/M** | ling-2.6-flash | $0.01/$0.03 | 最便宜的工具调用模型 | +| **< $0.10/M** | Qwen3 4B | $0.03/$0.15 | 开源推理 + 工具调用 | +| **< $0.50/M** | GPT-4.1-mini | $0.40/$1.60 | 最佳性价比前沿模型 | +| **< $2/M** | Claude Sonnet 4 | $3/$15 | 顶级编程 + 推理 | +| **< $5/M** | GPT-4.1 | $2/$8 | 1M 上下文 + 视觉 | +| **高端** | o3 | $10/$40 | 最佳推理基准分数 | + +## 🛠️ 按使用场景选择 + +### AI Agent + +需求:工具调用 + 推理 + 低延迟 + +- **最佳性价比**:ling-2.6-flash ($0.01/$0.03/M) — 最便宜的 TC 模型 +- **均衡之选**:GPT-4.1-mini ($0.40/$1.60/M) — 可靠 + 1M 上下文 +- **高端选择**:Claude Sonnet 4 ($3/$15/M) — 最佳 Agent 性能 + +### 代码生成 + 
+需求:工具调用 + 结构化输出 + 大上下文 + +- **最佳性价比**:bdc-coder ($0.01/$0.01/M) — 最便宜的编程模型 +- **均衡之选**:GPT-4.1-mini ($0.40/$1.60/M) — 代码质量优秀 +- **高端选择**:Claude Sonnet 4 ($3/$15/M) — SWE-bench SOTA + +### 对话 / RAG + +需求:大上下文 + 低成本 + 快速响应 + +- **最佳性价比**:Qwen3 4B ($0.03/$0.15/M) — 便宜 + 262K 上下文 +- **均衡之选**:GPT-4.1-nano ($0.10/$0.40/M) — 快速 + 便宜 +- **高端选择**:Gemini 2.5 Pro ($1.25/$10/M) — 1M 上下文 + 推理 + +### 视觉 / 多模态 + +需求:图像输入 + 文本输出 + 工具调用 + +- **免费**:Gemma 4 27B IT — 免费视觉 + TC +- **最佳性价比**:GPT-4.1-mini ($0.40/$1.60/M) — 视觉 + 1M 上下文 +- **高端选择**:Claude Sonnet 4 ($3/$15/M) — 最佳视觉理解 + +### 推理 / 数学 + +需求:推理能力 + 结构化输出 + +- **免费**:DeepSeek R1 — 92% MATH-500 +- **最佳性价比**:Qwen3.5 4B ($0.03/$0.15/M) — 便宜推理 +- **高端选择**:o3 ($10/$40/M) — GPQA、MATH-500 SOTA + +### 大规模生产 + +需求:最低 token 成本 + 可靠性 + +- **最便宜 TC**:ling-2.6-flash ($0.01/$0.03/M) +- **最便宜推理**:Qwen3.5 0.8B ($0.01/$0.05/M) +- **最便宜编程**:bdc-coder ($0.01/$0.01/M) + +## 📊 快速统计 + +| 指标 | 数量 | +| ------------ | ----- | +| 模型总数 | 4,587 | +| 提供商 | 95 | +| 免费模型 | 81 | +| 工具调用模型 | 2,350 | +| 推理模型 | 1,306 | +| 视觉模型 | 1,487 | +| 开源模型 | 527 | +| 结构化输出 | 829 | + +## 🔗 更多资源 + +- [交互式目录](https://i-need-token.github.io/ai-models/) — 搜索、筛选、对比所有模型 +- [免费模型指南](free-models.md) — 81 个免费模型 +- [工具调用指南](tool-calling.md) — 2,350 个工具调用模型 +- [定价对比](pricing-comparison.md) — 找到最便宜的模型 +- [上下文窗口](context-windows.md) — 
最大上下文窗口 +- [模型对比](model-comparison.md) — 面对面对比 + +--- + +_数据来自 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 仅使用一手数据,自动更新。_ diff --git a/docs/zh/model-selection.md b/docs/zh/model-selection.md new file mode 100644 index 00000000..7817d877 --- /dev/null +++ b/docs/zh/model-selection.md @@ -0,0 +1,128 @@ +# 模型选择指南 + +> 📋 **快速参考?** 查看[模型选择速查表](model-selection-cheatsheet.md),按预算选择最佳模型。 +> [English](../model-selection.md) + +如何根据使用场景选择合适的 AI 模型 — 基于成本、能力和上下文窗口的实用建议。 + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models)。 + +## 决策框架 + +``` +你需要什么? +├── 尽可能便宜 → 免费模型(81 个可用) +│ ├── 带工具调用 → 见下方"免费 + 工具调用" +│ ├── 带推理 → 见下方"免费 + 推理" +│ └── 最佳免费模型 → 见下方"最佳免费模型" +├── 最佳性价比(便宜 + 能力强)→ 见下方"最佳性价比模型" +├── 最大上下文 → 见下方"大上下文模型" +├── 特定能力 +│ ├── 工具调用 → [工具调用模型](tool-calling.md) +│ ├── 推理 → [推理模型](reasoning-models.md) +│ ├── 视觉 → [视觉模型](vision-models.md) +│ ├── 结构化输出 → [结构化输出](structured-output.md) +│ └── 提示缓存 → [缓存定价](cached-pricing.md) +└── 完整对比 → [模型对比](model-comparison.md) · [定价对比](pricing-comparison.md) +``` + +## 最佳免费模型 + +输入和输出定价均为 $0 的模型 — 非常适合原型开发和开发阶段。 + +| 模型 | 提供商 | 上下文 | 能力 | +| ---- | ------ | ------ | ---- | + +> 查看[免费 AI 模型](free-models.md)获取 81 个免费模型的完整列表。 + +## 免费 + 
工具调用 + +支持函数/工具调用的免费模型 — 零成本构建 Agent 的理想选择。 + +| 模型 | 提供商 | 上下文 | 能力 | +| ---- | ------ | ------ | ---- | + +## 免费 + 推理 + +具有链式思维推理的免费模型 — 零成本解决复杂问题。 + +| 模型 | 提供商 | 上下文 | 能力 | +| ---- | ------ | ------ | ---- | + +## 最佳性价比模型 + +最便宜的工具调用模型 — 生产 Agent 的最佳性价比。 + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 能力 | +| --------------------------- | ------------ | ------ | -------- | -------- | -------- | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | 🔧 👁 📋 | +| bdc-coder | inferencenet | 131K | $0.01 | $0.01 | 🔧 🔓 | +| inclusionai--ling-2.6-flash | openrouter | 262K | $0.01 | $0.03 | 🔧 📋 | +| ling-2.6-flash | inclusionai | 262K | $0.01 | $0.03 | 🔧 | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | 🧠 🔧 👁 | + +最便宜的视觉模型: + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 能力 | +| -------------------- | --------- | ------ | -------- | -------- | -------- | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | 🔧 👁 📋 | +| deepseek-ocr | aihubmix | 0 | $0.01 | $0.01 | 👁 | +| gemini-2.0-flash-exp | aihubmix | 0 | $0.01 | $0.04 | 👁 | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | 🧠 🔧 👁 | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | 🧠 👁 | + +最便宜的推理模型: + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 能力 | +| --------------------- | --------- | ------ | -------- | -------- | -------- | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | 🧠 🔧 👁 | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | 🧠 👁 | +| gemma-2-2b-it | cortecs | 0 | $0.018 | $0.054 | 🧠 | +| llama-3.1-8b-instruct | cortecs | 0 | $0.018 | $0.054 | 🧠 🔧 | +| qwen-3.5-2b | auriko | 262K | $0.02 | $0.1 | 🧠 🔧 👁 
| + +## 大上下文模型 + +上下文窗口最大的模型 — 适用于长文档、多轮对话和代码库。 + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 能力 | +| ---------------------------- | ---------- | ------ | -------- | -------- | -------- | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | 🔧 👁 📋 | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | 🔧 👁 | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | 🔧 👁 📋 | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | 🔧 👁 | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | 🔧 👁 | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🔧 👁 | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | 🔧 👁 | + +> 查看[上下文窗口对比](context-windows.md)获取完整分析。 + +## 成本优化技巧 + +1. **开发时使用免费模型** — 用免费模型原型开发,生产环境切换到付费模型 +2. **启用提示缓存** — [1,374 个模型](cached-pricing.md)支持缓存,输入成本节省 50-90% +3. **选择满足需求的最小模型** — 例如简单任务用 GPT-4.1 Mini 而非 GPT-4.1 +4. **使用开源权重模型** — [527 个模型](open-weights.md)可在自己的基础设施上运行 +5. **跨提供商对比** — 同一模型通过替代提供商(如 Groq、Together AI、DeepInfra)通常更便宜 +6. **批量请求** — 部分提供商对批量 API 调用提供 50% 折扣 +7. 
**监控用量** — 跟踪输入/输出 token 比率以优化模型选择 + +## 相关文档 + +- [模型对比](model-comparison.md) — 旗舰、高性价比、免费和开源模型 +- [定价对比](pricing-comparison.md) — 各提供商定价并排对比 +- [缓存定价](cached-pricing.md) — 支持提示缓存的模型 +- [免费 AI 模型](free-models.md) — 81 个免费模型按能力分类 +- [开源权重模型](open-weights.md) — 527 个可自行运行的模型 +- [上下文窗口对比](context-windows.md) — 最大上下文窗口 +- [工具调用模型](tool-calling.md) — 2,350 个支持工具调用的模型 +- [推理模型](reasoning-models.md) — 1,306 个支持推理的模型 +- [视觉模型](vision-models.md) — 1,487 个支持图像理解的模型 +- [快速入门](quick-start.md) — 30 秒上手 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML,包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/multimodal-models.md b/docs/zh/multimodal-models.md new file mode 100644 index 00000000..a3c54160 --- /dev/null +++ b/docs/zh/multimodal-models.md @@ -0,0 +1,101 @@ +# 多模态模型 + +[English](../multimodal-models.md) + +能够处理**多种输入模态**的 AI 模型 — 图像、音频和视频与文本并行。这些模型驱动视觉问答、文档分析、视频理解和音频转录。 + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models)。 + +## 为什么多模态模型很重要 + +多模态模型打破了纯文本的限制: + +- **视觉问答** — 对图像和文档提问 +- **文档分析** — 从 PDF、截图和扫描件中提取信息 +- **视频理解** — 分析视频内容,总结片段 +- **音频处理** — 转录语音,分析音频内容 +- **无障碍** — 为视障用户描述图像 +- **内容审核** — 跨模态检测不当内容 + +## 统计 + +| 指标 | 数量 | +| 
------------------ | ---- | +| 多模态模型 | 1519 | +| 提供商 | 61 | +| 图像输入 | 1487 | +| 音频输入 | 118 | +| 视频输入 | 167 | +| 免费多模态模型 | 53 | +| 开源权重多模态模型 | 119 | +| 带工具调用 | 1179 | +| 带推理能力 | 701 | + +## 提供商 + +`01ai`, `302ai`, `aihubmix`, `aimlapi`, `amazon`, `amazon-bedrock`, `anthropic`, `arcee`, `auriko`, `baidu`, `berget`, `bytedance`, `chutes`, `clarifai`, `cloudferro-sherlock`, `cloudflare`, `cortecs`, `databricks`, `deepinfra`, `digitalocean`, `evroc`, `fastrouter`, `fireworks`, `google`, `google-vertex` 等 36 个 + +## 免费多模态模型 + +支持多模态输入的免费模型 — 零成本视觉/音频应用。 + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 模态 | +| ---------------------------------------------------- | ---------- | ------ | -------- | -------- | -------------- | +| google--lyria-3-clip-preview | openrouter | 1M | Free | Free | 🖼️ | +| google--lyria-3-pro-preview | openrouter | 1M | Free | Free | 🖼️ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | 🖼️ 🎬 🔧 🧠 | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | 🖼️ 🎬 🔧 🧠 | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | 🖼️ 🔧 🧠 | +| gemma-4-31b-it | auriko | 262K | Free | Free | 🖼️ 🔧 🧠 | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | 🖼️ 🎤 🎬 🔧 🧠 | +| spotlight | arcee | 131K | Free | Free | 🖼️ | +| gemma-3-4b-it | google | 131K | Free | Free | 🖼️ | +| gemma-3-12b-it | google | 131K | Free | Free | 🖼️ | + +## 最便宜多模态模型 + +生产环境多模态应用的最佳性价比模型。 + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 模态 | +| -------------------------- | --------- | ------ | -------- | -------- | -------- | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | 🖼️ 
🔧 | +| deepseek-ocr | aihubmix | 0 | $0.01 | $0.01 | 🖼️ | +| gemini-2.0-flash-exp | aihubmix | 0 | $0.01 | $0.04 | 🖼️ 🎤 🎬 | +| qwen-3.5-0.8b | auriko | 262K | $0.01 | $0.05 | 🖼️ 🔧 🧠 | +| qwen3.5-0.8b | deepinfra | 262K | $0.01 | $0.05 | 🖼️ 🧠 | +| qwen3-vl-flash-2026-01-22 | aihubmix | 0 | $0.0103 | $0.103 | 🖼️ 🎬 🔧 | +| qwen3-vl-flash | aihubmix | 0 | $0.0103 | $0.103 | 🖼️ 🎬 🔧 | +| glm-ocr | aihubmix | 0 | $0.0141 | $0.0141 | 🖼️ | +| paddlepaddle--paddleocr-vl | novitaai | 16K | $0.02 | $0.02 | 🖼️ | +| qwen-3.5-2b | auriko | 262K | $0.02 | $0.1 | 🖼️ 🔧 🧠 | + +## 大上下文多模态模型 + +上下文窗口最大的多模态模型 — 适用于处理长文档和视频。 + +| 模型 | 提供商 | 上下文 | 输入 $/M | 输出 $/M | 模态 | +| ---------------------------- | ---------- | ------ | -------- | -------- | ----------- | +| meta-llama--llama-4-scout | openrouter | 10M | $0.08 | $0.3 | 🖼️ 🔧 | +| meta-llama-4-scout | meta | 10M | $0.17 | $0.66 | 🖼️ 🔧 | +| gemini-1.5-pro | google | 2M | $1.25 | $5 | 🖼️ 🎤 🎬 🔧 | +| grok-code-fast-1 | jiekou | 2M | $0.19 | $0.475 | 🖼️ 🔧 | +| gpt-4o | jiekou | 2M | $1.9 | $5.7 | 🖼️ 🔧 | +| grok-4.20-0309-non-reasoning | jiekou | 2M | $0.19 | $0.475 | 🖼️ 🔧 | +| grok-4.20-0309-reasoning | jiekou | 2M | $1.9 | $5.7 | 🖼️ 🔧 | +| grok-4-1-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🖼️ 🔧 | +| grok-4-fast-reasoning | jiekou | 2M | $0.19 | $0.475 | 🖼️ 🔧 | +| x-ai--grok-4-fast | fastrouter | 2M | $0.2 | $0.5 | 🖼️ 🔧 | + +## 相关文档 + +- [视觉模型](vision-models.md) — 1,487 个支持图像输入的模型 +- [视频模型](video-models.md) — 支持视频理解的模型 +- [音频模型](audio-models.md) — 支持音频输入/输出的模型 +- [图像生成](image-generation.md) — 28 个图像生成模型 +- [智能体模型](agentic-models.md) — 1,080 
个具备工具调用 + 推理能力的模型 +- [免费 AI 模型](free-models.md) — 81 个免费模型按能力分类 +- [模型选择指南](model-selection.md) — 选择模型的决策框架 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML,包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/open-weights.md b/docs/zh/open-weights.md new file mode 100644 index 00000000..7e7a6d83 --- /dev/null +++ b/docs/zh/open-weights.md @@ -0,0 +1,118 @@ +[English](../open-weights.md) | **中文** + +# 开源权重 AI 模型 + +本目录中有 513 个开源权重模型 — 你可以下载权重并在自己的基础设施上运行。本页重点介绍最有能力和最广泛可用的开源权重模型。 + +> 所有数据来自一手 API 和文档。"开源权重"表示模型权重公开可用;各模型的许可证条款不同。 + +## 快速统计 + +| 能力 | 开源权重模型数 | +| -------------------- | -------------: | +| 总开源权重模型 | 513 | +| 唯一模型 ID | 420 | +| 支持工具调用 | 270 | +| 支持推理 | 101 | +| 支持视觉(图像输入) | 104 | + +## 最广泛可用 + +这些开源权重模型在最多提供商上可用 — 容易找到,容易切换: + +| 模型 | 提供商数 | 上下文 | 工具调用 | 推理 | 视觉 | +| ----------------------------- | -------: | ------ | -------- | ---- | ---- | +| GPT-OSS-120B | 14 | 131K | ✅ | ✅ | ❌ | +| GPT-OSS-20B | 8 | 131K | ✅ | ✅ | ❌ | +| Qwen3.5-397B-A17B | 4 | 262K | ✅ | ✅ | ❌ | +| Kimi K2 Thinking | 4 | 262K | ✅ | ✅ | ✅ | +| DeepSeek-R1-Distill-Llama-70B | 4 | 131K | ✅ | ✅ | ❌ | +| Llama 4 Scout 17B | 4 | 328K | ✅ | ❌ | ✅ | +| DeepSeek-R1 | 3 | 131K | ✅ | ✅ | ❌ | +| Llama 4 Maverick | 3 | 1M | ✅ | ❌ | ✅ | +| Qwen3-32B | 3 | 131K | ✅ | ✅ | ❌ | +| Gemma 4 31B IT | 3 | 262K | ✅ | ✅ | ✅ | + +## 最大上下文窗口 + 
+拥有最大上下文窗口的开源权重模型: + +| 模型 | 上下文 | 工具调用 | 推理 | 视觉 | +| ----------------- | ------ | -------- | ---- | ---- | +| Llama 4 Scout | 10M | ✅ | ❌ | ✅ | +| Qwen3.5 Flash | 1M | ✅ | ❌ | ✅ | +| Qwen3.6 Flash | 1M | ✅ | ❌ | ✅ | +| Llama 4 Maverick | 1M | ✅ | ❌ | ✅ | +| DeepSeek-V4 Flash | 1M | ✅ | ✅ | ❌ | +| DeepSeek-V4 Pro | 1M | ✅ | ✅ | ❌ | +| MiMo V2.5 | 1M | ✅ | ✅ | ✅ | +| Minimax M2.5 | 1M | ✅ | ❌ | ❌ | +| Gemma 4 31B IT | 1M | ✅ | ❌ | ✅ | + +## 最佳开源权重推理模型 + +这些开源权重模型支持链式思维推理: + +| 模型 | 上下文 | 工具调用 | 视觉 | 提供商数 | +| -------------------- | ------ | -------- | ---- | -------: | +| DeepSeek-V4 Flash | 1M | ✅ | ❌ | 2 | +| DeepSeek-V4 Pro | 1M | ✅ | ❌ | 2 | +| MiMo V2.5 Pro | 1M | ✅ | ❌ | 1 | +| MiMo V2.5 | 1M | ✅ | ✅ | 1 | +| Gemma 4 26B A4B IT | 262K | ✅ | ✅ | 3 | +| Kimi K2.6 | 262K | ✅ | ✅ | 2 | +| Qwen3.5-397B-A17B | 262K | ✅ | ❌ | 2 | +| Nemotron-3-120B-A12B | 262K | ✅ | ❌ | 1 | +| DeepSeek-R1 | 131K | ✅ | ❌ | 3 | +| Qwen3-32B | 131K | ✅ | ✅ | 3 | + +## 最佳开源权重视觉模型 + +接受图像输入的开源权重模型: + +| 模型 | 上下文 | 工具调用 | 推理 | 提供商数 | +| ------------------ | ------ | -------- | ---- | -------: | +| MiMo V2.5 | 1M | ✅ | ✅ | 1 | +| Llama 4 Maverick | 1M | ✅ | ❌ | 3 | +| Llama 4 Scout | 10M | ✅ | ❌ | 2 | +| Gemma 4 31B IT | 1M | ✅ | ❌ | 3 | +| Qwen3.5 Flash | 1M | ✅ | ❌ | 1 | +| Kimi K2.6 | 262K | ✅ | ✅ | 2 | +| Gemma 4 26B A4B IT | 262K | ✅ | ✅ | 3 | +| Llama 4 Scout 17B | 328K | ✅ | ❌ | 4 | + +## 最便宜的开源权重模型 + +开源权重推理的最低每 token 定价: + +| 模型 | 提供商 | 输入 $/1M | 输出 $/1M | 上下文 | +| -------------------------- | ------------ | --------: | --------: | ------ | +| GLM-4-Flash | 302AI | 
$0.0014 | $0.0014 | 131K | +| Mistral-Nemo-Instruct-2407 | KlusterAI | $0.008 | $0.001 | 131K | +| BDC-Coder | InferenceNet | $0.01 | $0.01 | 131K | +| Granite 4.0 H Micro | Cloudflare | $0.017 | $0.112 | 131K | +| Llama 3.1 8B Instruct | InferenceNet | $0.02 | $0.03 | 131K | +| Mistral Nemo Instruct 2407 | MegaNova | $0.02 | $0.04 | 131K | +| Meta-Llama-3.1-8B-Instruct | Nebius | $0.02 | $0.06 | 131K | +| Llama 3.2 1B Instruct | Cloudflare | $0.027 | $0.201 | 131K | + +## 要点总结 + +- **513 个开源权重模型**,涵盖 420 个唯一模型 ID — 最大的开源权重模型目录 +- **GPT-OSS-120B** 是最广泛可用的,由 14 个提供商提供 +- **Llama 4 Scout** 拥有最大的上下文窗口(10M tokens) +- **DeepSeek-R1** 是最受欢迎的开源权重推理模型,在 3 个提供商上可用 +- **MiMo V2.5** 是唯一结合 1M 上下文、推理和视觉的开源权重模型 +- 定价差异很大 — 最便宜的开源权重模型每 1M tokens 不到 $0.01 + +## 相关文档 + +- [模型选择指南](model-selection.md) — 选择模型的决策框架 +- [免费 AI 模型](free-models.md) — 81 个免费模型 +- [提供商概览](providers.md) — 95 个提供商按类型分类 +- [推理模型](reasoning-models.md) — 1,306 个支持推理的模型 +- [缓存定价](cached-pricing.md) — 1,374 个支持提示缓存的模型 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML,包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/openai-alternatives.md b/docs/zh/openai-alternatives.md new file mode 100644 index 00000000..bb8be1af --- /dev/null +++ b/docs/zh/openai-alternatives.md @@ -0,0 +1,156 @@ +[English](../openai-alternatives.md) | **中文** + +# OpenAI 替代方案 — GPT-4、GPT-3.5 及更多 + +全面对比 OpenAI GPT-4、GPT-4o 和 GPT-3.5 Turbo 的替代模型 — 包含定价、能力和 API 
兼容性。所有数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) 一手 API。 + +## 快速对比:GPT-4 级别替代方案 + +具备 **工具调用 + 推理 + 视觉** 的模型(完整 GPT-4 能力集): + +| Model | Provider | Context | Input $/1M | Output $/1M | Open Weights | +| ----------------------------- | ---------- | ------- | ---------- | ----------- | ------------ | +| openai--gpt-oss-120b | novitaai | 128K | $0.05 | $0.25 | | +| Qwen--Qwen3.6-35B-A3B | neuralwatt | 0 | $0.05 | $0.1 | | +| Nemotron-3-Nano-Omni | nebius | 125K | $0.06 | $0.24 | ✅ | +| seed-1.6-flash | bytedance | 256K | $0.07 | $0.3 | | +| gemma-4-26b-a4b-it | cloudflare | 256K | $0.1 | $0.3 | ✅ | +| Gemma-3-27b-it | nebius | 93K | $0.1 | $0.3 | ✅ | +| seed-2.0-mini | bytedance | 256K | $0.1 | $0.4 | | +| google--gemma-4-26b-a4b-it | novitaai | 256K | $0.13 | $0.4 | | +| google--gemma-4-31B-turbo-TEE | chutes | 128K | $0.13 | $0.38 | | +| baidu--ernie-4.5-vl-28b-a3b | novitaai | 29K | $0.14 | $0.56 | | +| google--gemma-4-31b-it | novitaai | 256K | $0.14 | $0.4 | | +| amazon-nova-2.0-lite | amazon | 62K | $0.15 | $1.25 | | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | | +| amazon-nova-2.0-omni | amazon | 62K | $0.2 | $1.3 | | +| xai-grok-4.1 | xai | 128K | $0.2 | $0.5 | | + +> 完整列表:50+ 提供商共 617 个具备工具调用+推理+视觉的模型。详见 [智能体模型](agentic-models.md)。 + +## 最便宜的工具调用模型 + +最具性价比的函数/工具调用模型(仅直连提供商): + +| Model | Provider | Context | Input $/1M | Output $/1M | +| ------------------------------------------- | -------------- | ------- | ---------- | ----------- | +| ling-2.6-flash | inclusionai | 256K | $0.01 | $0.03 | +| bdc-coder | inferencenet | 128K | $0.01 | $0.01 | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | 127K | $0.015 | $0.02 | +| granite-4.0-h-micro | cloudflare | 128K | $0.017 | $0.112 | +| 
schematron-v3 | inferencenet | 128K | $0.02 | $0.05 | +| schematron-3b | inferencenet | 128K | $0.02 | $0.05 | +| llama-3.1-8b-instruct--fp-16 | inferencenet | 128K | $0.02 | $0.03 | +| liquid-ai--LFM2-24B-A2B | togetherai | 128K | $0.03 | $0.12 | +| qwen--qwen3-4b-fp8 | novitaai | 125K | $0.03 | $0.03 | +| schematron-v2-turbo | inferencenet | 128K | $0.03 | $0.15 | +| gpt-oss-20b | inferencenet | 128K | $0.03 | $0.15 | +| openai--gpt-oss-20b | neuralwatt | 0 | $0.03 | $0.16 | +| amazon-nova-micro | amazon | 125K | $0.035 | $0.14 | +| amazon-nova-micro | amazon-bedrock | 125K | $0.035 | $0.14 | +| mistral-nemo-12b-instruct--fp-8 | inferencenet | 128K | $0.0375 | $0.1 | + +> ๅฎŒๆ•ดๅˆ—่กจ๏ผš67 ไธชๆไพ›ๅ•†ๅ…ฑ 2,350 ไธชๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ใ€‚่ฏฆ่ง [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md)ใ€‚ + +## GPT-4 ๅ…่ดนๆ›ฟไปฃๆ–นๆกˆ + +้›ถๆˆๆœฌ็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹๏ผˆไป…็›ด่ฟžๆไพ›ๅ•†๏ผ‰๏ผš + +| Model | Provider | Context | Capabilities | +| --------------------------------- | -------- | ------- | ---------------------------- | +| glm-4.7-flash | zhipuai | 195K | Tool Call | +| glm-4.1v-thinking-flash | zhipuai | 62K | Reasoning, Vision, Tool Call | +| glm-4-flash-250414 | zhipuai | 125K | Tool Call | +| glm-4v-flash | zhipuai | 15K | Vision, Tool Call | +| autoglm-phone | zhipuai | 19K | Vision, Tool Call | +| glm-ocr | zhipuai | 0 | Vision, Tool Call | +| glm-4.6v-flash | zhipuai | 125K | Vision, Tool Call | +| cobuddy | baidu | 128K | Tool Call | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | 64K | Vision, Tool Call | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | 64K | Reasoning, Vision, Tool Call | +| baidu--ernie-4.5-0.3b | aimlapi | 117K | Tool Call | +| qwen--qwen3.5-4b-free | mixlayer | 128K | Reasoning, Tool Call | +| llama-4-scout-17b-16e-instruct | cerebras | 128K | Tool Call | +| qwen-2.5-32b | cerebras | 128K | Tool Call | +| llama-3.3-70b | cerebras | 128K | Tool Call | + +> ๅฎŒๆ•ดๅˆ—่กจ๏ผš81 ไธชๅ…่ดนๆจกๅž‹ใ€‚่ฏฆ่ง [ๅ…่ดน AI ๆจกๅž‹](free-models.md)ใ€‚ + +## 
ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +| Model | Provider | Context | Input $/1M | Output $/1M | +| -------------------------------------------------- | ----------- | ------- | ---------- | ----------- | +| meta-llama-4-scout | meta | 9765K | $0.17 | $0.66 | +| xai--grok-4-fast-reasoning | aimlapi | 1953K | $0.52 | $1.3 | +| xai--grok-4-fast-non-reasoning | aimlapi | 1953K | $0.52 | $1.3 | +| meta-llama--Llama-4-Maverick-17B-128E-Instruct-FP8 | gmicloud | 1024K | $0.25 | $0.8 | +| minimax-m2-5 | baseten | 1024K | $0.3 | $1.2 | +| deepseek-v4-flash | baidu | 1024K | $0.126 | $0.252 | +| deepseek-v4-pro | siliconflow | 1024K | $1.74 | $3.48 | +| deepseek-v4-flash | siliconflow | 1024K | $0.14 | $0.28 | +| deepseek--deepseek-v4-pro | novitaai | 1024K | $1.67 | $3.38 | +| xiaomimimo--mimo-v2.5-pro | novitaai | 1024K | $2 | $6 | +| deepseek--deepseek-v4-flash | novitaai | 1024K | $0.14 | $0.28 | +| gemini-2.0-flash-lite | google | 1024K | $0.075 | $0.3 | +| gemini-2.5-flash | google | 1024K | $0.15 | $3.5 | +| gemini-2.5-pro | google | 1024K | $1.25 | $10 | +| gemini-2.0-flash | google | 1024K | $0.1 | $0.4 | + +> ๅฎŒๆ•ดๅˆ—่กจ๏ผš2,195 ไธช 128K+ ไธŠไธ‹ๆ–‡ๆจกๅž‹ใ€‚่ฏฆ่ง [ๅคงไธŠไธ‹ๆ–‡ๆจกๅž‹](large-context-models.md)ใ€‚ + +## OpenAI ๅ…ผๅฎนๆไพ›ๅ•† + +70 ไธชๆไพ›ๅ•†ๆไพ› OpenAI ๅ…ผๅฎน API ็ซฏ็‚น โ€” ๆœ€ๅฐ‘ไปฃ็ ไฟฎๆ”นๅณๅฏๅˆ‡ๆข๏ผš + +| Provider | API Endpoint | Model Count | Free Tier | +| --------------- | -------------------------------------------- | ----------- | --------- | +| Regolo | `https://api.regolo.ai/v1` | 1 | โ€” | +| MegaNova | `https://api.meganova.ai/v1` | 1 | โ€” | +| GMI Cloud | `https://api.gmi-serving.com/v1` | 1 | โ€” | +| Cohere | `https://api.cohere.com` | 1 | โ€” | +| Requesty | `https://router.requesty.ai/v1` | 1 | โ€” | +| ๆŽฅๅฃ AI | `https://api.jiekou.ai/v1` | 1 | โ€” | +| Zhipu AI (ๆ™บ่ฐฑ) | `https://open.bigmodel.cn/api/paas/v4` | 1 | โ€” | +| SambaNova | `https://api.sambanova.ai/v1` | 1 | โ€” | +| Baseten | 
`https://model-api.baseten.co/v1` | 1 | โ€” | +| Wafer | `https://pass.wafer.ai/v1` | 1 | โ€” | +| Arcee AI | `https://api.arcee.ai/v1` | 1 | โ€” | +| Moonshot AI | `https://api.moonshot.cn/v1` | 1 | โ€” | +| Amazon Nova | `https://bedrock.us-east-1.amazonaws.com/v1` | 1 | โ€” | +| Baidu | `https://qianfan.baidubce.com/v1` | 1 | โ€” | +| Together AI | `https://api.together.xyz/v1` | 1 | โ€” | +| OpenRouter | `https://openrouter.ai/api/v1` | 1 | โ€” | +| FastRouter | `https://api.fastrouter.ai/v1` | 1 | โ€” | +| SubModel | `https://api.submodel.ai/v1` | 1 | โ€” | +| Inception Labs | `https://api.inceptionlabs.ai/v1` | 1 | โ€” | +| SiliconFlow | `https://api.siliconflow.cn/v1` | 1 | โ€” | + +> ่ฏฆ่ง [่ฟ็งปๆŒ‡ๅ—](migration-guide.md) ไบ†่งฃไปŽ OpenAI ๅˆ‡ๆข็š„ๆญฅ้ชคใ€‚ + +## ้€‰ๆ‹ฉไฝ ็š„ๆ›ฟไปฃๆ–นๆกˆ + +| ้œ€ๆฑ‚ | ๆœ€ไฝณ้€‰ๆ‹ฉ | ่ฏฆ่ง | +| ------------------ | ---------------------------------- | ------------------------------------- | +| ๆœ€ไพฟๅฎœ็š„ๅทฅๅ…ท่ฐƒ็”จ | DeepSeek, Qwen3 | [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) | +| GPT-4 ็บงๅˆซๆŽจ็† | Claude Opus 4, Gemini 2.5 Pro | [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) | +| ๅ…่ดนๅŽŸๅž‹ๅผ€ๅ‘ | Google Gemini, Cloudflare | [Free Models](free-models.md) | +| ๆœ€ๅคงไธŠไธ‹ๆ–‡ | Gemini 2.5 Pro (1M), Llama 4 (10M) | [Context Windows](context-windows.md) | +| ๅผ€ๆบๆƒ้‡่‡ช้ƒจ็ฝฒ | Llama 4, Qwen3 | [Open-Weight Models](open-weights.md) | +| ่ฝปๆพไปŽ OpenAI ่ฟ็งป | Any OpenAI-compatible provider | [่ฟ็งปๆŒ‡ๅ—](migration-guide.md) | +| ่ฟ่กŒ AI ๆ™บ่ƒฝไฝ“ | Models with tool_call + reasoning | [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md) โ€” 2,350 models with function calling +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 models with chain-of-thought +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 models with image understanding +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 models at zero cost +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” side-by-side pricing across 
providers +- [่ฟ็งปๆŒ‡ๅ—](migration-guide.md) โ€” switch providers with minimal code changes +- [ๆไพ›ๅ•†ๅฏนๆฏ”](provider-comparison.md) โ€” top 30 providers by model count +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 models for AI agents +- [ไปฃ็ ๆจกๅž‹](code-models.md) โ€” 189 ไธชไปฃ็ ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/pricing-comparison.md b/docs/zh/pricing-comparison.md new file mode 100644 index 00000000..0441442c --- /dev/null +++ b/docs/zh/pricing-comparison.md @@ -0,0 +1,134 @@ +[English](../pricing-comparison.md) | **ไธญๆ–‡** + +# ๅฎšไปทๅฏนๆฏ” + +ๅ„ๆไพ›ๅ•†ๅ’Œๅนณๅฐ็š„ AI ๆจกๅž‹ๆŽจ็†ๅฎšไปทๅนถๆŽ’ๅฏนๆฏ”ใ€‚ๆ‰€ๆœ‰ไปทๆ ผไปฅ็พŽๅ…ƒๆฏ็™พไธ‡ token ่ฎก๏ผŒๆฅ่‡ช็ฌฌไธ€ๆ–น APIใ€‚ + +## ็›ดๆŽฅๆไพ›ๅ•†ๅฎšไปท + +ๆจกๅž‹็”Ÿไบงๅ•†่‡ชๆœ‰ API ็š„ๅฎšไปทใ€‚ + +### OpenAI + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ็ผ“ๅญ˜่ฏปๅ– $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ------------ | ---------------: | ---------------: | -------------------: | -----: | +| GPT-4.1 Nano | 0.10 | 0.40 | 0.025 | 1M | +| GPT-4o Mini | 0.15 | 0.60 | 0.075 | 128K | +| GPT-4.1 Mini | 0.40 | 1.60 | 0.10 | 1M | +| GPT-4.1 | 2.00 | 8.00 | 0.50 | 1M | +| GPT-4o | 2.50 | 10.00 | 1.25 | 128K | +| o4-mini | 1.10 | 4.40 | 0.275 | 200K | +| o3 | 10.00 | 40.00 | 2.50 | 200K | + +### Anthropic + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ----------------- | ---------------: | ---------------: | -----: | +| Claude Haiku 4.5 | 1.00 | 5.00 | 200K | +| Claude Sonnet 4.0 | 3.00 | 15.00 | 1M | +| Claude Sonnet 4.5 | 3.00 | 15.00 | 1M | +| Claude Sonnet 4.6 | 3.00 | 15.00 | 1M | +| Claude Opus 4.5 | 5.00 | 25.00 | 200K | +| Claude Opus 4.7 | 5.00 | 25.00 | 1M | + +### Google + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ็ผ“ๅญ˜่ฏปๅ– $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| 
--------------------- | ---------------: | ---------------: | -------------------: | -----: | +| Gemini 1.5 Flash 8B | 0.075 | 0.30 | โ€” | 1M | +| Gemini 2.0 Flash Lite | 0.075 | 0.30 | โ€” | 1M | +| Gemini 2.0 Flash | 0.10 | 0.40 | โ€” | 1M | +| Gemini 2.5 Flash Lite | 0.10 | 0.40 | โ€” | 1M | +| Gemini 2.5 Flash | 0.15 | 3.50 | 0.0375 | 1M | +| Gemini 2.5 Pro | 1.25 | 10.00 | 0.315 | 1M | + +### DeepSeek + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ็ผ“ๅญ˜่ฏปๅ– $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ----------------- | ---------------: | ---------------: | -------------------: | -----: | +| DeepSeek-V4-Flash | 0.14 | 0.28 | 0.0028 | 1M | +| DeepSeek-V4-Pro | 0.435 | 0.87 | 0.003625 | 1M | + +### xAI + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ----------- | ---------------: | ---------------: | -----: | +| Grok 4 Fast | 0.20 | 0.50 | 131K | +| Grok 4.1 | 0.20 | 0.50 | 131K | +| Grok 3 Mini | 0.25 | 1.27 | 131K | +| Grok 4.2 | 2.00 | 6.00 | 131K | +| Grok 3 | 3.00 | 15.00 | 131K | +| Grok 4 | 3.00 | 15.00 | 131K | + +### Meta๏ผˆๆ‰˜็ฎกๆŽจ็†๏ผ‰ + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ---------------- | ---------------: | ---------------: | -----: | +| Llama 3.2 1B | 0.10 | 0.10 | 128K | +| Llama 4 Scout | 0.17 | 0.66 | 10M | +| Llama 4 Maverick | 0.24 | 0.97 | 1M | + +### Mistral + +| ๆจกๅž‹ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ------------- | ---------------: | ---------------: | -----: | +| Ministral 3B | 0.04 | 0.04 | 128K | +| Ministral 8B | 0.10 | 0.10 | 128K | +| Mistral Small | 0.20 | 0.60 | 128K | +| Mistral Large | 2.00 | 6.00 | 128K | + +## ่ทจๅนณๅฐไปทๆ ผๅฏนๆฏ” + +ๅŒไธ€ๆจกๅž‹ๅœจไธๅŒๆŽจ็†ๅนณๅฐไธŠ็š„ไปทๆ ผ โ€” ๅทฎๅผ‚ๅฏ่ƒฝๅพˆๅคงใ€‚ + +### Llama 4 Scout๏ผˆ10M ไธŠไธ‹ๆ–‡๏ผ‰ + +| ๅนณๅฐ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | +| ------------ | ---------------: | ---------------: | +| AIHubMix | 0.061 | 0.183 | +| Auriko | 0.08 | 0.30 | +| DeepInfra | 
0.08 | 0.30 | +| Kluster AI | 0.08 | 0.45 | +| Meta๏ผˆ็›ด่ฟž๏ผ‰ | 0.17 | 0.66 | + +### Llama 4 Maverick๏ผˆ1M ไธŠไธ‹ๆ–‡๏ผ‰ + +| ๅนณๅฐ | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | +| --------------- | ---------------: | ---------------: | +| AIHubMix | 0.10 | 0.10 | +| ๆŽฅๅฃ AI | 0.10 | 0.50 | +| AIHubMix (Groq) | 0.11 | 0.33 | +| Cortecs | 0.124 | 0.603 | +| Auriko | 0.15 | 0.60 | +| Meta๏ผˆ็›ด่ฟž๏ผ‰ | 0.24 | 0.97 | + +## ๆœ€ไพฟๅฎœ็š„ๆจกๅž‹ + +ๆ‰€ๆœ‰ๆไพ›ๅ•†ไธญๆŒ‰ token ่ฎก่ดนๆœ€ไพฟๅฎœ็š„ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/็™พไธ‡token | ่พ“ๅ‡บ $/็™พไธ‡token | ไธŠไธ‹ๆ–‡ | +| ------------------- | -------- | ---------------: | ---------------: | -----: | +| Ministral 3B | Mistral | 0.04 | 0.04 | 128K | +| Voxtral Mini | Mistral | 0.04 | 0.04 | 128K | +| Ministral 8B | Mistral | 0.10 | 0.10 | 128K | +| Llama 3.2 1B | Meta | 0.10 | 0.10 | 128K | +| GPT-4.1 Nano | OpenAI | 0.10 | 0.40 | 1M | +| Gemini 1.5 Flash 8B | Google | 0.075 | 0.30 | 1M | +| DeepSeek-V4-Flash | DeepSeek | 0.14 | 0.28 | 1M | + +--- + +**ๆณจๆ„**๏ผšๆ‰€ๆœ‰ๅฎšไปทๆฅ่‡ช็ฌฌไธ€ๆ–นๆฅๆบ๏ผŒไปฅๆ•ฐๆฎ้‡‡้›†ๆ—ฅๆœŸไธบๅ‡†ใ€‚ๆŽจ็†ๅนณๅฐไปทๆ ผๅฏ่ƒฝไธๅŒใ€‚ๆŸฅ็œ‹ `providers//models/` ่Žทๅ–ๆœ€ๆ–ฐๆ•ฐๆฎใ€‚ไบบๆฐ‘ๅธๅ’Œๆฌงๅ…ƒๅฎšไปท่งๆไพ›ๅ•† YAML ๆ–‡ไปถใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ +- [ไธŠไธ‹ๆ–‡็ช—ๅฃๅฏนๆฏ”](context-windows.md) โ€” ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ +- [ๆไพ›ๅ•†ๆฆ‚่งˆ](providers.md) โ€” 95 ไธชๆไพ›ๅ•† +- [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](openai-alternatives.md) โ€” ๆœ€ไพฟๅฎœ็š„ GPT-4 ๆ›ฟไปฃ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/provider-comparison.md b/docs/zh/provider-comparison.md new file mode 100644 index 
00000000..f022cf11 --- /dev/null +++ b/docs/zh/provider-comparison.md @@ -0,0 +1,127 @@ +# ๆไพ›ๅ•†ๅฏนๆฏ” + +[English](../provider-comparison.md) + +AI ๆจกๅž‹ๆไพ›ๅ•†็š„ๅนถๆŽ’ๅฏนๆฏ” โ€” ๆจกๅž‹ๆ•ฐ้‡ใ€่ƒฝๅŠ›ใ€ๅฎšไปทๅ’ŒไธŠไธ‹ๆ–‡็ช—ๅฃไธ€็›ฎไบ†็„ถใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ๆŒ‰ๆจกๅž‹ๆ•ฐ้‡ๆŽ’ๅ็š„ๅ‰ 30 ไธชๆไพ›ๅ•† + +| ๆไพ›ๅ•† | ๆจกๅž‹ | ๅ…่ดน | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | ่ง†่ง‰ | ๆœ€ไฝŽ $/M | ่ƒฝๅŠ› | +| -------------- | ---: | ---: | -------: | ---: | ---: | -------: | ----------- | +| nanogpt | 547 | 0 | 0 | 0 | 0 | $0.02 | | +| aihubmix | 476 | 0 | 132 | 74 | 145 | $0.00 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| openrouter | 356 | 29 | 263 | 190 | 160 | $0.01 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| martian | 304 | 0 | 0 | 3 | 2 | $0.02 | ๐Ÿง  ๐Ÿ‘๏ธ | +| requesty | 277 | 0 | 251 | 139 | 151 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| 302ai | 268 | 0 | 190 | 44 | 144 | $0.00 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| auriko | 181 | 5 | 154 | 108 | 93 | $0.01 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ–ผ๏ธ | +| llmgateway | 163 | 3 | 158 | 85 | 89 | $0.03 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ–ผ๏ธ | +| aimlapi | 147 | 2 | 21 | 0 | 14 | $0.01 | ๐Ÿ”ง ๐Ÿ‘๏ธ | +| fastrouter | 120 | 2 | 94 | 66 | 65 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| orcarouter | 120 | 0 | 102 | 64 | 111 | $0.05 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| cortecs | 105 | 0 | 97 | 82 | 52 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| novitaai | 104 | 2 | 72 | 53 | 33 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| vultr | 98 | 0 | 11 | 22 | 23 | $0.55 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| deepinfra | 88 | 0 | 0 | 51 | 38 | $0.01 | ๐Ÿง  ๐Ÿ‘๏ธ | +| venice | 75 | 0 | 64 | 55 | 39 | $0.05 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| jiekou | 73 | 0 | 73 | 0 | 49 | $0.03 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐Ÿ”“ | +| meganova | 63 | 4 | 60 | 7 | 37 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| alibaba | 62 | 0 | 62 | 52 | 0 | $0.15 | ๐Ÿ”ง ๐Ÿง  | +| ppio | 60 | 1 | 46 | 12 | 11 | $0.21 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| amazon-bedrock | 57 | 0 | 37 | 0 | 16 | $0.04 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐ŸŽค ๐ŸŽฌ | +| 
google-vertex | 38 | 0 | 32 | 0 | 19 | $0.07 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐ŸŽค ๐ŸŽฌ | +| siliconflow-cn | 37 | 0 | 2 | 7 | 9 | $0.50 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ | +| stepfun | 31 | 14 | 0 | 0 | 11 | $0.70 | ๐Ÿ‘๏ธ ๐ŸŽค ๐Ÿ–ผ๏ธ | +| cloudflare | 30 | 0 | 15 | 10 | 7 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| gmicloud | 29 | 0 | 11 | 10 | 0 | $0.07 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ”“ | +| databricks | 29 | 0 | 4 | 0 | 10 | $0.05 | ๐Ÿ”ง ๐Ÿ‘๏ธ ๐Ÿ”“ | +| openai | 28 | 5 | 18 | 8 | 12 | $0.02 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐ŸŽค | +| siliconflow | 27 | 0 | 24 | 2 | 3 | $0.04 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ‘๏ธ ๐Ÿ”“ | +| togetherai | 24 | 0 | 22 | 2 | 0 | $0.03 | ๐Ÿ”ง ๐Ÿง  ๐Ÿ”“ | + +## ๆไพ›ๅ•†ๅˆ†็ฑป + +### ่šๅˆๅ™จ๏ผˆๅคšๆไพ›ๅ•†่ฎฟ้—ฎ๏ผ‰ + +่ฟ™ไบ›ๆไพ›ๅ•†้€š่ฟ‡ๅ•ไธ€ API ๆไพ›ๅคšๅฎถ AI ๅ…ฌๅธ็š„ๆจกๅž‹๏ผš + +| ๆไพ›ๅ•† | ๆจกๅž‹ | ๅค‡ๆณจ | +| ---------- | ---: | --------------------------------- | +| openrouter | 356 | ๆœ€ๅคง็š„ๆจกๅž‹่šๅˆๅ™จ๏ผŒOpenAI ๅ…ผๅฎน API | +| requesty | 277 | ๆ™บ่ƒฝ่ทฏ็”ฑ | +| martian | 304 | ๅคšๆไพ›ๅ•†่ดŸ่ฝฝๅ‡่กก | +| aihubmix | 476 | ไธญๅ›ฝๅธ‚ๅœบ่šๅˆๅ™จ | +| nanogpt | 547 | ๆŒ‰้‡ไป˜่ดน๏ผŒๆ— ้œ€่ฎข้˜… | +| llmgateway | 163 | ไผไธš API ็ฝ‘ๅ…ณ | +| fastrouter | 120 | ๅฟซ้€Ÿๆจกๅž‹่ทฏ็”ฑ | +| orcarouter | 120 | ๅคšๆไพ›ๅ•†่ทฏ็”ฑ | + +### ็›ดไพ›ๆไพ›ๅ•†๏ผˆ็ฌฌไธ€ๆ–น API๏ผ‰ + +| ๆไพ›ๅ•† | ๆจกๅž‹ | ไธ“้•ฟ | +| --------- | ---: | --------------------------- | +| openai | 28 | GPT-4.1, o3/o4 ๆŽจ็†ๆจกๅž‹ | +| anthropic | 11 | Claude 4 ็ณปๅˆ—๏ผŒๆœ€้€‚ๅˆ Agent | +| google | 21 | Gemini 2.5, 1M+ ไธŠไธ‹ๆ–‡ | +| deepseek | 4 | DeepSeek R1๏ผŒๆœ€ไฝณๅผ€ๆบๆŽจ็† | +| meta | 12 | Llama 4๏ผŒๅผ€ๆบๆƒ้‡ | +| mistral | 16 | Mistral Large, Codestral | +| xai | 6 | Grok 3๏ผŒๅฎžๆ—ถๆ•ฐๆฎ | +| alibaba | 62 | Qwen 3๏ผŒๆœ€ๅคง็š„ๅผ€ๆบๅฎถๆ— | + +### ๅŸบ็ก€่ฎพๆ–ฝๆไพ›ๅ•†๏ผˆๆ‰˜็ฎกๅผ€ๆบๆจกๅž‹๏ผ‰ + +| ๆไพ›ๅ•† | ๆจกๅž‹ | ไธ“้•ฟ | +| ---------- | ---: | --------------------- | +| groq | 12 | ๆœ€ๅฟซๆŽจ็† (LPU) | +| cerebras | 11 | ่ถ…ๅฟซๆŽจ็† (CS-3) | +| togetherai | 24 | ๆ— ๆœๅŠกๅ™จๅผ€ๆบๆ‰˜็ฎก | +| deepinfra | 88 | 
้ซ˜ๆ€งไปทๆฏ”ๆŽจ็† | +| fireworks | 10 | ๆ— ๆœๅŠกๅ™จๆจกๅž‹ๆ‰˜็ฎก | +| cloudflare | 30 | ่พน็ผ˜ๆŽจ็† (Workers AI) | + +### ๅŒบๅŸŸๆไพ›ๅ•† + +| ๆไพ›ๅ•† | ๆจกๅž‹ | ๅŒบๅŸŸ | +| ------------------- | ---: | ------------ | +| siliconflow | 27 | ไธญๅ›ฝ | +| siliconflow-cn | 37 | ไธญๅ›ฝ๏ผˆๅ›ฝๅ†…๏ผ‰ | +| stepfun | 31 | ไธญๅ›ฝ | +| zhipuai | 20 | ไธญๅ›ฝ | +| baichuan | 11 | ไธญๅ›ฝ | +| baidu | 8 | ไธญๅ›ฝ | +| iflytek | 6 | ไธญๅ›ฝ | +| tencent | 14 | ไธญๅ›ฝ | +| ppio | 60 | ไธญๅ›ฝ | +| ovhcloud | 12 | ๆฌงๆดฒ๏ผˆๆณ•ๅ›ฝ๏ผ‰ | +| scaleway | 13 | ๆฌงๆดฒ๏ผˆๆณ•ๅ›ฝ๏ผ‰ | +| cloudferro-sherlock | 12 | ๆฌงๆดฒ๏ผˆๆฌง็›Ÿ๏ผ‰ | + +## ้€‰ๆ‹ฉๆไพ›ๅ•† + +| ๅฆ‚ๆžœๆ‚จ้œ€่ฆ... | ๆœ€ไฝณๆไพ›ๅ•† | ๅŽŸๅ›  | +| ---------------- | ------------------------------ | ---------------------- | +| **ๆœ€ไฝŽไปทๆ ผ** | deepseek, google | ่พ“ๅ…ฅไฝŽ่‡ณ $0.14/M token | +| **ๆœ€ๅฟซๆŽจ็†** | groq, cerebras | ไบš 100ms ๅปถ่ฟŸ | +| **ๆœ€ๅคงไธŠไธ‹ๆ–‡** | google, meta | 1M-10M token ไธŠไธ‹ๆ–‡ | +| **ๆœ€ๅคšๆจกๅž‹** | nanogpt, aihubmix | ๅ„ 500+ ๆจกๅž‹ | +| **ๆœ€้€‚ๅˆ Agent** | anthropic, openai | ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็† | +| **ๅผ€ๆบๆƒ้‡** | meta, deepseek | ๅœจ่‡ชๆœ‰็กฌไปถไธŠ่ฟ่กŒ | +| **ๆฌง็›Ÿๆ•ฐๆฎ้ฉป็•™** | ovhcloud, scaleway, cloudferro | ๆฌง็›Ÿๆ‰˜็ฎกๆŽจ็† | +| **ไธญๅ›ฝ่ฎฟ้—ฎ** | siliconflow, ppio, stepfun | ไธญๅ›ฝ่Š‚็‚น | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [่ฟ็งปๆŒ‡ๅ—](migration-guide.md) โ€” ๅˆ‡ๆขๆไพ›ๅ•†็š„ๅฎšไปทๅฏนๆฏ” +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ่ทจๆไพ›ๅ•†ๅฎšไปทๅฏนๆฏ” +- [ๆไพ›ๅ•†ๆฆ‚่งˆ](providers.md) โ€” ๅ…จ้ƒจ 95 ไธชๆไพ›ๅ•†ๅˆ—่กจ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑป +- [่Šๅคฉๆจกๅž‹](chat-models.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„่Šๅคฉๆจกๅž‹ +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 ไธชๅ…ทๅค‡ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็†่ƒฝๅŠ›็š„ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 
4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/providers.md b/docs/zh/providers.md new file mode 100644 index 00000000..5177170f --- /dev/null +++ b/docs/zh/providers.md @@ -0,0 +1,172 @@ +[English](../providers.md) | **ไธญๆ–‡** + +# ๆไพ›ๅ•†ๆฆ‚่งˆ + +ๆœฌ็›ฎๅฝ•ไธญๆ‰€ๆœ‰ 95 ไธช AI ๆจกๅž‹ๆไพ›ๅ•†็š„็ปผๅˆๆฆ‚่งˆ๏ผŒๆŒ‰็ฑปๅž‹ๅˆ†็ฑปใ€‚ + +## ๆจกๅž‹็”Ÿไบงๅ•† + +ๅผ€ๅ‘ๅ’Œ็”Ÿไบง่‡ชๆœ‰ AI ๆจกๅž‹็š„ๆไพ›ๅ•†ใ€‚ๅฎƒไปฌ็š„ API ๅ’Œๆ–‡ๆกฃๆ˜ฏๆจกๅž‹ๆ•ฐๆฎ็š„ๆƒๅจๆฅๆบใ€‚ + +| ๆไพ›ๅ•† | ID | ๆจกๅž‹ๆ•ฐ | ไปฃ่กจๆจกๅž‹ | API ๆ ผๅผ | +| --------------------- | ------------- | -----: | ---------------------------------- | --------- | +| 01.AI (้›ถไธ€ไธ‡็‰ฉ) | `01ai` | 5 | Yi-Lightning, Yi-Vision | OpenAI | +| AI21 Labs | `ai21` | 2 | Jamba 1.5 | OpenAI | +| ้˜ฟ้‡Œไบ‘็™พ็‚ผ | `alibaba` | 62 | Qwen 3, Qwen 2.5 | OpenAI | +| Amazon Nova | `amazon` | 7 | Nova Pro, Nova Lite | OpenAI | +| Anthropic | `anthropic` | 11 | Claude Opus 4.7, Claude Sonnet 4.6 | Anthropic | +| ๅญ—่Š‚่ทณๅŠจ | `bytedance` | 5 | ่ฑ†ๅŒ…-Pro, ่ฑ†ๅŒ…-Lite | OpenAI | +| Cloudflare Workers AI | `cloudflare` | 30 | Llama 3.3, Mistral | OpenAI | +| Cohere | `cohere` | โ€” | Command R+, Embed 3 | OpenAI | +| DeepSeek | `deepseek` | 4 | DeepSeek-V4-Pro, DeepSeek-R1 | OpenAI | +| Google | `google` | 21 | Gemini 3.5 Flash, Gemini 3.1 Pro | Google | +| IBM Granite | `ibm` | โ€” | Granite 3.3 | OpenAI | +| ่ฎฏ้ฃžๆ˜Ÿ็ซ | `iflytek` | 6 | SparkDesk 4.0 Ultra | OpenAI | +| Inception Labs | `inception` | 5 | Mercury Coder | OpenAI | +| InclusionAI | `inclusionai` | 3 | Book3R | OpenAI | +| Meta Llama | `meta` | 12 | Llama 4 Maverick, Llama 4 Scout | OpenAI | +| Microsoft Phi | `microsoft` | 12 | Phi-4, Phi-4-Mini | OpenAI | +| MiniMax | `minimax` | 21 | MiniMax-Text-01, MiniMax-M1 | OpenAI | +| Mistral AI | `mistral` | 16 | Mistral Large, Codestral | OpenAI | +| Moonshot AI | `moonshotai` | 16 | Kimi K2.6, Kimi K2.5 | OpenAI | +| NVIDIA | `nvidia` | โ€” | Nemotron Ultra | OpenAI | +| OpenAI | 
`openai` | 28 | GPT-5.5, GPT-5.4, o3 | OpenAI | +| Perplexity | `perplexity` | 4 | Sonar, Sonar Pro | OpenAI | +| Reka AI | `reka` | 2 | Reka Core, Reka Flash | OpenAI | +| Sarvam AI | `sarvam` | โ€” | Sarvam-M | OpenAI | +| ้˜ถ่ทƒๆ˜Ÿ่พฐ | `stepfun` | 31 | Step-2, Step-1.5V | OpenAI | +| ่…พ่ฎฏๆททๅ…ƒ | `tencent` | 14 | ๆททๅ…ƒ-Turbos | OpenAI | +| Upstage | `upstage` | 8 | Solar Pro, Solar Mini | OpenAI | +| Voyage AI | `voyage` | 21 | Voyage 3, Voyage Code 3 | OpenAI | +| Writer | `writer` | 6 | Palmyra X5 | OpenAI | +| xAI Grok | `xai` | 6 | Grok 3, Grok 3 Mini | OpenAI | +| ๅฐ็ฑณ | `xiaomi` | 5 | MiMo | OpenAI | +| ๆ™บ่ฐฑ AI | `zhipuai` | 20 | GLM-4, GLM-Z1 | OpenAI | + +## ๆŽจ็†ๅนณๅฐ + +ๆ‰˜็ฎกๅ’Œๆไพ›ไป–ไบบ็”Ÿไบง็š„ๆจกๅž‹็š„ๆไพ›ๅ•†ใ€‚ๅฎƒไปฌๆไพ›่‡ชๅทฑ็š„ๆŒ‰ token ่ฎก่ดนๅ’Œ API ่ฎฟ้—ฎใ€‚ + +| ๆไพ›ๅ•† | ID | ๆจกๅž‹ๆ•ฐ | ่ฎก่ดนๅธ็ง | API ๆ ผๅผ | +| --------------------- | --------------------- | -----: | -------- | -------- | +| 302.AI | `302ai` | 268 | CNY | OpenAI | +| AIHubMix | `aihubmix` | 476 | CNY | OpenAI | +| AI/ML API | `aimlapi` | 147 | USD | OpenAI | +| Aion Labs | `aion` | 5 | USD | OpenAI | +| Arcee AI | `arcee` | 7 | USD | OpenAI | +| Auriko | `auriko` | 181 | USD | OpenAI | +| Baseten | `baseten` | 9 | USD | OpenAI | +| Berget | `berget` | 7 | EUR | OpenAI | +| Cerebras | `cerebras` | 11 | USD | OpenAI | +| Chutes | `chutes` | 12 | USD | OpenAI | +| Clarifai | `clarifai` | 12 | USD | OpenAI | +| CloudFerro Sherlock | `cloudferro-sherlock` | 12 | EUR | OpenAI | +| Cortecs | `cortecs` | 105 | USD | OpenAI | +| Databricks | `databricks` | 29 | USD | OpenAI | +| DeepInfra | `deepinfra` | 88 | USD | OpenAI | +| DigitalOcean | `digitalocean` | 20 | USD | OpenAI | +| DInference | `dinference` | 6 | CNY | OpenAI | +| evroc | `evroc` | 8 | EUR | OpenAI | +| FastRouter | `fastrouter` | 120 | USD | OpenAI | +| Fireworks AI | `fireworks` | 10 | USD | OpenAI | +| FriendliAI | `friendli` | 8 | USD | OpenAI | +| GMI Cloud | `gmicloud` | 29 | USD | 
OpenAI | +| Google Vertex AI | `google-vertex` | 38 | USD | Google | +| Groq | `groq` | 12 | USD | OpenAI | +| HPC-AI Cloud | `hpc-ai` | 11 | CNY | OpenAI | +| Hyperbolic | `hyperbolic` | 11 | USD | OpenAI | +| Inference.net | `inferencenet` | 20 | USD | OpenAI | +| ๆŽฅๅฃ AI | `jiekou` | 73 | CNY | OpenAI | +| Kluster AI | `klusterai` | 12 | USD | OpenAI | +| LLM Gateway | `llmgateway` | 163 | USD | OpenAI | +| Martian | `martian` | 304 | USD | OpenAI | +| MegaNova | `meganova` | 63 | USD | OpenAI | +| Mixlayer | `mixlayer` | 5 | USD | OpenAI | +| MoArk AI | `moark` | โ€” | USD | OpenAI | +| Morph | `morph` | 7 | USD | OpenAI | +| NanoGPT | `nanogpt` | 547 | USD | OpenAI | +| Nebius | `nebius` | 23 | USD | OpenAI | +| NeuralWatt | `neuralwatt` | 14 | USD | OpenAI | +| Nous Research | `nousresearch` | 7 | USD | OpenAI | +| Novita AI | `novitaai` | 104 | USD | OpenAI | +| OrcaRouter | `orcarouter` | 120 | USD | OpenAI | +| OVHcloud AI Endpoints | `ovhcloud` | 12 | EUR | OpenAI | +| PPIO | `ppio` | 60 | CNY | OpenAI | +| Privatemode AI | `privatemode` | 5 | EUR | OpenAI | +| ไธƒ็‰› AI | `qiniu-ai` | โ€” | CNY | OpenAI | +| Regolo | `regolo` | โ€” | EUR | OpenAI | +| Requesty | `requesty` | 277 | USD | OpenAI | +| SambaNova | `sambanova` | 7 | USD | OpenAI | +| Scaleway | `scaleway` | 13 | EUR | OpenAI | +| SiliconFlow | `siliconflow` | 27 | USD | OpenAI | +| SiliconFlow CN | `siliconflow-cn` | 37 | CNY | OpenAI | +| SubModel | `submodel` | 6 | USD | OpenAI | +| ่…พ่ฎฏไบ‘ TokenHub | `tencent-tokenhub` | 19 | CNY | OpenAI | +| TextSynth | `textsynth` | 6 | USD | OpenAI | +| Together AI | `togetherai` | 24 | USD | OpenAI | +| Venice AI | `venice` | 75 | USD | OpenAI | +| Vultr Cloud Inference | `vultr` | 98 | USD | OpenAI | +| Wafer | `wafer` | 2 | USD | OpenAI | + +## ไบ‘ๅŽ‚ๅ•†ๆ‰˜็ฎกๆœๅŠก + +ๆไพ› AI ๆจกๅž‹ๆ‰˜็ฎกๆœๅŠก็š„ไธป่ฆไบ‘ๅŽ‚ๅ•†ใ€‚ + +| ๆไพ›ๅ•† | ID | ๆจกๅž‹ๆ•ฐ | ไบ‘ๅนณๅฐ | +| -------------------- | ---------------- | -----: | ------ | +| Amazon Bedrock | 
`amazon-bedrock` | 57 | AWS | +| Azure OpenAI Service | `azure` | โ€” | Azure | +| Google Vertex AI | `google-vertex` | 38 | GCP | + +## ไธญๅ›ฝๅธ‚ๅœบๆไพ›ๅ•† + +ไธป่ฆๆœๅŠกไธญๅ›ฝๅธ‚ๅœบใ€ไปฅไบบๆฐ‘ๅธ่ฎก่ดน็š„ๆไพ›ๅ•†ใ€‚ + +| ๆไพ›ๅ•† | ID | ๆจกๅž‹ๆ•ฐ | +| --------------- | ------------------ | -----: | +| 302.AI | `302ai` | 268 | +| AIHubMix | `aihubmix` | 476 | +| ้˜ฟ้‡Œไบ‘็™พ็‚ผ | `alibaba` | 62 | +| ็™พๅทๆ™บ่ƒฝ | `baichuan` | 11 | +| ็™พๅบฆ | `baidu` | 8 | +| ๅญ—่Š‚่ทณๅŠจ | `bytedance` | 5 | +| DInference | `dinference` | 6 | +| HPC-AI Cloud | `hpc-ai` | 11 | +| ่ฎฏ้ฃžๆ˜Ÿ็ซ | `iflytek` | 6 | +| ๆŽฅๅฃ AI | `jiekou` | 73 | +| MiniMax | `minimax` | 21 | +| Moonshot AI | `moonshotai` | 16 | +| PPIO | `ppio` | 60 | +| ไธƒ็‰› AI | `qiniu-ai` | โ€” | +| SiliconFlow CN | `siliconflow-cn` | 37 | +| ้˜ถ่ทƒๆ˜Ÿ่พฐ | `stepfun` | 31 | +| ่…พ่ฎฏไบ‘ TokenHub | `tencent-tokenhub` | 19 | +| ่…พ่ฎฏๆททๅ…ƒ | `tencent` | 14 | +| ๅฐ็ฑณ | `xiaomi` | 5 | +| ๆ™บ่ฐฑ AI | `zhipuai` | 20 | + +## ๆฌงๆดฒๅธ‚ๅœบๆไพ›ๅ•† + +ไปฅๆฌงๅ…ƒ่ฎก่ดนใ€ๆœๅŠกๆฌงๆดฒๅธ‚ๅœบ็š„ๆไพ›ๅ•†ใ€‚ + +| ๆไพ›ๅ•† | ID | ๆจกๅž‹ๆ•ฐ | +| --------------------- | --------------------- | -----: | +| Berget | `berget` | 7 | +| CloudFerro Sherlock | `cloudferro-sherlock` | 12 | +| evroc | `evroc` | 8 | +| OVHcloud AI Endpoints | `ovhcloud` | 12 | +| Privatemode AI | `privatemode` | 5 | +| Regolo | `regolo` | โ€” | +| Scaleway | `scaleway` | 13 | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹ๅฏนๆฏ”](model-comparison.md) โ€” ๆ——่ˆฐใ€้ซ˜ๆ€งไปทๆฏ”ใ€ๅ…่ดนๆจกๅž‹ +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ๅฎšไปทๅนถๆŽ’ๅฏนๆฏ” +- [ๅผ€ๆบๆƒ้‡ๆจกๅž‹](open-weights.md) โ€” 527 ไธชๅฏ่‡ช่กŒ่ฟ่กŒ็š„ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ +- [ๆ•ฐๆฎๆจกๅผ](data-schema.md) โ€” ๅฎŒๆ•ด YAML ๆจกๅผ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git 
a/docs/zh/quick-start.md b/docs/zh/quick-start.md new file mode 100644 index 00000000..1ea62047 --- /dev/null +++ b/docs/zh/quick-start.md @@ -0,0 +1,142 @@ +[English](../quick-start.md) | **中文** + +# 快速入门指南 + +30 秒内找到适合你需求的 AI 模型。 + +## 我想找最便宜的模型 + +→ 查看[定价对比](pricing-comparison.md),了解各提供商最便宜的模型和跨平台价格对比。 + +**支持工具调用的最便宜模型:** + +| 模型 | 提供商 | 输入(每百万 token) | 输出(每百万 token) | +| ---------------- | ----------- | -------------------: | -------------------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-235B-A22B | 阿里云 | $0.14 | $0.42 | +| Llama 4 Maverick | Together AI | $0.20 | $0.80 | + +## 我想找最强大的模型 + +→ 查看[模型对比](model-comparison.md),了解旗舰模型对比。 + +**顶级旗舰模型:** + +| 模型 | 上下文 | 工具调用 | 视觉 | 输入 $/1M | 输出 $/1M | +| -------------- | ------ | -------- | ---- | --------: | --------: | +| GPT-4.1 | 1M | ✅ | ✅ | $2.00 | $8.00 | +| Claude Opus 4 | 200K | ✅ | ✅ | $15.00 | $75.00 | +| Gemini 2.5 Pro | 1M | ✅ | ✅ | $1.25 | $10.00 | +| DeepSeek-R1 | 128K | ✅ | ❌ | $0.55 | $2.19 | + +## 我想找免费模型 + +→ 查看[模型对比](model-comparison.md#免费模型)获取完整列表。 + +**支持工具调用的免费模型:** + +- Google Gemini 2.0 Flash(通过 Google AI Studio) +- Cloudflare Workers AI 模型(边缘推理) +- Chutes、Cerebras、Groq 免费层上的各种模型 + +## 我想找最大上下文窗口 + +→ 查看[模型对比](model-comparison.md#最大上下文窗口)获取完整列表。 + +| 模型 | 上下文窗口 | +| --------------- | ----------: | +| Llama 4 Scout | 10M tokens | +| Gemini 2.5 Pro | 1M tokens | +| GPT-4.1 | ~1M tokens | +| Claude Sonnet 4 | 200K tokens | + +## 我想浏览所有提供商 + +→
查看[提供商概览](providers.md),95 个提供商按类型分类。 + +## 我想编程使用数据 + +### npm 包 + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 个模型 JSON +import type { Model } from "ai-models"; // TypeScript 类型 +``` + +### 下载数据文件 + +```bash +# JSON — 完整元数据(2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV — 适合 Excel/Google Sheets 的表格(560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +### CDN 访问(无需安装) + +编译后的 JSON 可通过 [jsDelivr CDN](https://www.jsdelivr.com/package/npm/ai-models) 访问 — 无需下载或安装: + +```bash +# 始终最新,支持 CORS,可在浏览器中使用 +curl -s https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +``` + +```html + +``` + +### 从源码 + +```bash +# 安装依赖 +npm install + +# 计算目录统计 +npx tsx scripts/stats.ts + +# 验证所有模型数据 +npx tsx scripts/validate.ts +``` + +```typescript +import { ModelSchema } from "./types/schemas"; +import { parse } from "yaml"; +import { readFileSync } from "fs"; + +// 加载并验证模型 +const raw = readFileSync("providers/openai/models/gpt-4.1.yaml", "utf-8"); +const model = ModelSchema.parse(parse(raw)); + +console.log(model.pricing); // { input: 2, output: 8, cache_read: 0.5 } +console.log(model.limit); // { context: 1047576, output: 32768 } +``` + +## 我想添加新的提供商 + +→ 查看[贡献指南](../../CONTRIBUTING.md)和[数据采集指南](data-acquisition.md)。 + +## 我想了解数据格式 + +→ 查看[数据 Schema 参考](data-schema.md),了解完整的 YAML Schema。 + +## 相关文档 + +- [模型选择指南](model-selection.md) — 选择模型的决策框架 +- [常见问题](faq.md) — 关于目录的常见问题 +-
[API 与编程访问](api.md) — 下载和使用数据 +- [代码示例](code-examples.md) — TypeScript、Python、Go、Rust 实用示例 +- [术语表](glossary.md) — 关键术语和定义 + +--- + +数据来源于 [AI Models Catalog](https://github.com/i-need-token/ai-models) — 结构化 YAML,包含 95 个提供商 4,587+ 模型的定价、上下文窗口和能力信息。 diff --git a/docs/zh/reasoning-models.md b/docs/zh/reasoning-models.md new file mode 100644 index 00000000..fd48dbcb --- /dev/null +++ b/docs/zh/reasoning-models.md @@ -0,0 +1,104 @@ +[English](../reasoning-models.md) | **中文** + +# AI 推理模型 + +本目录中有 1,306 个模型支持推理(链式思维 / 扩展思考)。本页重点介绍最有能力和最具性价比的推理模型。 + +> 所有数据来自一手 API 和文档。"推理"表示模型可以在回答前生成扩展的链式思维。 + +## 快速统计 + +| 能力 | 推理模型数 | +| -------------------- | ---------: | +| 总推理模型 | 1,306 | +| 唯一模型 ID | 868 | +| 支持工具调用 | 1,076 | +| 支持视觉(图像输入) | 697 | +| 开源权重 | 119 | + +## 按上下文排序的顶级推理模型 + +最大上下文的推理模型 — 适合复杂多步任务: + +| 模型 | 上下文 | 工具调用 | 视觉 | 输入 $/1M | 提供商数 | +| ----------------------------- | ------ | -------- | ---- | --------: | -------: | +| Grok 4 Fast Reasoning | 2M | ✅ | ✅ | $0.20 | 2 | +| Grok 4.1 Fast Reasoning | 2M | ✅ | ✅ | $0.20 | 2 | +| Grok 4.20 | 2M | ✅ | ✅ | $1.42 | 1 | +| GPT-5.4 | 1M | ✅ | ✅ | $2.50 | 4 | +| GPT-5.5 | 1M | ✅ | ✅ | $5.00 | 4 | +| Gemini 2.5 Pro | 1M | ✅ | ✅ | $1.25 | 4 | +| Gemini 2.5 Flash | 1M | ✅ | ✅ | $0.15 | 3 | +| Gemini 2.5 Flash Lite | 1M | ✅ | ✅ | $0.10 | 3 | +| Gemini 3 Flash Preview | 1M | ✅ | ✅ | $0.50 | 4 | +| Gemini 3.1 Flash Lite Preview | 1M | ✅ | ✅ | $0.25 | 3 | +| DeepSeek Reasoner | 1M | ✅ | ✅ | $0.43 | 1 | + +##
最便宜的推理模型 + +推理能力的最佳性价比: + +| 模型 | 提供商 | 输入 $/1M | 输出 $/1M | 上下文 | +| --------------------- | --------- | --------: | --------: | ------ | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | +| GPT-5 Nano | Requesty | $0.025 | $0.20 | 400K | +| Qwen 3.5 4B | Auriko | $0.03 | $0.15 | 262K | +| Qwen 3.5 4B | DeepInfra | $0.03 | $0.15 | 262K | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | + +## 最佳推理 + 视觉模型 + +能对图像进行推理的模型 — 适合视觉分析: + +| 模型 | 上下文 | 输入 $/1M | 提供商数 | +| --------------------- | ------ | --------: | -------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5(开源权重) | 1M | varies | 2 | + +## 开源权重推理模型 + +119 个开源权重模型支持推理 — 可在自己的硬件上运行: + +| 模型 | 上下文 | 工具调用 | 视觉 | 提供商数 | +| ----------------------- | ------ | -------- | ---- | -------: | +| MiMo V2.5 Pro | 1M | ✅ | ❌ | 2 | +| MiMo V2.5 | 1M | ✅ | ✅ | 2 | +| DeepSeek-V4 Pro | 1M | ✅ | ❌ | 1 | +| Qwen3 Next 80B Thinking | 262K | ✅ | ❌ | 4 | +| Kimi K2.6 | 262K | ✅ | ✅ | 4 | +| Trinity Large Thinking | 262K | ✅ | ❌ | 1 | +| Nemotron 3 120B | 262K | ✅ | ❌ | 1 | +| Qwen3.5 397B A17B | 262K | ✅ | ❌ | 2 | + +## 要点总结 + +- **1,306 个推理模型**,涵盖 868 个唯一模型 ID — 最大的推理模型目录 +- **Grok 4 Fast Reasoning** 以 2M 上下文和 $0.20/1M 输入价格提供最佳性价比 +- **Gemini 2.5 Flash Lite**
ๆ˜ฏๆœ€ไพฟๅฎœ็š„ 1M ไธŠไธ‹ๆ–‡ๆŽจ็†ๆจกๅž‹๏ผˆ$0.10/1M๏ผ‰ +- **MiMo V2.5** ๆ˜ฏๅ”ฏไธ€็ป“ๅˆ 1M ไธŠไธ‹ๆ–‡ใ€ๆŽจ็†ๅ’Œ่ง†่ง‰็š„ๅผ€ๆบๆƒ้‡ๆจกๅž‹ +- **697 ไธชๆŽจ็†ๆจกๅž‹**ๅŒๆ—ถๆ”ฏๆŒ่ง†่ง‰ โ€” ๆœ€ๅธธ่ง็š„็ป„ๅˆ่ƒฝๅŠ› +- ๅฐๅž‹ๆŽจ็†ๆจกๅž‹๏ผˆQwen 3.5 0.8Bโ€“4B๏ผ‰ๆฏ 1M tokens ไป…้œ€ $0.01โ€“$0.03 + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๆจกๅž‹ +- [็ป“ๆž„ๅŒ–่พ“ๅ‡บ](structured-output.md) โ€” 829 ไธช JSON ๆจกๅผๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹๏ผŒ้ƒจๅˆ†ๆ”ฏๆŒๆŽจ็† +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ +- [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](openai-alternatives.md) โ€” GPT-4 ็บงๅˆซๆŽจ็†ๆ›ฟไปฃ +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 ไธชๅทฅๅ…ท่ฐƒ็”จ+ๆŽจ็†ๆจกๅž‹ +- [ไปฃ็ ๆจกๅž‹](code-models.md) โ€” 189 ไธชไปฃ็ ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/small-language-models.md b/docs/zh/small-language-models.md new file mode 100644 index 00000000..91563386 --- /dev/null +++ b/docs/zh/small-language-models.md @@ -0,0 +1,126 @@ +# ๅฐ่ฏญ่จ€ๆจกๅž‹ (SLM) ๆŒ‡ๅ— + +> 2,000+ ๅฐ่ฏญ่จ€ๆจกๅž‹ๅฎŒๆ•ดๆŒ‡ๅ—๏ผŒ้€‚็”จไบŽ่พน็ผ˜้ƒจ็ฝฒใ€็งปๅŠจๅบ”็”จๅ’ŒไฝŽๆˆๆœฌ็”Ÿไบง็Žฏๅขƒใ€‚ + +## ไป€ไนˆๆ˜ฏๅฐ่ฏญ่จ€ๆจกๅž‹๏ผŸ + +ๅฐ่ฏญ่จ€ๆจกๅž‹๏ผˆSLM๏ผ‰ๆ˜ฏๅ‚ๆ•ฐ้‡ๅฐ‘ไบŽ็บฆ 100 ไบฟ็š„ AI ๆจกๅž‹๏ผŒไธ“ไธบ้ซ˜ๆ•ˆใ€ไฝŽๅปถ่ฟŸๅ’Œ่ต„ๆบๅ—้™็กฌไปถ้ƒจ็ฝฒ่€Œ่ฎพ่ฎกใ€‚ๅฝ“ๆˆๆœฌใ€้€Ÿๅบฆๆˆ–้š็งๆ˜ฏๅ…ณ้”ฎๅ› ็ด ๆ—ถ๏ผŒๅฎƒไปฌๆ˜ฏๅคงๅž‹ๅ‰ๆฒฟๆจกๅž‹็š„ๅฎž็”จๆ›ฟไปฃๆ–นๆกˆใ€‚ + +### ๆ ธๅฟƒไผ˜ๅŠฟ + +| ๅ› ็ด  | ๅฐๆจกๅž‹ (SLM) | ๅคงๆจกๅž‹ (LLM) | +| ---------------- | ---------------- | -------------- | +| ๆฏ 1M token ๆˆๆœฌ | $0.01 โ€“ $0.20 | $1 โ€“ $40 | +| ๅปถ่ฟŸ๏ผˆ้ฆ– token๏ผ‰ | 50 โ€“ 200ms | 200 โ€“ 2000ms | +| ้ƒจ็ฝฒๆ–นๅผ | 
ๆœฌๅœฐใ€่พน็ผ˜ใ€ไบ‘็ซฏ | ไป…ไบ‘็ซฏ | +| ้š็งไฟๆŠค | ๆ•ฐๆฎ็•™ๅœจๆœฌๅœฐ | ๆ•ฐๆฎๅ‘้€ๅˆฐไบ‘็ซฏ | +| ๅฎšๅˆถๅŒ– | ๆ˜“ไบŽๅพฎ่ฐƒ | ๅพฎ่ฐƒๆˆๆœฌ้ซ˜ | +| ๅคๆ‚ๆŽจ็† | ้€‚ๅˆ็ฎ€ๅ•ไปปๅŠก | ๅคๆ‚ไปปๅŠกๆ›ดไผ˜ | + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ------------ | ----- | +| ๅฐๆจกๅž‹ๆ€ปๆ•ฐ | 2,002 | +| ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ | 928 | +| ๆ”ฏๆŒๆŽจ็† | 557 | +| ๅ…่ดนๅฐๆจกๅž‹ | 48 | +| ไธ€ๆ‰‹ๆไพ›ๅ•† | 689 | + +## ๆŒ‰ไฝฟ็”จๅœบๆ™ฏ้€‰ๆ‹ฉ + +### ไฝŽๆˆๆœฌ AI Agent + +้œ€่ฆๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็† + ไฝŽๅปถ่ฟŸ็š„ๅคง่ง„ๆจก Agent ๅทฅไฝœๆตใ€‚ + +- **ๆœ€ไฝณๆ€งไปทๆฏ”**๏ผšling-2.6-flash ($0.01/$0.03/M) โ€” ๆœ€ไพฟๅฎœ็š„ TC ๆจกๅž‹๏ผŒ262K ไธŠไธ‹ๆ–‡ +- **ๅ‡่กกไน‹้€‰**๏ผšGPT-4.1-mini ($0.40/$1.60/M) โ€” ๅฏ้  + 1M ไธŠไธ‹ๆ–‡ +- **ๅ…่ดน**๏ผšGemma 4 27B IT โ€” ๅ…่ดน่ง†่ง‰ + ๅทฅๅ…ท่ฐƒ็”จ + +### ๆœฌๅœฐ / ่พน็ผ˜้ƒจ็ฝฒ + +้œ€่ฆๅœจๆ‰‹ๆœบใ€IoT ่ฎพๅค‡ๆˆ–่พน็ผ˜ๆœๅŠกๅ™จไธŠ่ฟ่กŒ็š„ๆจกๅž‹ใ€‚ + +- **่ถ…็ดงๅ‡‘**๏ผšQwen3.5 0.8B โ€” ๅฐไฝ“็งฏๆŽจ็†ๆจกๅž‹ +- **ๅ‡่กก**๏ผšQwen3 4B ($0.03/$0.15/M) โ€” ๅผ€ๆบ + ๆŽจ็† +- **่ง†่ง‰**๏ผšGemma 4 27B IT โ€” ๅ…่ดน + ่ง†่ง‰ + ๅทฅๅ…ท่ฐƒ็”จ + +### ไปฃ็ ่กฅๅ…จ + +้œ€่ฆๅทฅๅ…ท่ฐƒ็”จ + ็ป“ๆž„ๅŒ–่พ“ๅ‡บ็š„็ผ–็จ‹่พ…ๅŠฉใ€‚ + +- **ๆœ€ไพฟๅฎœ**๏ผšbdc-coder ($0.01/$0.01/M) โ€” ๆœ€ไพฟๅฎœ็š„็ผ–็จ‹ๆจกๅž‹ +- **ๅ‡่กก**๏ผšGPT-4.1-nano ($0.10/$0.40/M) โ€” ๅฟซ้€Ÿ + ไพฟๅฎœ +- **ๅผ€ๆบ**๏ผšQwen3 4B ($0.03/$0.15/M) โ€” ๆŽจ็† + ๅทฅๅ…ท่ฐƒ็”จ + +### ๆ•ฐๅญฆ & ๆŽจ็† + +้œ€่ฆๆŽจ็†่ƒฝๅŠ›็š„้€ๆญฅ้—ฎ้ข˜่งฃๅ†ณใ€‚ + +- **ๅ…่ดน**๏ผšDeepSeek R1 Distill Llama 8B โ€” ๅ…่ดนๆŽจ็†ๆจกๅž‹ +- **ๆœ€ไพฟๅฎœ**๏ผšQwen3.5 0.8B ($0.01/$0.05/M) โ€” ๆœ€ไพฟๅฎœ็š„ๆŽจ็†ๆจกๅž‹ +- **ๅ‡่กก**๏ผšQwen3.5 4B ($0.03/$0.15/M) โ€” ๅผ€ๆบๆŽจ็† + +### ๅฏน่ฏ & RAG + +้œ€่ฆๅคงไธŠไธ‹ๆ–‡ + ไฝŽๆˆๆœฌ็š„ๆฃ€็ดขๅขžๅผบ็”Ÿๆˆใ€‚ + +- **ๆœ€ไพฟๅฎœ**๏ผšQwen3 4B ($0.03/$0.15/M) โ€” ไพฟๅฎœ + 262K ไธŠไธ‹ๆ–‡ +- **ๅฟซ้€Ÿ**๏ผšGPT-4.1-nano ($0.10/$0.40/M) โ€” ๅฟซ้€Ÿ + ไพฟๅฎœ +- **ๅคงไธŠไธ‹ๆ–‡**๏ผšGemini 2.5 Flash ($0.15/$0.60/M) โ€” 1M ไธŠไธ‹ๆ–‡ + ๆŽจ็† + +## ๆœ€ไพฟๅฎœ็š„ๅทฅๅ…ท่ฐƒ็”จๅฐๆจกๅž‹ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | 
่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ไธŠไธ‹ๆ–‡ | ๆŽจ็† | +| ------------------------------------------- | --------- | -------- | -------- | ------ | ---- | +| ling-2.6-flash | ling | $0.01 | $0.03 | 262K | โ€” | +| klusterai--Meta-Llama-3.1-8B-Instruct-Turbo | klusterai | $0.015 | $0.02 | 131K | โ€” | +| granite-4.0-h-micro | ibm | $0.017 | $0.112 | 131K | โ€” | +| llama-3.1-8b-instruct--fp-16 | fireworks | $0.02 | $0.03 | 131K | โ€” | +| schematron-3b | fireworks | $0.02 | $0.05 | 131K | โ€” | + +## ๅ…่ดนๅฐ่ฏญ่จ€ๆจกๅž‹ + +48 ไธชๅ…่ดนๅฐๆจกๅž‹๏ผŒ้€‚ๅˆๅŽŸๅž‹ๅผ€ๅ‘ๅ’Œๆต‹่ฏ•๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| ------------------------------ | -------- | ------ | -------- | ---- | +| deepseek-r1-distill-llama-8b | cerebras | 131K | โ€” | โœ“ | +| llama-4-scout-17b-16e-instruct | cerebras | 131K | โœ“ | โ€” | +| qwen-2.5-32b | cerebras | 131K | โœ“ | โ€” | +| gemma-4-26b-a4b-it | auriko | 262K | โœ“ | โ€” | +| glm-4.5-flash | auriko | 200K | โœ“ | โ€” | + +## ๆ”ฏๆŒๆŽจ็†็š„ๅฐๆจกๅž‹ + +557 ไธชๆ”ฏๆŒๆŽจ็†่ƒฝๅŠ›็š„ๅฐๆจกๅž‹๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | +| ---------------------------- | --------- | -------- | -------- | ------ | -------- | +| qwen3.5-0.8b | qwen | $0.01 | $0.05 | 262K | โ€” | +| qwen3.5-2b | qwen | $0.02 | $0.10 | 262K | โ€” | +| qwen--qwen3-4b-fp8 | fireworks | $0.03 | $0.03 | 128K | โ€” | +| qwen3.5-4b | qwen | $0.03 | $0.15 | 262K | โ€” | +| deepseek-r1-distill-llama-8b | cerebras | ๅ…่ดน | ๅ…่ดน | 131K | โ€” | + +## ๅฆ‚ไฝ•้€‰ๆ‹ฉๅˆ้€‚็š„ๅฐๆจกๅž‹ + +1. **ๆ˜Ž็กฎ็บฆๆŸๆกไปถ**๏ผš้ข„็ฎ—ใ€ๅปถ่ฟŸ่ฆๆฑ‚ใ€้ƒจ็ฝฒ็›ฎๆ ‡๏ผˆไบ‘็ซฏ vs ่พน็ผ˜๏ผ‰ +2. **็กฎๅฎšๆ‰€้œ€่ƒฝๅŠ›**๏ผšๅทฅๅ…ท่ฐƒ็”จ๏ผŸๆŽจ็†๏ผŸ่ง†่ง‰๏ผŸ็ป“ๆž„ๅŒ–่พ“ๅ‡บ๏ผŸ +3. **ๆฃ€ๆŸฅไธŠไธ‹ๆ–‡็ช—ๅฃ**๏ผš้œ€่ฆๅค„็†ๅคšๅฐ‘ๆ–‡ๆœฌ๏ผŸ +4. **ๅฏนๆฏ”ๅฎšไปท**๏ผšไฝฟ็”จ[ไบคไบ’ๅผ็›ฎๅฝ•](https://i-need-token.github.io/ai-models/)ๆˆ–[ๅฎšไปท่ฎก็ฎ—ๅ™จ](https://i-need-token.github.io/ai-models/ai-model-pricing-calculator.html) +5. 
**็”จไฝ ็š„ๆ•ฐๆฎๆต‹่ฏ•**๏ผšๅฐๆจกๅž‹ๅœจ็‰นๅฎš้ข†ๅŸŸ็š„่ดจ้‡ๅทฎๅผ‚ๅพˆๅคง + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅ…่ดนๆจกๅž‹ๆŒ‡ๅ—](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ +- [ๅทฅๅ…ท่ฐƒ็”จๆŒ‡ๅ—](tool-calling.md) โ€” 2,350 ไธชๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹ๆŒ‡ๅ—](reasoning-models.md) โ€” 1,306 ไธชๆŽจ็†ๆจกๅž‹ +- [ๅฎšไปทๅฏนๆฏ”](pricing-comparison.md) โ€” ๆ‰พๅˆฐๆœ€ไพฟๅฎœ็š„ๆจกๅž‹ +- [ไธŠไธ‹ๆ–‡็ช—ๅฃ](context-windows.md) โ€” ๆœ€ๅคงไธŠไธ‹ๆ–‡็ช—ๅฃ +- [ๆจกๅž‹้€‰ๆ‹ฉ้€ŸๆŸฅ่กจ](model-selection-cheatsheet.md) โ€” ๅฟซ้€Ÿๅ‚่€ƒๆŒ‡ๅ— +- [ๅฐ่ฏญ่จ€ๆจกๅž‹ๅฏนๆฏ”](https://i-need-token.github.io/ai-models/small-language-models.html) โ€” ไบคไบ’ๅผ้กต้ข + +--- + +_ๆ•ฐๆฎๆฅ่‡ช [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ไป…ไฝฟ็”จไธ€ๆ‰‹ๆ•ฐๆฎ๏ผŒ่‡ชๅŠจๆ›ดๆ–ฐใ€‚_ diff --git a/docs/zh/small-models.md b/docs/zh/small-models.md new file mode 100644 index 00000000..a2373da3 --- /dev/null +++ b/docs/zh/small-models.md @@ -0,0 +1,80 @@ +# ๅฐๅž‹ไธŽ่พน็ผ˜ๆจกๅž‹ + +[English](../small-models.md) + +ไธ“ไธบ**่พน็ผ˜้ƒจ็ฝฒใ€่ฎพๅค‡็ซฏๆŽจ็†ๅ’Œ่ต„ๆบๅ—้™็Žฏๅขƒ**่ฎพ่ฎก็š„ AI ๆจกๅž‹ โ€” ๅ‚ๆ•ฐ้‡ๅœจ ~16B ไปฅไธ‹็š„ๆจกๅž‹๏ผŒๅฏๅœจๆถˆ่ดน็บง็กฌไปถใ€็งปๅŠจ่ฎพๅค‡ๅ’ŒๅตŒๅ…ฅๅผ็ณป็ปŸไธŠ่ฟ่กŒใ€‚ + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ไธบไป€ไนˆๅฐๅž‹ๆจกๅž‹ๅพˆ้‡่ฆ + +ๅฐๅž‹ๆจกๅž‹ไฝฟ AI ๅœจไบ‘่ฟžๆŽฅๆœ‰้™ๆˆ–ๅปถ่ฟŸๅ…ณ้”ฎ็š„ๅœบๆ™ฏไธญๆˆไธบๅฏ่ƒฝ๏ผš + +- **่ฎพๅค‡็ซฏๆŽจ็†** โ€” ๅœจๆ‰‹ๆœบๅ’Œ็ฌ”่ฎฐๆœฌ็”ต่„‘ไธŠๆ— ้œ€ไบ’่”็ฝ‘่ฟ่กŒ AI +- **่พน็ผ˜่ฎก็ฎ—** โ€” ้ƒจ็ฝฒๅœจ IoT ่ฎพๅค‡ใ€ๆœบๅ™จไบบๅ’Œ่ฝฆ่พ†ไธญ +- **ไฝŽๅปถ่ฟŸ** โ€” ไบš 100ms ๅ“ๅบ”ๆ—ถ้—ด๏ผŒ้€‚็”จไบŽๅฎžๆ—ถๅบ”็”จ +- **ๆˆๆœฌๆ•ˆ็›Š** โ€” ่ฟ่กŒๆˆๆœฌๆ›ดไฝŽ๏ผŒๅฐคๅ…ถๆ˜ฏๅœจๅคง่ง„ๆจกๅœบๆ™ฏ +- **้š็ง** โ€” ๆ•ฐๆฎไธ็ฆปๅผ€่ฎพๅค‡ +- **็ฆป็บฟ่ƒฝๅŠ›** โ€” ๆ— ้œ€็ฝ‘็ปœ่ฟžๆŽฅๅณๅฏไฝฟ็”จ็š„ AI + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ---------------- | ---- | +| ๅฐๅž‹/่พน็ผ˜ๆจกๅž‹ | 1153 | +| ๆไพ›ๅ•† | 63 | +| ๅ…่ดนๅฐๅž‹ๆจกๅž‹ | 30 | +| ๅผ€ๆบๆƒ้‡ๅฐๅž‹ๆจกๅž‹ | 272 | +| ๅธฆๅทฅๅ…ท่ฐƒ็”จ | 434 | +| 
ๅธฆๆŽจ็†่ƒฝๅŠ› | 250 | + +## ๆไพ›ๅ•† + +`302ai`ใ€`aihubmix`ใ€`aimlapi`ใ€`aion`ใ€`alibaba`ใ€`amazon-bedrock`ใ€`auriko`ใ€`baichuan`ใ€`berget`ใ€`bytedance`ใ€`cerebras`ใ€`chutes`ใ€`clarifai`ใ€`cloudferro-sherlock`ใ€`cloudflare`ใ€`cortecs`ใ€`databricks`ใ€`deepinfra`ใ€`digitalocean`ใ€`evroc`ใ€`fastrouter`ใ€`fireworks`ใ€`friendli`ใ€`gmicloud`ใ€`google`ใ€`google-vertex`ใ€`groq`ใ€`hpc-ai`ใ€`hyperbolic`ใ€`inferencenet`ใ€`jiekou`ใ€`klusterai`ใ€`llmgateway`ใ€`martian`ใ€`meganova`ใ€`meta`ใ€`microsoft`ใ€`mistral`ใ€`mixlayer`ใ€`moonshotai`ใ€`morph`ใ€`nanogpt`ใ€`nebius`ใ€`neuralwatt`ใ€`nousresearch`ใ€`novitaai`ใ€`openrouter`ใ€`orcarouter`ใ€`ovhcloud`ใ€`ppio`ใ€`privatemode`ใ€`requesty`ใ€`sambanova`ใ€`scaleway`ใ€`siliconflow`ใ€`siliconflow-cn`ใ€`submodel`ใ€`tencent`ใ€`textsynth`ใ€`togetherai`ใ€`venice`ใ€`vultr`ใ€`wafer` + +## ๅ…่ดนๅฐๅž‹ๆจกๅž‹ + +ๅ…่ดนๅฐๅž‹ๆจกๅž‹ โ€” ้›ถๆˆๆœฌ่พน็ผ˜ AIใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ $/M | ่ƒฝๅŠ› | +| ---------------------------------------------------- | ---------- | ------ | -------- | -------- | -------- | +| nvidia--nemotron-3-super-120b-a12b--free | openrouter | 1M | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-26b-a4b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| google--gemma-4-31b-it--free | openrouter | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-26b-a4b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| gemma-4-31b-it | auriko | 262K | Free | Free | ๐Ÿ”ง ๐Ÿง  ๐Ÿ“‹ | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | 256K | Free | Free | ๐Ÿ”ง ๐Ÿง  | +| gemma-3-4b-it | google | 131K | Free | Free | | +| gemma-3-12b-it | google | 131K | Free | Free | | +| gemma-3-27b-it | google | 131K | Free | Free | | +| gemma-3n-E2B-it | google | 131K | Free | Free | | + +## ๆœ€ไพฟๅฎœๅฐๅž‹ๆจกๅž‹ + +็”Ÿไบง็Žฏๅขƒๅฐๅž‹ๅบ”็”จ็š„ๆœ€ไฝณๆ€งไปทๆฏ”ๆจกๅž‹ใ€‚ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/M | ่พ“ๅ‡บ 
$/M | ่ƒฝๅŠ› | +| ----------------------------------------------- | -------- | ------ | -------- | -------- | ----- | +| llama3-groq-8b-8192-tool-use-preview | aihubmix | 0 | $9.5e-05 | $9.5e-05 | | +| mistralai--mistral-7b-instruct--free | aihubmix | 0 | $0.001 | $0.001 | | +| deepseek-ai--deepseek-r1-distill-llama-8b | aihubmix | 0 | $0.005 | $0.005 | | +| deepseek-ai--deepseek-r1-distill-qwen-7b | aihubmix | 0 | $0.005 | $0.005 | | +| deepseek-ai--deepseek-r1-distill-qwen-1.5b | aihubmix | 0 | $0.005 | $0.005 | | +| ernie-4.5-0.3b | aihubmix | 0 | $0.0068 | $0.0272 | ๐Ÿ”ง ๐Ÿ“‹ | +| google--gemma-2-9b-it--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.2-3b-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.2-11b-vision-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | +| meta-llama--llama-3.1-8b-instruct--free | aihubmix | 0 | $0.01 | $0.01 | | + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๅผ€ๆบๆƒ้‡](open-weights.md) โ€” 527 ไธชๅผ€ๆบๆƒ้‡ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹ๆŒ‰่ƒฝๅŠ›ๅˆ†็ฑป +- [่Šๅคฉๆจกๅž‹](chat-models.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„่Šๅคฉๆจกๅž‹ +- [ไปฃ็ ๆจกๅž‹](code-models.md) โ€” 189 ไธชไปฃ็ ๆจกๅž‹ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๆไพ›ๅ•†ๅฏนๆฏ”](provider-comparison.md) โ€” ๅ‰ 30 ไธชๆไพ›ๅ•† + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/structured-output.md b/docs/zh/structured-output.md new file mode 100644 index 00000000..cd0c9319 --- /dev/null +++ b/docs/zh/structured-output.md @@ -0,0 +1,84 @@ +[English](../structured-output.md) | **ไธญๆ–‡** + +# AI ็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹๏ผˆJSON ๆจกๅผ๏ผ‰ + +ๆœฌ็›ฎๅฝ•ไธญๆœ‰ 829 ไธชๆจกๅž‹ๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บ โ€” ่ƒฝๅคŸๆŒ‰็…งๆŒ‡ๅฎš็š„ JSON Schema ็”Ÿๆˆๅ›žๅคใ€‚่ฟ™ๅฏนไบŽๆž„ๅปบๅฏ้ ็š„ AI ้ฉฑๅŠจ 
APIใ€ๆ•ฐๆฎ็ฎก้“ๅ’Œ่‡ชๅŠจๅŒ–่‡ณๅ…ณ้‡่ฆใ€‚ + +> ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๆ–‡ๆกฃใ€‚"็ป“ๆž„ๅŒ–่พ“ๅ‡บ"่กจ็คบๆจกๅž‹ๅฏไปฅๅœจๅ›žๅคไธญๅผบๅˆถ้ตๅพช JSON Schema๏ผˆไนŸ็งฐไธบ JSON ๆจกๅผใ€็บฆๆŸ่งฃ็ ๆˆ–ๅผ•ๅฏผ็”Ÿๆˆ๏ผ‰ใ€‚ + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ่ƒฝๅŠ› | ็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹ๆ•ฐ | +| ---------------- | ---------------: | +| ๆ€ป็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹ | 829 | +| ๅ”ฏไธ€ๆจกๅž‹ ID | 704 | +| ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ | 749 | +| ๆ”ฏๆŒๆŽจ็† | 473 | +| ๆ”ฏๆŒ่ง†่ง‰ | 411 | +| ๅผ€ๆบๆƒ้‡ | 24 | + +## ๆœ€ไพฟๅฎœ็š„็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹ + +็”Ÿๆˆๅฏ้  JSON ๅ›žๅค็š„ๆœ€ไฝณๆ€งไปทๆฏ”๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| --------------------- | ---------- | --------: | --------: | ------ | -------- | ---- | +| Ernie 4.5 0.3B | AIHubMix | $0.0068 | $0.0272 | โ€” | โœ… | โŒ | +| Ling 2.6 Flash | OpenRouter | $0.01 | $0.03 | 262K | โœ… | โŒ | +| Qwen3 VL Flash | AIHubMix | $0.0103 | $0.103 | โ€” | โœ… | โŒ | +| Llama 3.1 8B Instruct | Auriko | $0.02 | $0.03 | 131K | โœ… | โŒ | +| Mistral Nemo | OpenRouter | $0.02 | $0.02 | โ€” | โœ… | โŒ | +| Doubao Seed 1.6 Flash | AIHubMix | $0.022 | $0.022 | โ€” | โœ… | โŒ | +| GPT-5 Nano | AIHubMix | $0.025 | $0.20 | โ€” | โœ… | โœ… | +| GPT-OSS 20B | NeuralWatt | $0.03 | $0.03 | โ€” | โœ… | โœ… | +| Granite 4.0 H Micro | Cloudflare | $0.017 | $0.112 | 131K | โœ… | โŒ | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | โœ… | + +## ๅ…่ดน็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹ + +24 ไธชๆจกๅž‹ๆไพ›ๅ…่ดน็ป“ๆž„ๅŒ–่พ“ๅ‡บ โ€” ้€‚ๅˆๅŽŸๅž‹่ฎพ่ฎก๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| ------------------------- | ---------- | ------ | -------- | ---- | +| Ernie 4.5 0.3B | AIMLAPI | โ€” | โœ… | โŒ | +| Gemma 4 26B A4B IT | Auriko | โ€” | โœ… | โœ… | +| Gemma 4 31B IT | Auriko | โ€” | โœ… | โŒ | +| Qwen3 Omni 30B A3B | NovitaAI | โ€” | โœ… | โœ… | +| Dolphin Mistral 24B | OpenRouter | โ€” | โœ… | โŒ | +| Gemma 4 26B A4B IT (free) | OpenRouter | โ€” | โœ… | โœ… | +| 
Gemma 4 31B IT (free) | OpenRouter | โ€” | โœ… | โŒ | + +## ๆœ€ไฝณ็ป“ๆž„ๅŒ–่พ“ๅ‡บ + ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็† + +้€‚ๅˆ้œ€่ฆ่ฟ”ๅ›ž็ป“ๆž„ๅŒ–ๆ•ฐๆฎใ€่ฐƒ็”จๅทฅๅ…ทๅ’ŒๆŽจ็†็š„ AI ไปฃ็†๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | ๆไพ›ๅ•†ๆ•ฐ | +| --------------------- | ------ | --------: | -------- | ---- | -------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | โœ… | โœ… | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | โœ… | โœ… | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | โœ… | โœ… | 4 | +| GPT-5.4 | 1M | $2.50 | โœ… | โœ… | 4 | +| DeepSeek Reasoner | 1M | $0.43 | โœ… | โœ… | 1 | +| GPT-5 Nano | โ€” | $0.025 | โœ… | โœ… | 4 | + +## ่ฆ็‚นๆ€ป็ป“ + +- **829 ไธช็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹** โ€” ๆœ€ๅคง็š„ JSON ๆจกๅผๆจกๅž‹็›ฎๅฝ• +- **749 ไธชๆจกๅž‹**ๅŒๆ—ถๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บๅ’Œๅทฅๅ…ท่ฐƒ็”จ โ€” ๅฎŒ็พŽ้€‚ๅˆ AI ไปฃ็† +- **24 ไธชๅ…่ดนๆจกๅž‹**ๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บ โ€” ้›ถๆˆๆœฌๅผ€ๅง‹ๆž„ๅปบ +- **Gemini 2.5 Flash** ๆ˜ฏๆœ€ไฝณๆ€งไปทๆฏ”๏ผš1M ไธŠไธ‹ๆ–‡ใ€็ป“ๆž„ๅŒ–่พ“ๅ‡บใ€ๅทฅๅ…ท่ฐƒ็”จๅ’ŒๆŽจ็†๏ผŒไป… $0.15/1M +- ๅฐๅž‹ๆจกๅž‹๏ผˆErnie 4.5 0.3Bใ€Ling 2.6 Flash๏ผ‰ๅธฆ็ป“ๆž„ๅŒ–่พ“ๅ‡บไป…้œ€ $0.01/1M +- 90% ็š„็ป“ๆž„ๅŒ–่พ“ๅ‡บๆจกๅž‹ๅŒๆ—ถๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ โ€” ่ฟ™ไธค็ง่ƒฝๅŠ›็›ธ่พ…็›ธๆˆ + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹](tool-calling.md) โ€” 2,350 ไธชๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ็š„ๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆ”ฏๆŒๆŽจ็†็š„ๆจกๅž‹ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹๏ผŒ้ƒจๅˆ†ๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 ไธชๅทฅๅ…ท่ฐƒ็”จ+ๆŽจ็†ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/tool-calling.md b/docs/zh/tool-calling.md new file mode 100644 index 00000000..5e35f86a --- /dev/null 
+++ b/docs/zh/tool-calling.md @@ -0,0 +1,102 @@ +[English](../tool-calling.md) | **ไธญๆ–‡** + +# AI ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +ๆœฌ็›ฎๅฝ•ไธญๆœ‰ 2,350 ไธชๆจกๅž‹ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ๏ผˆๅ‡ฝๆ•ฐ่ฐƒ็”จ๏ผ‰ใ€‚ๆœฌ้กต้‡็‚นไป‹็ปๆž„ๅปบ AI ไปฃ็†ๅ’Œ่‡ชๅŠจๅŒ–ๆœ€ๆœ‰่ƒฝๅŠ›ๅ’Œๆœ€ๅ…ทๆ€งไปทๆฏ”็š„ๆจกๅž‹ใ€‚ + +> ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๆ–‡ๆกฃใ€‚"ๅทฅๅ…ท่ฐƒ็”จ"่กจ็คบๆจกๅž‹ๅฏไปฅๅœจๅ›žๅคไธญ่ฐƒ็”จๅค–้ƒจๅ‡ฝๆ•ฐ/ๅทฅๅ…ทใ€‚ + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ่ƒฝๅŠ› | ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ๆ•ฐ | +| -------------------- | -------------: | +| ๆ€ปๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ | 2,350 | +| ๅ”ฏไธ€ๆจกๅž‹ ID | 1,540 | +| ๆ”ฏๆŒๆŽจ็† | 1,076 | +| ๆ”ฏๆŒ่ง†่ง‰๏ผˆๅ›พๅƒ่พ“ๅ…ฅ๏ผ‰ | 1,063 | +| ๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บ | 829 | +| ๅผ€ๆบๆƒ้‡ | 270 | + +## ๆœ€ไพฟๅฎœ็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +ๆž„ๅปบ AI ไปฃ็†็š„ๆœ€ไฝณๆ€งไปทๆฏ”๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | ไธŠไธ‹ๆ–‡ | ๆŽจ็† | +| -------------------------- | ------------ | --------: | --------: | ------ | ---- | +| GLM-4-Flash | 302AI | $0.0014 | $0.0014 | 131K | โŒ | +| Mistral-Nemo-Instruct-2407 | KlusterAI | $0.008 | $0.001 | 131K | โŒ | +| BDC-Coder | InferenceNet | $0.01 | $0.01 | 131K | โŒ | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | โœ… | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | โœ… | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | โœ… | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | โœ… | +| GPT-5 Nano | Requesty | $0.025 | $0.20 | 400K | โœ… | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | โœ… | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | โœ… | + +## ๆœ€ๅคงไธŠไธ‹ๆ–‡ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +้€‚ๅˆๅค„็†ๅคงๅž‹ๆ–‡ๆกฃๆˆ–้•ฟๅฏน่ฏๅކๅฒ็š„ไปฃ็†๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ๆŽจ็† | ๆไพ›ๅ•†ๆ•ฐ | +| --------------------- | ------ | --------: | ---- | -------: | +| Llama 4 Scout | 10M | $0.08 | โŒ | 4 | +| Grok 4 Fast Reasoning | 2M | $0.20 | โœ… | 2 | +| GPT-5.4 | 1M | $2.50 | โœ… | 4 | +| Gemini 2.5 Pro | 1M | $1.25 | โœ… | 4 | +| Gemini 
2.5 Flash | 1M | $0.15 | โœ… | 3 | +| DeepSeek-V4 Flash | 1M | $0.27 | โœ… | 2 | +| GPT-4.1 | 1M | $2.00 | โŒ | 4 | +| Llama 4 Maverick | 1M | $0.15 | โŒ | 3 | + +## ๆœ€ไฝณๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็† + ่ง†่ง‰ + +้ซ˜็บง AI ไปฃ็†็š„"ไธ‰ไฝไธ€ไฝ“" โ€” ๅทฅๅ…ท่ฐƒ็”จใ€ๆŽจ็†ๅ’Œ่ง†่ง‰ไธ€ไฝ“๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ๆไพ›ๅ•†ๆ•ฐ | +| --------------------- | ------ | --------: | -------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5๏ผˆๅผ€ๆบๆƒ้‡๏ผ‰ | 1M | varies | 2 | +| Kimi K2.6๏ผˆๅผ€ๆบๆƒ้‡๏ผ‰ | 262K | varies | 4 | + +## ๅ…่ดนๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹ + +45 ไธชๅ…่ดนๆจกๅž‹ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ โ€” ้€‚ๅˆๅŽŸๅž‹่ฎพ่ฎกๅ’Œๆต‹่ฏ•๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ๆŽจ็† | ่ง†่ง‰ | +| ------------------------------ | ------ | ------ | ---- | ---- | +| gemini-2.0-flash | Google | 1M | โœ… | โœ… | +| gemini-2.5-flash-preview-05-20 | Google | 1M | โœ… | โœ… | +| llama-4-scout | Chutes | 10M | โŒ | โœ… | +| llama-4-maverick | Chutes | 1M | โŒ | โœ… | +| deepseek-r1 | Chutes | 128K | โœ… | โŒ | +| qwen3-235b-a22b | Chutes | 128K | โœ… | โœ… | +| gemma-3-27b-it | Chutes | 128K | โœ… | โœ… | + +## ่ฆ็‚นๆ€ป็ป“ + +- **2,350 ไธชๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹**๏ผŒๆถต็›– 1,540 ไธชๅ”ฏไธ€ๆจกๅž‹ ID โ€” ๆœ€ๅคง็š„ๅทฅๅ…ท่ฐƒ็”จๆจกๅž‹็›ฎๅฝ• +- **Gemini 2.5 Flash** ๆ˜ฏๆœ€ไฝณๆ€งไปทๆฏ”๏ผš1M ไธŠไธ‹ๆ–‡ใ€ๅทฅๅ…ท่ฐƒ็”จใ€ๆŽจ็†ๅ’Œ่ง†่ง‰๏ผŒไป… $0.15/1M +- **Grok 4 Fast Reasoning** ๆไพ›ๆœ€ๅคงไธŠไธ‹ๆ–‡๏ผˆ2M๏ผ‰ไธ”ๅ…ทๅค‡ๅ…จ้ƒจไธ‰็ง่ƒฝๅŠ› +- **45 ไธชๅ…่ดนๆจกๅž‹**ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ โ€” ้›ถๆˆๆœฌๅผ€ๅง‹ๆž„ๅปบไปฃ็† +- **829 ไธชๆจกๅž‹**ๅŒๆ—ถๆ”ฏๆŒ็ป“ๆž„ๅŒ–่พ“ๅ‡บ โ€” ๅฎŒ็พŽ้€‚ๅˆๅฏ้ ็š„ JSON ๅ“ๅบ” +- ๅฐๅž‹ๆจกๅž‹๏ผˆQwen 3.5 0.8Bโ€“4B๏ผ‰ๅธฆๅทฅๅ…ท่ฐƒ็”จไป…้œ€ $0.01โ€“$0.03/1M tokens + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 
ไธชๅ…่ดนๆจกๅž‹๏ผŒๅคšๆ•ฐๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ +- [็ป“ๆž„ๅŒ–่พ“ๅ‡บ](structured-output.md) โ€” 829 ไธช JSON ๆจกๅผๆจกๅž‹ +- [ๆŽจ็†ๆจกๅž‹](reasoning-models.md) โ€” 1,306 ไธชๆ”ฏๆŒๆŽจ็†็š„ๆจกๅž‹ +- [็ผ“ๅญ˜ๅฎšไปท](cached-pricing.md) โ€” 1,374 ไธชๆ”ฏๆŒๆ็คบ็ผ“ๅญ˜็š„ๆจกๅž‹ +- [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](openai-alternatives.md) โ€” GPT-4/GPT-3.5 ๅทฅๅ…ท่ฐƒ็”จๆ›ฟไปฃ +- [ๆ™บ่ƒฝไฝ“ๆจกๅž‹](agentic-models.md) โ€” 1,080 ไธชๅทฅๅ…ท่ฐƒ็”จ+ๆŽจ็†ๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/docs/zh/video-models.md b/docs/zh/video-models.md new file mode 100644 index 00000000..a66fb3ed --- /dev/null +++ b/docs/zh/video-models.md @@ -0,0 +1,210 @@ +# ่ง†้ข‘ๆจกๅž‹ + +[English](../video-models.md) + +ๆ”ฏๆŒ่ง†้ข‘่พ“ๅ…ฅๆˆ–่พ“ๅ‡บ็š„ AI ๆจกๅž‹๏ผŒๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models)ใ€‚ + +## ็ปŸ่ฎก + +| ๆŒ‡ๆ ‡ | ๆ•ฐ้‡ | +| ------------ | ---- | +| ่ง†้ข‘ๆจกๅž‹ๆ€ปๆ•ฐ | 171 | +| ่ง†้ข‘่พ“ๅ…ฅ | 167 | +| ่ง†้ข‘่พ“ๅ‡บ | 4 | +| ๅ…่ดน | 0 | +| ๅผ€ๆบๆƒ้‡ | 6 | +| ๆไพ›ๅ•† | 18 | + +## ๆไพ›ๅ•† + +`aihubmix`, `amazon`, `amazon-bedrock`, `bytedance`, `chutes`, `fastrouter`, `google`, `google-vertex`, `hpc-ai`, `inferencenet`, `minimax`, `novitaai`, `openrouter`, `tencent`, `tencent-tokenhub`, `voyage`, `vultr`, `xiaomi` + +## ๆจกๅž‹ + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅไปทๆ ผ | ่ƒฝๅŠ› | +| ---------------------------------------------------- | ---------------- | ------ | --------- | -------------- | +| doubao-seed-1-6 | aihubmix | โ€” | $0.09 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-flash | aihubmix | โ€” | $0.022 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-lite | aihubmix | โ€” | $0.041 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-6-thinking | aihubmix | โ€” | $0.09 | ๐Ÿ“น in ๐Ÿ”ง | +| doubao-seed-1-8 | aihubmix | โ€” | $0.054795 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.0-flash | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง 
| +| gemini-2.0-flash-exp | aihubmix | โ€” | $0.01 | ๐Ÿ“น in | +| gemini-2.0-flash-lite | aihubmix | โ€” | $0.038 | ๐Ÿ“น in | +| gemini-2.0-flash-search | aihubmix | โ€” | $0.05 | ๐Ÿ“น in | +| gemini-2.0-flash-thinking-exp-01-21 | aihubmix | โ€” | $0.038 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.0-pro-exp-02-05 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in | +| gemini-2.0-pro-exp-02-05-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in | +| gemini-2.5-flash | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-nothink | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-preview-09-2025 | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-lite-preview-09-2025-nothink | aihubmix | โ€” | $0.05 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-nothink | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-preview-05-20-nothink | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-preview-05-20-search | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-preview-09-2025 | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash-search | aihubmix | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-exp-03-25 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro-preview-03-25-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-preview-05-06 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.5-pro-preview-05-06-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿง  | +| gemini-2.5-pro-preview-06-05 | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-preview-06-05-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-pro-search | aihubmix | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-3.1-flash-lite-preview-nothink | aihubmix | โ€” | $0.125 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| glm-4.5v | aihubmix | โ€” | $0.137 | ๐Ÿ“น in | +| glm-4.6v | aihubmix | โ€” | $0.0685 | ๐Ÿ“น in | +| 
gme-qwen2-vl-2b-instruct | aihubmix | โ€” | $0.069 | ๐Ÿ“น in | +| kimi-k2.5 | aihubmix | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| mimo-v2-omni | aihubmix | โ€” | $0.22 | ๐Ÿ“น in | +| mimo-v2-pro | aihubmix | โ€” | $0.55 | ๐Ÿ“น in | +| qwen--qwen2.5-vl-32b-instruct | aihubmix | โ€” | $0.12 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen2.5-vl-72b-instruct | aihubmix | โ€” | $0.25 | ๐Ÿ“น in | +| qwen2-vl-72b-instruct | aihubmix | โ€” | $1.09 | ๐Ÿ“น in | +| qwen2-vl-7b-instruct | aihubmix | โ€” | $0.14 | ๐Ÿ“น in | +| qwen3-vl-235b-a22b-instruct | aihubmix | โ€” | $0.137 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-235b-a22b-thinking | aihubmix | โ€” | $0.137 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen3-vl-30b-a3b-instruct | aihubmix | โ€” | $0.0514 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-30b-a3b-thinking | aihubmix | โ€” | $0.0514 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen3-vl-flash | aihubmix | โ€” | $0.0103 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-flash-2026-01-22 | aihubmix | โ€” | $0.0103 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen3-vl-plus | aihubmix | โ€” | $0.0685 | ๐Ÿ“น in ๐Ÿ”ง | +| veo-2.0-generate-001 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.0-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-fast-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo-3.1-lite-generate-preview | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| veo3 | aihubmix | โ€” | $1 | ๐Ÿ“น in | +| amazon-nova-2.0-lite | amazon | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-2.0-omni | amazon | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-2.0-pro | amazon | โ€” | $0.625 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon-nova-lite | amazon | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-premier | amazon | โ€” | $2.5 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-pro | amazon | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-2-lite | amazon-bedrock | โ€” | $0.33 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-lite | amazon-bedrock | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-premier | amazon-bedrock | โ€” | $2.5 | ๐Ÿ“น in ๐Ÿ”ง | +| 
amazon-nova-pro | amazon-bedrock | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง | +| amazon-nova-pro-latency-optimized | amazon-bedrock | โ€” | $1 | ๐Ÿ“น in ๐Ÿ”ง | +| seed-1.6 | bytedance | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-1.6-flash | bytedance | โ€” | $0.07 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-2.0-lite | bytedance | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| seed-2.0-mini | bytedance | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--Kimi-K2.5-TEE | chutes | โ€” | $0.44 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--Kimi-K2.6-TEE | chutes | โ€” | $0.74 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3-flash-preview | fastrouter | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite-preview | fastrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview | fastrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it | fastrouter | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-1.5-flash | google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-1.5-flash-8b | google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-1.5-pro | google | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.0-flash | google | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.0-flash-lite | google | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-flash | google | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemini-2.5-flash-lite | google | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2.5-pro | google | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| gemma-3n-E2B-it | google | โ€” | โ€” | ๐Ÿ“น in | +| gemma-3n-E4B-it | google | โ€” | โ€” | ๐Ÿ“น in | +| veo-2.0-generate | google | โ€” | โ€” | ๐Ÿ“น out | +| gemini-2-5-flash | google-vertex | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2-5-flash-lite | google-vertex | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-2-5-pro | google-vertex | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-1-flash-lite | google-vertex | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-flash | google-vertex | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง | +| gemini-3-pro | google-vertex | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง | +| xiaomi--mimo-v2.5 | hpc-ai | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  ๐Ÿ”“ | 
+| cliptagger-12b | inferencenet | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”“ | +| MiniMax-Hailuo-02 | minimax | โ€” | โ€” | ๐Ÿ“น out | +| MiniMax-Hailuo-2.3 | minimax | โ€” | โ€” | ๐Ÿ“น out | +| MiniMax-Hailuo-2.3-Fast | minimax | โ€” | โ€” | ๐Ÿ“น out | +| baidu--ernie-4.5-vl-28b-a3b-thinking | novitaai | โ€” | $0.39 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--kimi-k2.5 | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| moonshotai--kimi-k2.6 | novitaai | โ€” | $0.8 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen2.5-vl-72b-instruct | novitaai | โ€” | $0.8 | ๐Ÿ“น in | +| qwen--qwen3-omni-30b-a3b-instruct | novitaai | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-omni-30b-a3b-thinking | novitaai | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3-vl-235b-a22b-instruct | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-vl-235b-a22b-thinking | novitaai | โ€” | $0.98 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3-vl-30b-a3b-instruct | novitaai | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-vl-30b-a3b-thinking | novitaai | โ€” | $0.2 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3-vl-8b-instruct | novitaai | โ€” | $0.08 | ๐Ÿ“น in ๐Ÿ”ง | +| qwen--qwen3.5-122b-a10b | novitaai | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-27b | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-35b-a3b | novitaai | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-397b-a17b | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-27b | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-35b-a3b | novitaai | โ€” | $0.248 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| zai-org--glm-4.5v | novitaai | โ€” | $0.6 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| zai-org--glm-4.6v | novitaai | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| amazon--nova-2-lite-v1 | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-1.6 | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-1.6-flash | openrouter | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-2.0-lite | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| bytedance-seed--seed-2.0-mini | 
openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.0-flash-001 | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| google--gemini-2.0-flash-lite-001 | openrouter | โ€” | $0.075 | ๐Ÿ“น in ๐Ÿ”ง | +| google--gemini-2.5-flash | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-flash-lite | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-flash-lite-preview-09-2025 | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-pro | openrouter | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-2.5-pro-preview-05-06 | openrouter | โ€” | $1.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3-flash-preview | openrouter | โ€” | $0.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-flash-lite-preview | openrouter | โ€” | $0.25 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview | openrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.1-pro-preview-customtools | openrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemini-3.5-flash | openrouter | โ€” | $1.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-26b-a4b-it | openrouter | โ€” | $0.06 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-26b-a4b-it--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it | openrouter | โ€” | $0.12 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| google--gemma-4-31b-it--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| nvidia--nemotron-nano-12b-v2-vl--free | openrouter | โ€” | โ€” | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| perceptron--perceptron-mk1 | openrouter | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿง  | +| qwen--qwen3.5-122b-a10b | openrouter | โ€” | $0.26 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-27b | openrouter | โ€” | $0.195 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-35b-a3b | openrouter | โ€” | $0.139 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-397b-a17b | openrouter | โ€” | $0.39 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  
| +| qwen--qwen3.5-9b | openrouter | โ€” | $0.04 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-flash-02-23 | openrouter | โ€” | $0.065 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-plus-02-15 | openrouter | โ€” | $0.26 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.5-plus-20260420 | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-27b | openrouter | โ€” | $0.32 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-35b-a3b | openrouter | โ€” | $0.15 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-flash | openrouter | โ€” | $0.1875 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| qwen--qwen3.6-plus | openrouter | โ€” | $0.325 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| rekaai--reka-edge | openrouter | โ€” | $0.1 | ๐Ÿ“น in ๐Ÿ”ง | +| xiaomi--mimo-v2-omni | openrouter | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| xiaomi--mimo-v2.5 | openrouter | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| z-ai--glm-4.6v | openrouter | โ€” | $0.3 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| z-ai--glm-5v-turbo | openrouter | โ€” | $1.2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| ~google--gemini-flash-latest | openrouter | โ€” | $1.5 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| ~google--gemini-pro-latest | openrouter | โ€” | $2 | ๐Ÿ“น in ๐Ÿ”ง ๐Ÿง  | +| hunyuan-turbos-vision-video | tencent | โ€” | $3 | ๐Ÿ“น in | +| yt-vita | tencent-tokenhub | โ€” | $1.2 | ๐Ÿ“น in | +| voyage-multimodal-3 | voyage | โ€” | $0.12 | ๐Ÿ“น in | +| voyage-multimodal-3.5 | voyage | โ€” | $0.12 | ๐Ÿ“น in | +| gemma-4-26b-a4b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-31b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-e2b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| gemma-4-e4b-it | vultr | โ€” | $0.55 | ๐Ÿ“น in ๐Ÿ”“ | +| mimo-v2-omni | xiaomi | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง | +| mimo-v2.5 | xiaomi | โ€” | $0.4 | ๐Ÿ“น in ๐Ÿ”ง | + +> ๐Ÿ’ก ไฝฟ็”จ[ไบคไบ’ๅผ็›ฎๅฝ•](https://i-need-token.github.io/ai-models/)ๆœ็ดขๅ’Œ็ญ›้€‰ๆ›ดๅคšๆกไปถ็š„ๆจกๅž‹ใ€‚ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ + +## ็›ธๅ…ณๆ–‡ๆกฃ + 
+- [้Ÿณ้ข‘ๆจกๅž‹](audio-models.md) โ€” 118 ไธช้Ÿณ้ข‘่พ“ๅ…ฅ + 34 ไธช้Ÿณ้ข‘่พ“ๅ‡บๆจกๅž‹ +- [่ง†่ง‰ๆจกๅž‹](vision-models.md) โ€” 1,487 ไธช่ง†่ง‰ๆจกๅž‹ +- [ๅ›พๅƒ็”Ÿๆˆ](image-generation.md) โ€” 28 ไธชๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ +- [ๆจกๆ€็Ÿฉ้˜ต](modality-matrix.md) โ€” ๆ‰€ๆœ‰ๆจกๆ€ไธ€่งˆ +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ๅ†ณ็ญ–ๆก†ๆžถ diff --git a/docs/zh/vision-models.md b/docs/zh/vision-models.md new file mode 100644 index 00000000..d84f9bb3 --- /dev/null +++ b/docs/zh/vision-models.md @@ -0,0 +1,101 @@ +[English](../vision-models.md) | **ไธญๆ–‡** + +# AI ่ง†่ง‰ๆจกๅž‹ + +ๆœฌ็›ฎๅฝ•ไธญๆœ‰ 1,487 ไธชๆจกๅž‹ๆŽฅๅ—ๅ›พๅƒ่พ“ๅ…ฅ๏ผˆ่ง†่ง‰๏ผ‰ใ€‚ๆœฌ้กต้‡็‚นไป‹็ปๅ›พๅƒ็†่งฃใ€ๆ–‡ๆกฃๅˆ†ๆžๅ’Œ่ง†่ง‰ๆŽจ็†ๆœ€ๆœ‰่ƒฝๅŠ›ๅ’Œๆœ€ๅ…ทๆ€งไปทๆฏ”็š„ๆจกๅž‹ใ€‚ + +> ๆ‰€ๆœ‰ๆ•ฐๆฎๆฅ่‡ชไธ€ๆ‰‹ API ๅ’Œๆ–‡ๆกฃใ€‚"่ง†่ง‰"่กจ็คบๆจกๅž‹ๆŽฅๅ—ๅ›พๅƒ่พ“ๅ…ฅ๏ผ›ๅ›พๅƒ็”Ÿๆˆๆ˜ฏ็‹ฌ็ซ‹็š„่ƒฝๅŠ›ใ€‚ + +## ๅฟซ้€Ÿ็ปŸ่ฎก + +| ่ƒฝๅŠ› | ่ง†่ง‰ๆจกๅž‹ๆ•ฐ | +| ------------ | ---------: | +| ๆ€ป่ง†่ง‰ๆจกๅž‹ | 1,487 | +| ๅ”ฏไธ€ๆจกๅž‹ ID | 930 | +| ๆ”ฏๆŒๅทฅๅ…ท่ฐƒ็”จ | 1,063 | +| ๆ”ฏๆŒๆŽจ็† | 697 | +| ๅผ€ๆบๆƒ้‡ | 104 | + +## ๆœ€ไพฟๅฎœ็š„่ง†่ง‰ๆจกๅž‹ + +ๅ›พๅƒ็†่งฃ็š„ๆœ€ไฝณๆ€งไปทๆฏ”๏ผš + +| ๆจกๅž‹ | ๆไพ›ๅ•† | ่พ“ๅ…ฅ $/1M | ่พ“ๅ‡บ $/1M | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | +| --------------------- | ----------- | --------: | --------: | ------ | -------- | ---- | +| Qwen 3.5 0.8B | Auriko | $0.01 | $0.05 | 262K | โœ… | โœ… | +| Qwen 3.5 0.8B | DeepInfra | $0.01 | $0.05 | 262K | โœ… | โœ… | +| Qwen 3.5 2B | Auriko | $0.02 | $0.10 | 262K | โœ… | โœ… | +| Qwen 3.5 2B | DeepInfra | $0.02 | $0.10 | 262K | โœ… | โœ… | +| Qwen 3.5 4B | Auriko | $0.03 | $0.15 | 262K | โœ… | โœ… | +| Qwen 3.5 4B | DeepInfra | $0.03 | $0.15 | 262K | โœ… | โœ… | +| Gemini 2.5 Flash Lite | Google | $0.10 | $0.60 | 1M | โœ… | โœ… | +| Gemini 2.5 Flash | Google | $0.15 | $0.60 | 1M | โœ… | โœ… | +| Llama 4 Maverick | Together AI | $0.15 | $0.60 | 1M | โœ… | โŒ | +| Grok 4 Fast Reasoning | xAI | $0.20 | $0.50 | 2M | โœ… | โœ… | + +## 
ๆœ€ๅคงไธŠไธ‹ๆ–‡่ง†่ง‰ๆจกๅž‹ + +้€‚ๅˆๅˆ†ๆžๅคงๅž‹ๆ–‡ๆกฃใ€ๅคš้กต PDF ๆˆ–้•ฟๅ›พๅƒๅบๅˆ—๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | ๆไพ›ๅ•†ๆ•ฐ | +| --------------------- | ------ | --------: | -------- | ---- | -------: | +| Llama 4 Scout | 10M | $0.08 | โœ… | โŒ | 4 | +| Grok 4 Fast Reasoning | 2M | $0.20 | โœ… | โœ… | 2 | +| GPT-5.4 | 1M | $2.50 | โœ… | โœ… | 4 | +| Gemini 2.5 Pro | 1M | $1.25 | โœ… | โœ… | 4 | +| Gemini 2.5 Flash | 1M | $0.15 | โœ… | โœ… | 3 | +| DeepSeek Reasoner | 1M | $0.43 | โœ… | โœ… | 1 | +| GPT-4.1 | 1M | $2.00 | โœ… | โŒ | 4 | +| Llama 4 Maverick | 1M | $0.15 | โœ… | โŒ | 3 | + +## ๆœ€ไฝณ่ง†่ง‰ + ๅทฅๅ…ท่ฐƒ็”จ + ๆŽจ็† + +ๆœ€ๆœ‰่ƒฝๅŠ›็š„่ง†่ง‰ๆจกๅž‹ โ€” ่ƒฝ็œ‹ใ€่ƒฝๆŽจ็†ใ€่ƒฝ่กŒๅŠจ๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ่พ“ๅ…ฅ $/1M | ๆไพ›ๅ•†ๆ•ฐ | +| --------------------- | ------ | --------: | -------: | +| Grok 4 Fast Reasoning | 2M | $0.20 | 2 | +| Gemini 2.5 Flash | 1M | $0.15 | 3 | +| Gemini 2.5 Pro | 1M | $1.25 | 4 | +| GPT-5.4 | 1M | $2.50 | 4 | +| DeepSeek Reasoner | 1M | $0.43 | 1 | +| MiMo V2.5๏ผˆๅผ€ๆบๆƒ้‡๏ผ‰ | 1M | varies | 2 | +| Kimi K2.6๏ผˆๅผ€ๆบๆƒ้‡๏ผ‰ | 262K | varies | 4 | + +## ๅผ€ๆบๆƒ้‡่ง†่ง‰ๆจกๅž‹ + +104 ไธชๅผ€ๆบๆƒ้‡ๆจกๅž‹ๆŽฅๅ—ๅ›พๅƒ่พ“ๅ…ฅ โ€” ๅœจ่‡ชๅทฑ็š„็กฌไปถไธŠ่ฟ่กŒ่ง†่ง‰ AI๏ผš + +| ๆจกๅž‹ | ไธŠไธ‹ๆ–‡ | ๅทฅๅ…ท่ฐƒ็”จ | ๆŽจ็† | ๆไพ›ๅ•†ๆ•ฐ | +| ------------------ | ------ | -------- | ---- | -------: | +| MiMo V2.5 | 1M | โœ… | โœ… | 2 | +| Llama 4 Maverick | 1M | โœ… | โŒ | 3 | +| Llama 4 Scout | 10M | โœ… | โŒ | 2 | +| Gemma 4 31B IT | 1M | โœ… | โŒ | 3 | +| Qwen3.5 Flash | 1M | โœ… | โŒ | 1 | +| Kimi K2.6 | 262K | โœ… | โœ… | 4 | +| Gemma 4 26B A4B IT | 262K | โœ… | โœ… | 3 | +| Llama 4 Scout 17B | 328K | โœ… | โŒ | 4 | + +## ่ฆ็‚นๆ€ป็ป“ + +- **1,487 ไธช่ง†่ง‰ๆจกๅž‹**๏ผŒๆถต็›– 930 ไธชๅ”ฏไธ€ๆจกๅž‹ ID โ€” ๆœ€ๅคง็š„่ง†่ง‰ๆจกๅž‹็›ฎๅฝ• +- **Gemini 2.5 Flash** ๆ˜ฏๆœ€ไฝณๆ€งไปทๆฏ”๏ผš1M ไธŠไธ‹ๆ–‡ใ€่ง†่ง‰ใ€ๅทฅๅ…ท่ฐƒ็”จๅ’ŒๆŽจ็†๏ผŒไป… $0.15/1M +- **Llama 4 Scout** 
ๆ‹ฅๆœ‰ๆœ€ๅคง็š„่ง†่ง‰ไธŠไธ‹ๆ–‡็ช—ๅฃ๏ผˆ10M tokens๏ผ‰ +- **Grok 4 Fast Reasoning** ๆ˜ฏๅ”ฏไธ€็ป“ๅˆ 2M ไธŠไธ‹ๆ–‡ใ€่ง†่ง‰ใ€ๅทฅๅ…ท่ฐƒ็”จๅ’ŒๆŽจ็†็š„ๆจกๅž‹ +- **104 ไธชๅผ€ๆบๆƒ้‡่ง†่ง‰ๆจกๅž‹** โ€” ๅœจ่‡ชๅทฑ็š„ๅŸบ็ก€่ฎพๆ–ฝไธŠ่ฟ่กŒ่ง†่ง‰ AI +- ๅฐๅž‹่ง†่ง‰ๆจกๅž‹๏ผˆQwen 3.5 0.8Bโ€“4B๏ผ‰ๆฏ 1M tokens ไป…้œ€ $0.01โ€“$0.03 + +## ็›ธๅ…ณๆ–‡ๆกฃ + +- [ๆจกๅž‹้€‰ๆ‹ฉๆŒ‡ๅ—](model-selection.md) โ€” ้€‰ๆ‹ฉๆจกๅž‹็š„ๅ†ณ็ญ–ๆก†ๆžถ +- [ๅ›พๅƒ็”Ÿๆˆ](image-generation.md) โ€” 28 ไธชๅ›พๅƒ็”Ÿๆˆๆจกๅž‹ +- [่ง†้ข‘ๆจกๅž‹](video-models.md) โ€” 167 ไธช่ง†้ข‘่พ“ๅ…ฅ/่พ“ๅ‡บๆจกๅž‹ +- [ๆจกๆ€็Ÿฉ้˜ต](modality-matrix.md) โ€” ๆ‰€ๆœ‰ๆจกๆ€ไธ€่งˆ +- [ๅ…่ดน AI ๆจกๅž‹](free-models.md) โ€” 81 ไธชๅ…่ดนๆจกๅž‹๏ผŒ้ƒจๅˆ†ๆ”ฏๆŒ่ง†่ง‰ +- [OpenAI ๆ›ฟไปฃๆ–นๆกˆ](openai-alternatives.md) โ€” GPT-4 ็บงๅˆซ่ง†่ง‰ๆ›ฟไปฃ +- [้Ÿณ้ข‘ๆจกๅž‹](audio-models.md) โ€” 118 ไธช้Ÿณ้ข‘่พ“ๅ…ฅ + 34 ไธช้Ÿณ้ข‘่พ“ๅ‡บๆจกๅž‹ + +--- + +ๆ•ฐๆฎๆฅๆบไบŽ [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” ็ป“ๆž„ๅŒ– YAML๏ผŒๅŒ…ๅซ 95 ไธชๆไพ›ๅ•† 4,587+ ๆจกๅž‹็š„ๅฎšไปทใ€ไธŠไธ‹ๆ–‡็ช—ๅฃๅ’Œ่ƒฝๅŠ›ไฟกๆฏใ€‚ diff --git a/llms-full.txt b/llms-full.txt new file mode 100644 index 00000000..42ba2b78 --- /dev/null +++ b/llms-full.txt @@ -0,0 +1,420 @@ +# AI Models Catalog + +> Structured YAML catalog of 4,587 AI models across 95 providers โ€” pricing, context windows, modalities, capabilities. First-party data only. npm package available. + +## What is this? + +A machine-readable YAML catalog of every major AI model provider and their models. Every data point comes from the provider's own API or documentation, never third-party aggregators. 
+ +## Key Stats + +- 95 providers +- 4,587 model files +- 2,712 unique model IDs +- 441 model families +- 1,306 reasoning models +- 2,350 tool-calling models +- 527 open-weight models +- 81 free models +- 1,487 vision models +- 829 structured output models +- 28 image generation models +- 118 audio input models +- 167 video input models + +## Install + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types +``` + +## Download + +```bash +# JSON โ€” full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv + +# CDN (no install, CORS-enabled, always up-to-date) +curl -s https://cdn.jsdelivr.net/npm/ai-models@latest/models.json | jq '.models | length' +``` + +## Data Format + +Each model is a single YAML file at `providers//models/.yaml`: + +```yaml +id: gpt-4.1 +name: GPT-4.1 +family: gpt-4.1 +tool_call: true +structured_output: true +pricing: + input: 2.0 + output: 8.0 + cache_read: 0.5 +limit: + context: 1047576 + output: 32768 +modalities: + input: [text, image] + output: [text] +release_date: "2026-05-18" +last_updated: "2026-05-18" +``` + +## Pricing Types + +| Type | When | Example | +| -------------- | ------------------------- | ------------------------------- | +| `TokenPricing` | Per-million-token pricing | `input: 2.5, output: 10` | +| `VideoPricing` | Per-second pricing | `unit: per_second, price: 0.03` | +| `UnitPricing` | Per-image or per-request | `unit: per_image, price: 0.04` | +| `FreePricing` | No cost | `unit: free` | + +## Covered Providers + +OpenAI, Anthropic, Google, Meta, DeepSeek, Alibaba Cloud, Mistral, xAI, Cohere, NVIDIA, IBM, Microsoft, Amazon Bedrock, Azure OpenAI, Google Vertex AI, OpenRouter, Together AI, Fireworks AI, 
Groq, Cerebras, DeepInfra, SiliconFlow, Novita AI, SambaNova, Cloudflare Workers AI, Chutes, Kluster AI, NanoGPT, and 65+ more. + +Full list: 01.AI, 302.AI, AI21 Labs, AIHubMix, AI/ML API, Aion Labs, Alibaba Cloud, Amazon Bedrock, Amazon Nova, Anthropic, Arcee AI, Auriko, Azure OpenAI, Baichuan AI, Baidu, Baseten, Berget, ByteDance, Cerebras, Chutes, Clarifai, CloudFerro Sherlock, Cloudflare Workers AI, Cohere, Cortecs, DInference, Databricks, DeepInfra, DeepSeek, DigitalOcean, evroc, FastRouter, Fireworks AI, FriendliAI, GMI Cloud, Google, Google Vertex AI, Groq, HPC-AI Cloud, Hyperbolic, IBM Granite, iFlytek SparkDesk, Inception Labs, InclusionAI, Inference.net, Kluster AI, LLM Gateway, Martian, MegaNova, Meta Llama, Microsoft Phi, MiniMax, Mistral AI, Mixlayer, MoArk AI, Moonshot AI, Morph, NanoGPT, Nebius, NeuralWatt, Nous Research, Novita AI, NVIDIA, OpenAI, OpenRouter, OrcaRouter, OVHcloud, PPIO, Perplexity, Privatemode AI, Qiniu AI, Regolo, Reka AI, Requesty, SambaNova, Sarvam AI, Scaleway, SiliconFlow, SiliconFlow CN, StepFun, SubModel, Tencent Cloud TokenHub, Tencent Hunyuan, TextSynth, Together AI, Upstage, Venice AI, Voyage AI, Vultr, Wafer, Writer, xAI Grok, Xiaomi, Zhipu AI, 接口 AI + +## Data Schema + +### Model Schema (Required Fields) + +| Field | Type | Description | Example | +| -------------- | ------- | ---------------------------------------- | ------------------------------------------ | +| `id` | string | Stable model ID (no date suffix) | `gpt-4o`, `claude-sonnet-4-5` | +| `name` | string | Display name | `GPT-4o`, `Claude Sonnet 4.5` | +| `family` | string | Model family (broad lineage) | `gpt-4o`, `claude-sonnet` | +| `pricing` | Pricing | Model pricing (see below) | — | +| `modalities` | object | Input/output modalities | `{ input: [text, image], output: [text] }` | +| `last_updated` | string | Last data update (YYYY-MM-DD or YYYY-MM) | `2024-08-06` | + +### Model Schema (Optional Fields) + +| Field | Type | Default | Description | 
Example | +| ------------------- | ------- | ------- | -------------------------------- | ------------------------------------ | +| `reasoning` | boolean | `false` | Supports reasoning/thinking mode | `true` | +| `temperature` | boolean | `true` | Supports temperature parameter | `false` | +| `tool_call` | boolean | `false` | Supports tool/function calling | `true` | +| `attachment` | boolean | `false` | Supports file attachments | `true` | +| `structured_output` | boolean | `false` | Supports structured/JSON output | `true` | +| `open_weights` | boolean | `false` | Open-weight model | `true` | +| `deprecated` | boolean | `false` | Deprecated but still accessible | `true` | +| `limit` | object | โ€” | Token limits | `{ context: 128000, output: 16384 }` | +| `knowledge` | string | โ€” | Training data cutoff | `2023-10` | +| `release_date` | string | โ€” | Model release date | `2024-05-13` | +| `snapshots` | array | โ€” | Dated model versions | See below | + +### Modality Types + +| Modality | Description | +| -------- | --------------------- | +| `text` | Text input or output | +| `image` | Image input or output | +| `video` | Video input | +| `audio` | Audio input or output | +| `pdf` | PDF document input | + +### Pricing Schema + +Pricing is a union of four types: + +**TokenPricing** (most common โ€” per-million-token pricing): + +```yaml +pricing: + input: 2.5 # $/M input tokens + output: 10 # $/M output tokens + cache_write: 1.25 # optional + cache_read: 0.625 # optional +``` + +**VideoPricing** (per-second, optionally tiered by resolution): + +```yaml +pricing: + unit: per_second + price: 0.03 +``` + +**UnitPricing** (per-image or per-request): + +```yaml +pricing: + unit: per_image + price: 0.04 +``` + +**FreePricing** (no cost): + +```yaml +pricing: + unit: free +``` + +### Snapshot Schema + +Snapshots represent dated versions of a model. 
They inherit all parent fields and only override what differs: + +```yaml +id: gpt-4o +name: GPT-4o +snapshots: + - id: gpt-4o-2024-08-06 + last_updated: "2024-08-06" + - id: gpt-4o-2024-05-13 + deprecated: true + last_updated: "2024-05-13" +``` + +### Provider Schema + +Each provider has a `provider.yaml` file: + +| Field | Type | Required | Description | Example | +| ---------------- | ------ | -------- | ------------------------------------ | ---------------------------------- | +| `id` | string | โœ… | Provider ID (matches directory name) | `openai` | +| `name` | string | โœ… | Display name | `OpenAI` | +| `url` | string | โœ… | Official website URL | `https://openai.com` | +| `api_docs` | string | โŒ | API documentation URL | `https://platform.openai.com/docs` | +| `apis` | object | โœ… | API endpoints keyed by format | See below | +| `apis.openai` | string | โŒ | OpenAI-compatible API endpoint | `https://api.openai.com/v1` | +| `apis.anthropic` | string | โŒ | Anthropic API endpoint | โ€” | +| `apis.google` | string | โŒ | Google AI API endpoint | โ€” | +| `currency` | string | โŒ | Default currency (USD/CNY/EUR) | `USD` | + +## Quick Start + +### Find the cheapest model + +โ†’ See [Pricing Comparison](docs/pricing-comparison.md) + +**Cheapest models with tool calling:** + +| Model | Provider | Input (per 1M tokens) | Output (per 1M tokens) | +| ---------------- | ------------- | --------------------: | ---------------------: | +| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-235B-A22B | Alibaba Cloud | $0.14 | $0.42 | +| Llama 4 Maverick | Together AI | $0.20 | $0.80 | + +### Find the most capable model + +โ†’ See [Model Comparison](docs/model-comparison.md) + +**Top-tier flagships:** + +| Model | Context | Tool Call | Vision | Input $/1M | Output $/1M | +| -------------- | ------- | --------- | ------ | ---------: | ----------: | +| GPT-4.1 | 1M | โœ… | โœ… | $2.00 | $8.00 | +| Claude Opus 4 | 200K | โœ… | โœ… | $15.00 | $75.00 | +| Gemini 2.5 Pro 
| 1M | โœ… | โœ… | $1.25 | $10.00 | + +### Find a free model + +โ†’ See [Free AI Models](docs/free-models.md) + +- Google Gemini 2.0 Flash (1M context, tool calling, vision, reasoning) +- 70+ models on Chutes (Llama 4, Qwen3, DeepSeek-R1, etc.) + +### Find the largest context window + +โ†’ See [Context Window Comparison](docs/context-windows.md) + +| Model | Context Window | +| --------------- | -------------: | +| Llama 4 Scout | 10M tokens | +| Gemini 2.5 Pro | 1M tokens | +| GPT-4.1 | ~1M tokens | + +## Programmatic Access + +### npm package + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types + +// Find models with tool calling under $1/1M input +const affordable = catalog.models.filter((m) => m.tool_call && m.pricing.input < 1); +``` + +### Download data files + +```bash +# JSON โ€” full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +### Python usage + +```python +import json + +with open("models.json") as f: + catalog = json.load(f) + +# Find all reasoning models +reasoning = [m for m in catalog["models"] if m.get("reasoning")] + +# Find models with largest context windows +by_context = sorted( + catalog["models"], + key=lambda m: (m.get("limit", {}) or {}).get("context", 0), + reverse=True, +)[:10] +``` + +### JSON structure + +```json +{ + "generated_at": "2026-05-21T02:13:04.076Z", + "stats": { + "providers": 95, + "models": 4587, + "unique_model_ids": 2712, + "families": 441 + }, + "providers": { + "openai": { "name": "OpenAI", "model_count": 28 }, + "anthropic": { "name": "Anthropic", "model_count": 11 } + }, + "models": [ + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "family": "gpt-4.1", + "provider": "openai", + 
"tool_call": true, + "structured_output": true, + "pricing": { "input": 2, "output": 8, "cache_read": 0.5 }, + "limit": { "context": 1047576, "output": 32768 }, + "modalities": { "input": ["text", "image"], "output": ["text"] } + } + ] +} +``` + +## Documentation + +- [Quick Start](docs/quick-start.md) โ€” find the right model in 30 seconds +- [Model Selection Guide](docs/model-selection.md) โ€” decision framework: free, best value, large context models +- [Model Selection Cheatsheet](docs/model-selection-cheatsheet.md) +- [AI Model Picker](docs/ai-model-picker.md) โ€” quick-reference: best model by budget and use case +- [Small Language Models Guide](docs/small-language-models.md) โ€” 2,002 SLMs for edge, mobile, and cost-efficient production +- [Benchmarks & Leaderboards](docs/benchmarks.md) โ€” key benchmarks, leaderboard landscape, interpretation guide +- [API & Programmatic Access](docs/api.md) โ€” download models.json, code examples +- [Code Examples](docs/code-examples.md) โ€” practical examples in TypeScript, Python, Go, Rust, jq +- [FAQ](docs/faq.md) โ€” frequently asked questions about the catalog, data, and contributing +- [Glossary](docs/glossary.md) โ€” key terms and definitions for AI model terminology +- [Model Comparison](docs/model-comparison.md) โ€” flagship, cost-effective, free, open-weight +- [Pricing Comparison](docs/pricing-comparison.md) โ€” side-by-side pricing across providers +- [Cached Pricing](docs/cached-pricing.md) โ€” 1,374 models with prompt caching, 50-90% input cost savings +- [Context Window Comparison](docs/context-windows.md) โ€” largest context windows, best value +- [Large Context Models](docs/large-context-models.md) โ€” 2,195 models with 128K+ context, 397 with 1M+ +- [Small & Edge Models](docs/small-models.md) โ€” 1,153 models under 10B params for on-device use +- [Provider Comparison](docs/provider-comparison.md) โ€” top 30 providers by model count and capabilities +- [Migration Guide](docs/migration-guide.md) โ€” switch 
providers with pricing, API compatibility, checklist +- [OpenAI Alternatives](docs/openai-alternatives.md) โ€” GPT-4/GPT-3.5 alternatives, free options, OpenAI-compatible providers +- [Agentic Models](docs/agentic-models.md) โ€” 1,080 models with tool_call + reasoning for AI agents +- [Code Models](docs/code-models.md) โ€” 189 code-focused models for generation, review, debugging +- [Audio Models](docs/audio-models.md) โ€” 118 audio input + 34 audio output models for speech/voice +- [Free AI Models](docs/free-models.md) โ€” 81 free models by capability +- [Open-Weight Models](docs/open-weights.md) โ€” 513 open-weight models +- [Reasoning Models](docs/reasoning-models.md) โ€” 1,306 reasoning models +- [Tool Calling Models](docs/tool-calling.md) โ€” 2,350 tool-calling models +- [Vision Models](docs/vision-models.md) โ€” 1,487 vision models +- [Image Generation](docs/image-generation.md) โ€” 28 image generation models +- [Audio Models](docs/audio-models.md) โ€” 118 audio input + 34 audio output models +- [Code Models](docs/code-models.md) โ€” 189 code-focused models across 41 providers +- [Agentic Models](docs/agentic-models.md) โ€” models with tool calling + reasoning for AI agents +- [Chat Models](docs/chat-models.md) โ€” 2,350 models with tool calling for chat applications +- [Multimodal Models](docs/multimodal-models.md) โ€” 1,519 models with image/audio/video input +- [Embedding Models](docs/embedding-models.md) โ€” 5 embedding models for search, RAG, similarity +- [Video Models](docs/video-models.md) โ€” 167 video input + 4 video output models +- [Structured Output](docs/structured-output.md) โ€” 829 JSON-mode models +- [Modality Matrix](docs/modality-matrix.md) โ€” vision, image gen, audio, video +- [Provider Overview](docs/providers.md) โ€” all 95 providers by type and market +- [Data Schema Reference](docs/data-schema.md) โ€” complete YAML schema +- [Data Acquisition](docs/data-acquisition.md) โ€” how we acquire and update data +- [Design 
Principles](docs/lessons-learned.md) โ€” lessons learned + +## Design Principles + +- **First-party data only** โ€” all model data comes from the provider's own API or website +- **Dynamic discovery** โ€” scrape functions discover models from the source, not from hardcoded lists +- **Include deprecated, exclude retired** โ€” deprecated models are included with `deprecated: true`; retired (inaccessible) models are excluded +- **Never fabricate data** โ€” if required data is missing, skip the model with a warning rather than filling in guessed values +- **YAML source format** โ€” human-readable, supports comments, machine-parseable +- **Snapshot inheritance** โ€” dated model versions are nested within the parent model, inheriting all fields + +## Adding a New Provider + +1. Create `providers//scrape.ts` with a `scrape()` function that returns `{ provider, models }` +2. Data must come from a first-party source (provider's API or website) +3. Include a discovery step โ€” no hardcoded model ID lists +4. Run `npx tsx scripts/sync.ts ` to generate initial data +5. 
Validate with `npx tsx scripts/validate.ts` + +## CLI Tools + +```bash +# Validate all YAML data +npx tsx scripts/validate.ts + +# Compute catalog statistics +npx tsx scripts/stats.ts # table format +npx tsx scripts/stats.ts json # JSON format + +# Compile to models.json +npx tsx scripts/compile.ts + +# Sync data from providers +npx tsx scripts/sync.ts openai # single provider +npx tsx scripts/sync.ts # all providers + +# Export to CSV +npx tsx scripts/export-csv.ts +``` +## SEO Comparison Pages +- Best AI Models: site/best-ai-models.html +- Free AI Models: site/free-ai-models.html +- LLM Pricing: site/llm-pricing.html +- OpenAI Alternatives: site/openai-alternatives.html +- AI Models by Provider: site/ai-models-by-provider.html +- Context Window Comparison: site/context-window-comparison.html +- Best AI Models for Coding: site/best-ai-models-for-coding.html +- Best AI Models for Agents: site/best-ai-models-for-agents.html +- Reasoning Models Comparison: site/reasoning-models-comparison.html +- Cheapest AI Models: site/cheapest-ai-models.html +- Tool Calling Models Comparison: site/tool-calling-models-comparison.html +- AI Model Pricing Calculator: site/ai-model-pricing-calculator.html +- Best AI Models for Image Generation: site/best-ai-models-for-image-generation.html +- Best AI Models for Vision: site/best-ai-models-for-vision.html +- Structured Output Models Comparison: site/structured-output-models-comparison.html +- Open Source AI Models: site/open-source-ai-models.html +- Multimodal AI Models: site/multimodal-ai-models.html +- State of AI Models 2025: site/state-of-ai-models.html +- AI Model Benchmarks Comparison: site/ai-model-benchmarks.html +- ChatGPT vs Claude vs Gemini: site/chatgpt-vs-claude-vs-gemini.html +- AI Model Comparison Chart: site/ai-model-comparison-chart.html +- State of AI Models 2025: site/state-of-ai-models.html +- AI Model Benchmarks Comparison: site/ai-model-benchmarks.html +- ChatGPT vs Claude vs Gemini: 
site/chatgpt-vs-claude-vs-gemini.html +- AI Model Comparison Chart: site/ai-model-comparison-chart.html diff --git a/llms.txt b/llms.txt new file mode 100644 index 00000000..c2411c39 --- /dev/null +++ b/llms.txt @@ -0,0 +1,416 @@ +# AI Models Catalog + +> Structured YAML catalog of 4,587 AI models across 95 providers โ€” pricing, context windows, modalities, capabilities. First-party data only. npm package available. + +## What is this? + +A machine-readable YAML catalog of every major AI model provider and their models. Every data point comes from the provider's own API or documentation, never third-party aggregators. + +## Key Stats + +- 95 providers +- 4,587 model files +- 2,712 unique model IDs +- 441 model families +- 1,306 reasoning models +- 2,350 tool-calling models +- 527 open-weight models +- 81 free models +- 1,487 vision models +- 829 structured output models +- 28 image generation models +- 118 audio input models +- 167 video input models + +## Install + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types +``` + +## Download + +```bash +# JSON โ€” full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv + +# CDN (no install, CORS-enabled, always up-to-date) +curl -s https://cdn.jsdelivr.net/npm/ai-models@latest/models.json | jq '.models | length' +``` + +## Data Format + +Each model is a single YAML file at `providers//models/.yaml`: + +```yaml +id: gpt-4.1 +name: GPT-4.1 +family: gpt-4.1 +tool_call: true +structured_output: true +pricing: + input: 2.0 + output: 8.0 + cache_read: 0.5 +limit: + context: 1047576 + output: 32768 +modalities: + input: [text, image] + output: [text] +release_date: "2026-05-18" +last_updated: "2026-05-18" +``` 
+ +## Pricing Types + +| Type | When | Example | +| -------------- | ------------------------- | ------------------------------- | +| `TokenPricing` | Per-million-token pricing | `input: 2.5, output: 10` | +| `VideoPricing` | Per-second pricing | `unit: per_second, price: 0.03` | +| `UnitPricing` | Per-image or per-request | `unit: per_image, price: 0.04` | +| `FreePricing` | No cost | `unit: free` | + +## Covered Providers + +OpenAI, Anthropic, Google, Meta, DeepSeek, Alibaba Cloud, Mistral, xAI, Cohere, NVIDIA, IBM, Microsoft, Amazon Bedrock, Azure OpenAI, Google Vertex AI, OpenRouter, Together AI, Fireworks AI, Groq, Cerebras, DeepInfra, SiliconFlow, Novita AI, SambaNova, Cloudflare Workers AI, Chutes, Kluster AI, NanoGPT, and 65+ more. + +Full list: 01.AI, 302.AI, AI21 Labs, AIHubMix, AI/ML API, Aion Labs, Alibaba Cloud, Amazon Bedrock, Amazon Nova, Anthropic, Arcee AI, Auriko, Azure OpenAI, Baichuan AI, Baidu, Baseten, Berget, ByteDance, Cerebras, Chutes, Clarifai, CloudFerro Sherlock, Cloudflare Workers AI, Cohere, Cortecs, DInference, Databricks, DeepInfra, DeepSeek, DigitalOcean, evroc, FastRouter, Fireworks AI, FriendliAI, GMI Cloud, Google, Google Vertex AI, Groq, HPC-AI Cloud, Hyperbolic, IBM Granite, iFlytek SparkDesk, Inception Labs, InclusionAI, Inference.net, Kluster AI, LLM Gateway, Martian, MegaNova, Meta Llama, Microsoft Phi, MiniMax, Mistral AI, Mixlayer, MoArk AI, Moonshot AI, Morph, NanoGPT, Nebius, NeuralWatt, Nous Research, Novita AI, NVIDIA, OpenAI, OpenRouter, OrcaRouter, OVHcloud, PPIO, Perplexity, Privatemode AI, Qiniu AI, Regolo, Reka AI, Requesty, SambaNova, Sarvam AI, Scaleway, SiliconFlow, SiliconFlow CN, StepFun, SubModel, Tencent Cloud TokenHub, Tencent Hunyuan, TextSynth, Together AI, Upstage, Venice AI, Voyage AI, Vultr, Wafer, Writer, xAI Grok, Xiaomi, Zhipu AI, 接口 AI + +## Data Schema + +### Model Schema (Required Fields) + +| Field | Type | Description | Example | +| -------------- | ------- | 
---------------------------------------- | ------------------------------------------ | +| `id` | string | Stable model ID (no date suffix) | `gpt-4o`, `claude-sonnet-4-5` | +| `name` | string | Display name | `GPT-4o`, `Claude Sonnet 4.5` | +| `family` | string | Model family (broad lineage) | `gpt-4o`, `claude-sonnet` | +| `pricing` | Pricing | Model pricing (see below) | โ€” | +| `modalities` | object | Input/output modalities | `{ input: [text, image], output: [text] }` | +| `last_updated` | string | Last data update (YYYY-MM-DD or YYYY-MM) | `2024-08-06` | + +### Model Schema (Optional Fields) + +| Field | Type | Default | Description | Example | +| ------------------- | ------- | ------- | -------------------------------- | ------------------------------------ | +| `reasoning` | boolean | `false` | Supports reasoning/thinking mode | `true` | +| `temperature` | boolean | `true` | Supports temperature parameter | `false` | +| `tool_call` | boolean | `false` | Supports tool/function calling | `true` | +| `attachment` | boolean | `false` | Supports file attachments | `true` | +| `structured_output` | boolean | `false` | Supports structured/JSON output | `true` | +| `open_weights` | boolean | `false` | Open-weight model | `true` | +| `deprecated` | boolean | `false` | Deprecated but still accessible | `true` | +| `limit` | object | โ€” | Token limits | `{ context: 128000, output: 16384 }` | +| `knowledge` | string | โ€” | Training data cutoff | `2023-10` | +| `release_date` | string | โ€” | Model release date | `2024-05-13` | +| `snapshots` | array | โ€” | Dated model versions | See below | + +### Modality Types + +| Modality | Description | +| -------- | --------------------- | +| `text` | Text input or output | +| `image` | Image input or output | +| `video` | Video input | +| `audio` | Audio input or output | +| `pdf` | PDF document input | + +### Pricing Schema + +Pricing is a union of four types: + +**TokenPricing** (most common โ€” per-million-token 
pricing): + +```yaml +pricing: + input: 2.5 # $/M input tokens + output: 10 # $/M output tokens + cache_write: 1.25 # optional + cache_read: 0.625 # optional +``` + +**VideoPricing** (per-second, optionally tiered by resolution): + +```yaml +pricing: + unit: per_second + price: 0.03 +``` + +**UnitPricing** (per-image or per-request): + +```yaml +pricing: + unit: per_image + price: 0.04 +``` + +**FreePricing** (no cost): + +```yaml +pricing: + unit: free +``` + +### Snapshot Schema + +Snapshots represent dated versions of a model. They inherit all parent fields and only override what differs: + +```yaml +id: gpt-4o +name: GPT-4o +snapshots: + - id: gpt-4o-2024-08-06 + last_updated: "2024-08-06" + - id: gpt-4o-2024-05-13 + deprecated: true + last_updated: "2024-05-13" +``` + +### Provider Schema + +Each provider has a `provider.yaml` file: + +| Field | Type | Required | Description | Example | +| ---------------- | ------ | -------- | ------------------------------------ | ---------------------------------- | +| `id` | string | โœ… | Provider ID (matches directory name) | `openai` | +| `name` | string | โœ… | Display name | `OpenAI` | +| `url` | string | โœ… | Official website URL | `https://openai.com` | +| `api_docs` | string | โŒ | API documentation URL | `https://platform.openai.com/docs` | +| `apis` | object | โœ… | API endpoints keyed by format | See below | +| `apis.openai` | string | โŒ | OpenAI-compatible API endpoint | `https://api.openai.com/v1` | +| `apis.anthropic` | string | โŒ | Anthropic API endpoint | โ€” | +| `apis.google` | string | โŒ | Google AI API endpoint | โ€” | +| `currency` | string | โŒ | Default currency (USD/CNY/EUR) | `USD` | + +## Quick Start + +### Find the cheapest model + +โ†’ See [Pricing Comparison](docs/pricing-comparison.md) + +**Cheapest models with tool calling:** + +| Model | Provider | Input (per 1M tokens) | Output (per 1M tokens) | +| ---------------- | ------------- | --------------------: | ---------------------: | 
+| DeepSeek-V3 | DeepSeek | $0.27 | $1.10 | +| Qwen3-235B-A22B | Alibaba Cloud | $0.14 | $0.42 | +| Llama 4 Maverick | Together AI | $0.20 | $0.80 | + +### Find the most capable model + +โ†’ See [Model Comparison](docs/model-comparison.md) + +**Top-tier flagships:** + +| Model | Context | Tool Call | Vision | Input $/1M | Output $/1M | +| -------------- | ------- | --------- | ------ | ---------: | ----------: | +| GPT-4.1 | 1M | โœ… | โœ… | $2.00 | $8.00 | +| Claude Opus 4 | 200K | โœ… | โœ… | $15.00 | $75.00 | +| Gemini 2.5 Pro | 1M | โœ… | โœ… | $1.25 | $10.00 | + +### Find a free model + +โ†’ See [Free AI Models](docs/free-models.md) + +- Google Gemini 2.0 Flash (1M context, tool calling, vision, reasoning) +- 70+ models on Chutes (Llama 4, Qwen3, DeepSeek-R1, etc.) + +### Find the largest context window + +โ†’ See [Context Window Comparison](docs/context-windows.md) + +| Model | Context Window | +| --------------- | -------------: | +| Llama 4 Scout | 10M tokens | +| Gemini 2.5 Pro | 1M tokens | +| GPT-4.1 | ~1M tokens | + +## Programmatic Access + +### npm package + +```bash +npm install ai-models +``` + +```typescript +import catalog from "ai-models"; // 4,587 models as JSON +import type { Model } from "ai-models"; // TypeScript types + +// Find models with tool calling under $1/1M input +const affordable = catalog.models.filter((m) => m.tool_call && m.pricing.input < 1); +``` + +### Download data files + +```bash +# JSON โ€” full metadata (2.3 MB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.json + +# CSV โ€” flat table for Excel/Google Sheets (560 KB) +curl -LO https://github.com/i-need-token/ai-models/releases/latest/download/models.csv +``` + +### Python usage + +```python +import json + +with open("models.json") as f: + catalog = json.load(f) + +# Find all reasoning models +reasoning = [m for m in catalog["models"] if m.get("reasoning")] + +# Find models with largest context windows +by_context = sorted( + 
catalog["models"], + key=lambda m: (m.get("limit", {}) or {}).get("context", 0), + reverse=True, +)[:10] +``` + +### JSON structure + +```json +{ + "generated_at": "2026-05-21T02:13:04.076Z", + "stats": { + "providers": 95, + "models": 4587, + "unique_model_ids": 2712, + "families": 441 + }, + "providers": { + "openai": { "name": "OpenAI", "model_count": 28 }, + "anthropic": { "name": "Anthropic", "model_count": 11 } + }, + "models": [ + { + "id": "gpt-4.1", + "name": "GPT-4.1", + "family": "gpt-4.1", + "provider": "openai", + "tool_call": true, + "structured_output": true, + "pricing": { "input": 2, "output": 8, "cache_read": 0.5 }, + "limit": { "context": 1047576, "output": 32768 }, + "modalities": { "input": ["text", "image"], "output": ["text"] } + } + ] +} +``` + +## Documentation + +- [Quick Start](docs/quick-start.md) — find the right model in 30 seconds +- [Model Selection Guide](docs/model-selection.md) — decision framework: free, best value, large context models +- [Model Selection Cheatsheet](docs/model-selection-cheatsheet.md) +- [AI Model Picker](docs/ai-model-picker.md) — quick-reference: best model by budget and use case +- [Small Language Models Guide](docs/small-language-models.md) — 2,002 SLMs for edge, mobile, and cost-efficient production +- [Benchmarks & Leaderboards](docs/benchmarks.md) — key benchmarks, leaderboard landscape, interpretation guide +- [API & Programmatic Access](docs/api.md) — download models.json, code examples +- [Code Examples](docs/code-examples.md) — practical examples in TypeScript, Python, Go, Rust, jq +- [FAQ](docs/faq.md) — frequently asked questions about the catalog, data, and contributing +- [Glossary](docs/glossary.md) — key terms and definitions for AI model terminology +- [Model Comparison](docs/model-comparison.md) — flagship, cost-effective, free, open-weight +- [Pricing Comparison](docs/pricing-comparison.md) — side-by-side pricing across providers +- [Cached 
Pricing](docs/cached-pricing.md) — 1,374 models with prompt caching, 50-90% input cost savings +- [Context Window Comparison](docs/context-windows.md) — largest context windows, best value +- [Large Context Models](docs/large-context-models.md) — 2,195 models with 128K+ context, 397 with 1M+ +- [Small & Edge Models](docs/small-models.md) — 1,153 models under 10B params for on-device use +- [Provider Comparison](docs/provider-comparison.md) — top 30 providers by model count and capabilities +- [Migration Guide](docs/migration-guide.md) — switch providers with pricing, API compatibility, checklist +- [OpenAI Alternatives](docs/openai-alternatives.md) — GPT-4/GPT-3.5 alternatives, free options, OpenAI-compatible providers +- [Agentic Models](docs/agentic-models.md) — 1,080 models with tool_call + reasoning for AI agents +- [Code Models](docs/code-models.md) — 189 code-focused models for generation, review, debugging +- [Audio Models](docs/audio-models.md) — 118 audio input + 34 audio output models for speech/voice +- [Free AI Models](docs/free-models.md) — 81 free models by capability +- [Open-Weight Models](docs/open-weights.md) — 513 open-weight models +- [Reasoning Models](docs/reasoning-models.md) — 1,306 reasoning models +- [Tool Calling Models](docs/tool-calling.md) — 2,350 tool-calling models +- [Vision Models](docs/vision-models.md) — 1,487 vision models +- [Image Generation](docs/image-generation.md) — 28 image generation models +- [Audio Models](docs/audio-models.md) — 118 audio input + 34 audio output models +- [Code Models](docs/code-models.md) — 189 code-focused models across 41 providers +- [Agentic Models](docs/agentic-models.md) — models with tool calling + reasoning for AI agents +- [Chat Models](docs/chat-models.md) — 2,350 models with tool calling for chat applications +- [Multimodal Models](docs/multimodal-models.md) — 1,519 models with image/audio/video input +- [Embedding Models](docs/embedding-models.md) 
— 5 embedding models for search, RAG, similarity +- [Video Models](docs/video-models.md) — 167 video input + 4 video output models +- [Structured Output](docs/structured-output.md) — 829 JSON-mode models +- [Modality Matrix](docs/modality-matrix.md) — vision, image gen, audio, video +- [Provider Overview](docs/providers.md) — all 95 providers by type and market +- [Data Schema Reference](docs/data-schema.md) — complete YAML schema +- [Data Acquisition](docs/data-acquisition.md) — how we acquire and update data +- [Design Principles](docs/lessons-learned.md) — lessons learned + +## Design Principles + +- **First-party data only** — all model data comes from the provider's own API or website +- **Dynamic discovery** — scrape functions discover models from the source, not from hardcoded lists +- **Include deprecated, exclude retired** — deprecated models are included with `deprecated: true`; retired (inaccessible) models are excluded +- **Never fabricate data** — if required data is missing, skip the model with a warning rather than filling in guessed values +- **YAML source format** — human-readable, supports comments, machine-parseable +- **Snapshot inheritance** — dated model versions are nested within the parent model, inheriting all fields + +## Adding a New Provider + +1. Create `providers/<provider-id>/scrape.ts` with a `scrape()` function that returns `{ provider, models }` +2. Data must come from a first-party source (provider's API or website) +3. Include a discovery step — no hardcoded model ID lists +4. Run `npx tsx scripts/sync.ts <provider-id>` to generate initial data +5. 
Validate with `npx tsx scripts/validate.ts` + +## CLI Tools + +```bash +# Validate all YAML data +npx tsx scripts/validate.ts + +# Compute catalog statistics +npx tsx scripts/stats.ts # table format +npx tsx scripts/stats.ts json # JSON format + +# Compile to models.json +npx tsx scripts/compile.ts + +# Sync data from providers +npx tsx scripts/sync.ts openai # single provider +npx tsx scripts/sync.ts # all providers + +# Export to CSV +npx tsx scripts/export-csv.ts +``` +## SEO Comparison Pages +- Best AI Models: site/best-ai-models.html +- Free AI Models: site/free-ai-models.html +- LLM Pricing: site/llm-pricing.html +- OpenAI Alternatives: site/openai-alternatives.html +- AI Models by Provider: site/ai-models-by-provider.html +- Context Window Comparison: site/context-window-comparison.html +- Best AI Models for Coding: site/best-ai-models-for-coding.html +- Best AI Models for Agents: site/best-ai-models-for-agents.html +- Reasoning Models Comparison: site/reasoning-models-comparison.html +- Cheapest AI Models: site/cheapest-ai-models.html +- Tool Calling Models Comparison: site/tool-calling-models-comparison.html +- AI Model Pricing Calculator: site/ai-model-pricing-calculator.html +- Best AI Models for Image Generation: site/best-ai-models-for-image-generation.html +- Best AI Models for Vision: site/best-ai-models-for-vision.html +- Structured Output Models Comparison: site/structured-output-models-comparison.html +- Open Source AI Models: site/open-source-ai-models.html +- Multimodal AI Models: site/multimodal-ai-models.html +- State of AI Models 2025: site/state-of-ai-models.html +- AI Model Benchmarks Comparison: site/ai-model-benchmarks.html +- ChatGPT vs Claude vs Gemini: site/chatgpt-vs-claude-vs-gemini.html +- AI Model Comparison Chart: site/ai-model-comparison-chart.html diff --git a/package-lock.json b/package-lock.json index 6a9b3687..7be227c6 100644 --- a/package-lock.json +++ b/package-lock.json @@ -1,30 +1,30 @@ { "name": "ai-models", - "version": 
"0.1.0", + "version": "0.2.2", "lockfileVersion": 3, "requires": true, "packages": { "": { "name": "ai-models", - "version": "0.1.0", + "version": "0.2.2", "license": "MIT", "dependencies": { "linkedom": "^0.18.12", - "yaml": "^2.7.0", + "yaml": "^2.9.0", "zod": "^3.24.0" }, "devDependencies": { - "@types/node": "^25.6.0", + "@types/node": "^25.9.1", "husky": "^9.1.7", - "oxfmt": "^0.48.0", - "oxlint": "^1.63.0", - "typescript": "^5.7.0" + "oxfmt": "^0.51.0", + "oxlint": "^1.66.0", + "typescript": "^6.0.3" } }, "node_modules/@oxfmt/binding-android-arm-eabi": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-android-arm-eabi/-/binding-android-arm-eabi-0.48.0.tgz", - "integrity": "sha512-uwqk+/KhQvBIpULD8SMM/zAafMRC/+DV/xsEQjkkIsJ/kLmEI/2bxonVowcYTiXqqZ/a0FEW8DPkZY3VvwELDA==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-android-arm-eabi/-/binding-android-arm-eabi-0.51.0.tgz", + "integrity": "sha512-Ni0sCqg5CIHaLIYFGj+ncbcumylvNC6FE4rfD0KfdmnWHbPJ+zev0qZCXKxy2hFVa0fYRK0yPzf5nzPbkZou7g==", "cpu": [ "arm" ], @@ -39,9 +39,9 @@ } }, "node_modules/@oxfmt/binding-android-arm64": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-android-arm64/-/binding-android-arm64-0.48.0.tgz", - "integrity": "sha512-VUCiKuXK5+McVssgHEJdrcGK7hRJzrRb36zm9/jwzMholyYt4BgXhw5Nm1V1DX6Ce717Zi/1jk432b/tgmQgtQ==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-android-arm64/-/binding-android-arm64-0.51.0.tgz", + "integrity": "sha512-eu5lAZjuo0KAkp+M24EhDqfOwA8owQ8d7wyBlOUUGRbDLHpU3IRlDHp8Dif+YqGlxs6jra7yS6WQu/NkPhAxeg==", "cpu": [ "arm64" ], @@ -56,9 +56,9 @@ } }, "node_modules/@oxfmt/binding-darwin-arm64": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-darwin-arm64/-/binding-darwin-arm64-0.48.0.tgz", - "integrity": "sha512-IkKp8rnIyQLW6Jt+6jragCbUVYSayk55lapiprLjIVvt4NczLyO/nwX2GgefLQ5iaBdfS8UEAFgCs/pLO6Cl0w==", + "version": 
"0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-darwin-arm64/-/binding-darwin-arm64-0.51.0.tgz", + "integrity": "sha512-6LsUNIdURhhcIfIn8+xsOb61mSTa9msAHTeSGx9Jf4rsP/gN8PGCF+SKWPAQZbND2w/WBkqQ6303jqEEIXzMdQ==", "cpu": [ "arm64" ], @@ -73,9 +73,9 @@ } }, "node_modules/@oxfmt/binding-darwin-x64": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-darwin-x64/-/binding-darwin-x64-0.48.0.tgz", - "integrity": "sha512-+aFuhsGIuvnoOjXyKVHMhPKJZR1kQkAl8QyrKoMlA7yJsSTC3N0Asl53La8TChSHhW8epToQ/Q0nvLmEmfNmLg==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-darwin-x64/-/binding-darwin-x64-0.51.0.tgz", + "integrity": "sha512-9aUMGmVxdHjYMsEAW1tNRoieTJXlVNDFkRvIR1J7LttJXWjVYCu2ekclLij2KJtxBxSQOYSHd12ME/adVGVbZg==", "cpu": [ "x64" ], @@ -90,9 +90,9 @@ } }, "node_modules/@oxfmt/binding-freebsd-x64": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-freebsd-x64/-/binding-freebsd-x64-0.48.0.tgz", - "integrity": "sha512-fbqzQL8FjI9gGnktI7RIo0dksDziTAYBy7xlI7jU7eID5fxLF/25fS4Xj6GydD8Y5oWHL83U4NK160QaOAxtyg==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-freebsd-x64/-/binding-freebsd-x64-0.51.0.tgz", + "integrity": "sha512-mkY1nhZTqYb+NHaAWxOCKISN6FwdrwMNsu17vTUA3wzUV2VJ+Paq15ZokRcsMU/2PUdHO73prxyeJpjXQ3MPpQ==", "cpu": [ "x64" ], @@ -107,9 +107,9 @@ } }, "node_modules/@oxfmt/binding-linux-arm-gnueabihf": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm-gnueabihf/-/binding-linux-arm-gnueabihf-0.48.0.tgz", - "integrity": "sha512-hn4i0zhAyTiB3ZHjQfYUZkDvrbVkohw1S7pySWxWUoZ87HnkDoTFThj7QTxk40hNPOTUP0vHbPRNamFIv1HBJQ==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm-gnueabihf/-/binding-linux-arm-gnueabihf-0.51.0.tgz", + "integrity": "sha512-wtFwNwE4+YCNuPaWoGDZeGsKvD6D1YSUNBJNn/rJBh7CrDBThFE+TBI5kY7vRW9rIOQRsbW2IpyyL3Du4Zqwiw==", "cpu": [ "arm" ], @@ 
-124,9 +124,9 @@ } }, "node_modules/@oxfmt/binding-linux-arm-musleabihf": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm-musleabihf/-/binding-linux-arm-musleabihf-0.48.0.tgz", - "integrity": "sha512-R4WBD9qF3QM9hqgdAa+fBGXmquTvDUujrPQ36t2Sjk8RPOSKGHDeN7l/khr10hqbQaOq9KCgPHG9ubNET/X/RQ==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm-musleabihf/-/binding-linux-arm-musleabihf-0.51.0.tgz", + "integrity": "sha512-rnOaNx86G7iRKM6lsCIQMux0SMGNC/TEbFR+r7lpruJ12bnrIWgxd5w1PLqOvgR9r8ZJbpK/zfRKctJnh8/Jfg==", "cpu": [ "arm" ], @@ -141,9 +141,9 @@ } }, "node_modules/@oxfmt/binding-linux-arm64-gnu": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm64-gnu/-/binding-linux-arm64-gnu-0.48.0.tgz", - "integrity": "sha512-5bVdwSwlm1M8wbYCorLOxWxUBw/8tBvHYyQNIfwWVPwOJaj5vg1APSGJQVpwJfV5VNE9PSrR91UKEpoNwHhqUA==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm64-gnu/-/binding-linux-arm64-gnu-0.51.0.tgz", + "integrity": "sha512-jOgDzSqWcICGRjsp4mc08FxKMN8vzP2Kgs4E0d2HUP99F+nJDQKklRV4Zuj+0gcBgjrzx2CbpqaIdUVPepCojA==", "cpu": [ "arm64" ], @@ -158,9 +158,9 @@ } }, "node_modules/@oxfmt/binding-linux-arm64-musl": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm64-musl/-/binding-linux-arm64-musl-0.48.0.tgz", - "integrity": "sha512-vCS3Fk7gFslTqE1lUE2IlroyVV7u/9SmMA/uBqDoshuck2psGWcjW0ePyPZI3rM3+qtf2pDaMVIKMHozraifuw==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-arm64-musl/-/binding-linux-arm64-musl-0.51.0.tgz", + "integrity": "sha512-KBUCdrH5bwVrAvI9gU/1S55oH6fzXjr++J/oVocdu7bYTks1l7DNNT+rLd/1TDdAEjObGwmfWamn7LC1m8A0DQ==", "cpu": [ "arm64" ], @@ -175,9 +175,9 @@ } }, "node_modules/@oxfmt/binding-linux-ppc64-gnu": { - "version": "0.48.0", - "resolved": 
"https://registry.npmjs.org/@oxfmt/binding-linux-ppc64-gnu/-/binding-linux-ppc64-gnu-0.48.0.tgz", - "integrity": "sha512-gKtfFfueUClXDumyoHUbymqRf7prHejOOyzJK0eIJn93GF9JBdFHdo60TM1ZBHxkEwZvjuOgHmKtneKbEOc/Eg==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-ppc64-gnu/-/binding-linux-ppc64-gnu-0.51.0.tgz", + "integrity": "sha512-NapfjYsABFqTJ1Dn9Efq6sN5esaHconVKwVLbDGNQLrwpOx/g17mkwErHzU72PutL67nf3wNAkbq122H+zLxag==", "cpu": [ "ppc64" ], @@ -192,9 +192,9 @@ } }, "node_modules/@oxfmt/binding-linux-riscv64-gnu": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-riscv64-gnu/-/binding-linux-riscv64-gnu-0.48.0.tgz", - "integrity": "sha512-SYt0UhOvZD/UwZz9sXq6J2uAw8o24f5VZpLB2DH01f6MevshmlgakQlZe2lwek2sZJkd07eLu7mZa0g7yeiw7Q==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-riscv64-gnu/-/binding-linux-riscv64-gnu-0.51.0.tgz", + "integrity": "sha512-5dlDt1dUZCVi6elIhiK1PWg9wpTzTcIuj0IZnSurvIoMrhOWqqTcc1dSTxcSkNaBZhfsNqRZdINI1zAgbKkJNQ==", "cpu": [ "riscv64" ], @@ -209,9 +209,9 @@ } }, "node_modules/@oxfmt/binding-linux-riscv64-musl": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-riscv64-musl/-/binding-linux-riscv64-musl-0.48.0.tgz", - "integrity": "sha512-JLbrwck2AopG4ud/XklZO5N+qxGC7cS7ROvXZVNfx0MCLDDL2kGOLvzuWORkVjnjAM0CMAfIMU2zNBtQbM+4dw==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-riscv64-musl/-/binding-linux-riscv64-musl-0.51.0.tgz", + "integrity": "sha512-pgdWUJn0S5nulyiVdlFV8DzCUnGXkU99W5PSkkmbaZW+LrZBPxpezun4G0DDHbQaVYuJeCuKsXsGKGo77CkUTQ==", "cpu": [ "riscv64" ], @@ -226,9 +226,9 @@ } }, "node_modules/@oxfmt/binding-linux-s390x-gnu": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-s390x-gnu/-/binding-linux-s390x-gnu-0.48.0.tgz", - "integrity": 
"sha512-mdxt5L8OQLxkQH+JVpdC/lknZNe0lX4hlO3d8+xvw2wToo+iDrid9tiGOd5bmHfUVd5wVhrUry0qlu5vq66NkQ==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-s390x-gnu/-/binding-linux-s390x-gnu-0.51.0.tgz", + "integrity": "sha512-2XTFUe97CbDGAI8vjwDfZ1HdakO0XIADyJ24idEg64SC4/K4in/OisXVnrW4NMK7I6TgC7EqRhC0Ln/nKhAemA==", "cpu": [ "s390x" ], @@ -243,9 +243,9 @@ } }, "node_modules/@oxfmt/binding-linux-x64-gnu": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-x64-gnu/-/binding-linux-x64-gnu-0.48.0.tgz", - "integrity": "sha512-oEz1BQwMrV7OMEFx/3VPDU3n9TM0AnxpktDYXjEg5i6nTX87wo18wSfBvkl4tzAICdKtoAQAdBIl7Y7hsPlx5w==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-x64-gnu/-/binding-linux-x64-gnu-0.51.0.tgz", + "integrity": "sha512-kQ1OuCqqt/yyf0ZN9VFxW1/JnlgJgii3Dr7pWf9vNBvrX1hv6g39/+mc5oGRHRGJFZtl3zsGDWR9c5N2B/gwBw==", "cpu": [ "x64" ], @@ -260,9 +260,9 @@ } }, "node_modules/@oxfmt/binding-linux-x64-musl": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-x64-musl/-/binding-linux-x64-musl-0.48.0.tgz", - "integrity": "sha512-g2SKTTurP5mWjd8Ecait0erYqmltL4IqW1EwttM25BxM6NiTt4ubobJYMR1uox1V2QgG4UfHH10CGRvWlUixjw==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-linux-x64-musl/-/binding-linux-x64-musl-0.51.0.tgz", + "integrity": "sha512-ARTYqxHF475o96Gbn41hvSWSSRygPlRDXZZgZ9I2scU1y0qiWpCQyZCoefaQa0mwv+wwtZ+luS4YOzsRzM/izg==", "cpu": [ "x64" ], @@ -277,9 +277,9 @@ } }, "node_modules/@oxfmt/binding-openharmony-arm64": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-openharmony-arm64/-/binding-openharmony-arm64-0.48.0.tgz", - "integrity": "sha512-CIg24VgheEpvolHL2gQuax5qcQ602bRMHrJ9g8XsQr3iVj9aSPgopigBKuMqrXsupwkrU+RQCn5cG8PgFntR6w==", + "version": "0.51.0", + "resolved": 
"https://registry.npmjs.org/@oxfmt/binding-openharmony-arm64/-/binding-openharmony-arm64-0.51.0.tgz", + "integrity": "sha512-QiC1XrCl6a6BmqMzduO8hdIRMf1m44hCkt2Q68KWkTvUB/E7fd2iomyNh6KnnRca5w6eBrRAAtLFqTh+xjsjJA==", "cpu": [ "arm64" ], @@ -294,9 +294,9 @@ } }, "node_modules/@oxfmt/binding-win32-arm64-msvc": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-arm64-msvc/-/binding-win32-arm64-msvc-0.48.0.tgz", - "integrity": "sha512-zeaWkcxcEULwkGF3I/HgEvcDPN8buYDrxibBUa/IFh5Vmwyge+KpLO+hEwSovW349H0O/C0Z2kaFmEzEDm00/Q==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-arm64-msvc/-/binding-win32-arm64-msvc-0.51.0.tgz", + "integrity": "sha512-NC/hJb9dtU23Zf8L7IVK95xnFjiQ7AfcLO2l5pb69TDEr958qxrtnB2CveeeNSCBFNIkgaTCfd/vHNSoG78l9g==", "cpu": [ "arm64" ], @@ -311,9 +311,9 @@ } }, "node_modules/@oxfmt/binding-win32-ia32-msvc": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-ia32-msvc/-/binding-win32-ia32-msvc-0.48.0.tgz", - "integrity": "sha512-yiEKnIAGvx5CyZQOlMaNlZkAbwT7/Quk0j3WLt+PR5hK+qYjPTRRJYDfD77wCBPLvEYAG41v4KG3iL0H+uxoxg==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-ia32-msvc/-/binding-win32-ia32-msvc-0.51.0.tgz", + "integrity": "sha512-2C45za4Rj36n8YIbhRL1PQbxmXJYf81WEcAgvj5I4ptRROG+A+81hREEN5bmCHADE1UfYaN312U6tkILoZZy6w==", "cpu": [ "ia32" ], @@ -328,9 +328,9 @@ } }, "node_modules/@oxfmt/binding-win32-x64-msvc": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-x64-msvc/-/binding-win32-x64-msvc-0.48.0.tgz", - "integrity": "sha512-GSD2+7t2UoVMV2NgxXypa4bKewflPMAjYnF0Xw9/ht82ZfafAHhb8STwrEd7wlH2PFogt5zw3WVCxYJaHUdbeQ==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/@oxfmt/binding-win32-x64-msvc/-/binding-win32-x64-msvc-0.51.0.tgz", + "integrity": "sha512-73RqdAuVKQTkjZIDw08JaDHUM4lav5Qu+CaPwg4QbbA7k8o7LEW0p3UsfZ/F8dsO/pwVYh3RzFcanwLRTTahbQ==", "cpu": [ 
"x64" ], @@ -345,9 +345,9 @@ } }, "node_modules/@oxlint/binding-android-arm-eabi": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-android-arm-eabi/-/binding-android-arm-eabi-1.63.0.tgz", - "integrity": "sha512-A9xLtQt7i0OA1PoB/meog6kikXI9CdwEp7ZwQqmgnpKn3G3b1orvTDy8CQ6T7w1HvDrgWGB78PkFKcWgibcTCg==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-android-arm-eabi/-/binding-android-arm-eabi-1.66.0.tgz", + "integrity": "sha512-f7kq8N51T4phpzqfBpA2qaVTI/KrkCmNwaj3t/97I/WLTDI+UhlP5GL9eER+zVxBhtlx5rKXWByJU1/zDAvyaw==", "cpu": [ "arm" ], @@ -362,9 +362,9 @@ } }, "node_modules/@oxlint/binding-android-arm64": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-android-arm64/-/binding-android-arm64-1.63.0.tgz", - "integrity": "sha512-SQo+ZMvdR9l3CxZp5W5gFNxSiDxclY6lOzzNpKYLF8asESpm3Pwumx0gER5T7aHLF1/2BAAtLD3DiDkdgy4V1A==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-android-arm64/-/binding-android-arm64-1.66.0.tgz", + "integrity": "sha512-xu6QO71tdDS9mjmLZ3AqhtaVHBvdmsOKkYnReNNDgh+XiwnsipeQOIxbiYOOO0iAXycJ+GK0wdMSZP/2j/AmSg==", "cpu": [ "arm64" ], @@ -379,9 +379,9 @@ } }, "node_modules/@oxlint/binding-darwin-arm64": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-darwin-arm64/-/binding-darwin-arm64-1.63.0.tgz", - "integrity": "sha512-6W82XjJDTmMnjg30427l0dufpnyLoq7wEukKdM6/g2VIybRVuQiBVh43EA4b+UxZ3+tLcKm+Or/pXGNgLCEU8g==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-darwin-arm64/-/binding-darwin-arm64-1.66.0.tgz", + "integrity": "sha512-HZ24VimSOC7mxuEA99e0H2FS0C1yO3+iW13jPRAk+e2njsUs3QeAXsafCDyaIrV/MirdOVez+etQNQsJE43zNQ==", "cpu": [ "arm64" ], @@ -396,9 +396,9 @@ } }, "node_modules/@oxlint/binding-darwin-x64": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-darwin-x64/-/binding-darwin-x64-1.63.0.tgz", - "integrity": 
"sha512-CnWd/YCuVG5W1BYkjJEVbJG11o526O9qAwBEQM+nh8K19CRFUkFdROXCyYkGmroHEYQe4vgQ6+lh3550Lp35Xw==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-darwin-x64/-/binding-darwin-x64-1.66.0.tgz", + "integrity": "sha512-awhj8ZvJrrRSnXj7V++rpZvTmnl99L6mi0B7gg7Cp7BN6cKpzuI481bHNLvXGA9GB1/oEgA3ponuyoAc6Md12A==", "cpu": [ "x64" ], @@ -413,9 +413,9 @@ } }, "node_modules/@oxlint/binding-freebsd-x64": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-freebsd-x64/-/binding-freebsd-x64-1.63.0.tgz", - "integrity": "sha512-a4eZAqrmtajqcxfdAzC+l7g3PaE3V8hpAYqqeD3fTxLXOMFdK3eNTZrU80n4dDEVm0JXy1aL5PqvqWldBl6zYA==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-freebsd-x64/-/binding-freebsd-x64-1.66.0.tgz", + "integrity": "sha512-KQF0oVV21/FjIqkRuL8Q1vh8ECsE5+ocdH5tcqTQ4ZnYuDVoYibQUNfqBjQaUsP6UIIda5Y75Wpm5p4RgQWiWw==", "cpu": [ "x64" ], @@ -430,9 +430,9 @@ } }, "node_modules/@oxlint/binding-linux-arm-gnueabihf": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm-gnueabihf/-/binding-linux-arm-gnueabihf-1.63.0.tgz", - "integrity": "sha512-tYUtU9TdbU3uXF5D62g5zXJ13iniFGhXQx5vp9cyEjGdbSAY3VdFBSaldYvyoDmgMZ0ZYuwQP1Y4t2Fhejwa0w==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm-gnueabihf/-/binding-linux-arm-gnueabihf-1.66.0.tgz", + "integrity": "sha512-9u1rgwZSEXWb30vbFZzQ78HVXBo0WCKNwJ3a2InRUTNMRng+PUDIoSFmA+m4HdUfBaIqftShq8J8qHc+eE/Vig==", "cpu": [ "arm" ], @@ -447,9 +447,9 @@ } }, "node_modules/@oxlint/binding-linux-arm-musleabihf": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm-musleabihf/-/binding-linux-arm-musleabihf-1.63.0.tgz", - "integrity": "sha512-I5r3twFf776UZg9dmRo2xbrKt00tTkORXEVe0ctg4vdTkQvJAjiCHxnbAU2HL1AiJ9cqADA76MAliuilsAWnvg==", + "version": "1.66.0", + "resolved": 
"https://registry.npmjs.org/@oxlint/binding-linux-arm-musleabihf/-/binding-linux-arm-musleabihf-1.66.0.tgz", + "integrity": "sha512-Ynot2HR1bHxUaNWoC280MVTDfZuaWuP3XfSMRDhyuZrVjhzoaBCVFlw8h8qeZjWKVUBhPWFIxB7AQTlK8Z2WWg==", "cpu": [ "arm" ], @@ -464,9 +464,9 @@ } }, "node_modules/@oxlint/binding-linux-arm64-gnu": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm64-gnu/-/binding-linux-arm64-gnu-1.63.0.tgz", - "integrity": "sha512-t7ltUkg6FFh4b564QyGir8xIj/QZbXu8FlcRkcyW9+ztr/mfRHlvUOFd95pJCXi9s/L5DrUeWWgpXRS+V+6igQ==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm64-gnu/-/binding-linux-arm64-gnu-1.66.0.tgz", + "integrity": "sha512-xCbgzciGgo+A4aQZEknsNrNiIwY7sU5SfRuMmRjPIvZAgdF34cIHiKvwOsS5XRLjlTVSFwitmq6YclTtHTfU+g==", "cpu": [ "arm64" ], @@ -481,9 +481,9 @@ } }, "node_modules/@oxlint/binding-linux-arm64-musl": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm64-musl/-/binding-linux-arm64-musl-1.63.0.tgz", - "integrity": "sha512-Q5mmZy/XWjuYFUuQyYjOvZ5U/JkKEwnpir6hGxhh6HcdP0V/BKxLo8dqkfF/t7r7AguB17dfS/8+go5AQDRR6g==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-arm64-musl/-/binding-linux-arm64-musl-1.66.0.tgz", + "integrity": "sha512-hmo+ZB/lHkR1HdDmnziNpzSLmulnUSu10VEqX2Yex7OwvoBAbjJQLvy4gIBRV3AAwWnCvAxKp5Nv1GE6LU1QMg==", "cpu": [ "arm64" ], @@ -498,9 +498,9 @@ } }, "node_modules/@oxlint/binding-linux-ppc64-gnu": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-ppc64-gnu/-/binding-linux-ppc64-gnu-1.63.0.tgz", - "integrity": "sha512-uBGtuZ0TzLB4x5wVa82HGNvYqY8buwDhyCnCP0R0gkk9szqVsP0MeTtD5HX7EsEuFIt+aYmYxuxeVxs3nTSwtQ==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-ppc64-gnu/-/binding-linux-ppc64-gnu-1.66.0.tgz", + "integrity": 
"sha512-2Invd4Uyy81mVooQC5FBtfxSNrvcX1OxbMlVQ6M2erRrNI2awFYF26YNW2yFxdVFZ4ffNOWKghtMjhnUPsXsVA==", "cpu": [ "ppc64" ], @@ -515,9 +515,9 @@ } }, "node_modules/@oxlint/binding-linux-riscv64-gnu": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-riscv64-gnu/-/binding-linux-riscv64-gnu-1.63.0.tgz", - "integrity": "sha512-h4s6FwxE+9MeA181o0dnDwHP32Y/bG8EiB/vrD6Ib+AMt6haigDc/0bUtI/sLmQDBMJnUfaCmtSSrEAqjtEVrA==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-riscv64-gnu/-/binding-linux-riscv64-gnu-1.66.0.tgz", + "integrity": "sha512-s0iXPDQVdgayE3RGa/N2DZF7tjgg0TwEtD1sGoDxqPDGrIXgo45H0yHknT0f9A0yteASsweYZtDyTuVlM4aSag==", "cpu": [ "riscv64" ], @@ -532,9 +532,9 @@ } }, "node_modules/@oxlint/binding-linux-riscv64-musl": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-riscv64-musl/-/binding-linux-riscv64-musl-1.63.0.tgz", - "integrity": "sha512-2EaNcCBR8Mcjl5ARtuN3BdEpVkX7KpjSjMGZ/mJMIeaXgTtdz5ytg2VwygMSStA/k0ixfvZFoZOfjDEcouV5vQ==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-riscv64-musl/-/binding-linux-riscv64-musl-1.66.0.tgz", + "integrity": "sha512-OekL4XFiu7RPK0JIZi8VeHgtIXPREf42t8Cy/rKEsC+P3gcqDgNAAGiyuUOpdbG4wwbfue1q4CHcCO7spSve6w==", "cpu": [ "riscv64" ], @@ -549,9 +549,9 @@ } }, "node_modules/@oxlint/binding-linux-s390x-gnu": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-s390x-gnu/-/binding-linux-s390x-gnu-1.63.0.tgz", - "integrity": "sha512-p4hlf/fd7TrYYl3QrWWD0GocqJefwMu3cHQhmi2FvEB/YOvFb5DZN3SMBaPi7B1TM5DeypkEtrVib674q1KKPg==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-s390x-gnu/-/binding-linux-s390x-gnu-1.66.0.tgz", + "integrity": "sha512-Ga1D0kj1SFslm34ThA/BdkUlyAYEnTsXyRC4pF0C5agZSwtGdHYWMTQWemUfBGp4RCG4QWXgdO+HmmmKqOtlBg==", "cpu": [ "s390x" ], @@ -566,9 +566,9 @@ } }, 
"node_modules/@oxlint/binding-linux-x64-gnu": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-x64-gnu/-/binding-linux-x64-gnu-1.63.0.tgz", - "integrity": "sha512-Vgq9rkRVcPcjbcH+ihYTfpeR7vCXfqpd+z5ItTGc0yYUV59L5ceHYN1iV4H9bKGV7Rn5hkVc7x3mSvHegduENA==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-x64-gnu/-/binding-linux-x64-gnu-1.66.0.tgz", + "integrity": "sha512-p5jfP1wUZe/IC3qpQO84n9DRnf9g3lKRtLBlQq23ykyrDglHcVx7sWmVTlPuU6SBw8mNnPzyOn022G3XZHnlww==", "cpu": [ "x64" ], @@ -583,9 +583,9 @@ } }, "node_modules/@oxlint/binding-linux-x64-musl": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-x64-musl/-/binding-linux-x64-musl-1.63.0.tgz", - "integrity": "sha512-3/Lkq/ncooA61rorrC+ZQed1Bc4VpGj+WnGsp58zmxKgvZ2vhreu+dcVyr3mX8NUpq7mfZ4gDDTou/yrF1Pd7A==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-linux-x64-musl/-/binding-linux-x64-musl-1.66.0.tgz", + "integrity": "sha512-vUB/sYlYZorDL1ZD+o9mRv7zbsykrrFRtmgS6R8musZqLtrPRQn1gc1eGpuX+sfdccz42STl/AqldY6XRb2upQ==", "cpu": [ "x64" ], @@ -600,9 +600,9 @@ } }, "node_modules/@oxlint/binding-openharmony-arm64": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-openharmony-arm64/-/binding-openharmony-arm64-1.63.0.tgz", - "integrity": "sha512-0/EdD/6hDkx5Mfd769PTjvEM8mZ/6Dfukp1dBCL/2PjlIVGEtYdNZyok6ChqYPsT9JcFnlQnUeQzO0/1L/oC9w==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-openharmony-arm64/-/binding-openharmony-arm64-1.66.0.tgz", + "integrity": "sha512-yde+6p/F59xRkGR9H1HfngWRif1QRJjynZK349l+UI0H6w9hL3G8/AVaTHFyTtLVQ56qtNbX2/5Dc77n1ovnOg==", "cpu": [ "arm64" ], @@ -617,9 +617,9 @@ } }, "node_modules/@oxlint/binding-win32-arm64-msvc": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-arm64-msvc/-/binding-win32-arm64-msvc-1.63.0.tgz", - "integrity": 
"sha512-wb0CUkN8ngwPiRQBjD1Cj0LsHeNvm+Xt6YBHDMtj2DVQVD6Oj8Ri7g6BD+KICf6LaBqZlmzOvy6nF9E/8yyGOg==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-arm64-msvc/-/binding-win32-arm64-msvc-1.66.0.tgz", + "integrity": "sha512-O9GLucgoTdmOrbBX+EjzNe7o/Ze5TFOvXcib6bzUOtBOmj6cV+zw18NgB+cGKAkDw1Pdqs8vGkfHbbsLuDtXWg==", "cpu": [ "arm64" ], @@ -634,9 +634,9 @@ } }, "node_modules/@oxlint/binding-win32-ia32-msvc": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-ia32-msvc/-/binding-win32-ia32-msvc-1.63.0.tgz", - "integrity": "sha512-BX5iq+ovdNlVYhSn5qPMUIT0uwAwt2lmEnCnzK+Gkhw4DovIvhGb96OFhV8yzQNUnQxn/xGkOR+X+BLrLDNm8w==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-ia32-msvc/-/binding-win32-ia32-msvc-1.66.0.tgz", + "integrity": "sha512-m3Pjwc2MfTcom4E4gOv7DyuGyt7OfGNCbmqDHd+N7EzXmP+ppHuudm2NjcA3AjV5TSeGxaguVF4SbTKHe1USYA==", "cpu": [ "ia32" ], @@ -651,9 +651,9 @@ } }, "node_modules/@oxlint/binding-win32-x64-msvc": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-x64-msvc/-/binding-win32-x64-msvc-1.63.0.tgz", - "integrity": "sha512-QeN/WELOfsXMeYwxvfgQrl6CbVftYUCZsGXHjXQd5Trccm8+i4gmtxaOui4xbJQaiDlviF8F3yLSBloQUeFsfA==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/@oxlint/binding-win32-x64-msvc/-/binding-win32-x64-msvc-1.66.0.tgz", + "integrity": "sha512-/DbBvw8UFBhja6PqudUjV4UtfsJr0Oa7jUjWVKB0g86lj/VwnPrkngn0sFql3c9RDA0O16dh7ozsXb6GjNAzBQ==", "cpu": [ "x64" ], @@ -668,13 +668,13 @@ } }, "node_modules/@types/node": { - "version": "25.6.0", - "resolved": "https://registry.npmjs.org/@types/node/-/node-25.6.0.tgz", - "integrity": "sha512-+qIYRKdNYJwY3vRCZMdJbPLJAtGjQBudzZzdzwQYkEPQd+PJGixUL5QfvCLDaULoLv+RhT3LDkwEfKaAkgSmNQ==", + "version": "25.9.1", + "resolved": "https://registry.npmjs.org/@types/node/-/node-25.9.1.tgz", + "integrity": 
"sha512-xfrlY7UD5rMJk3ZVJP8BNzS28J36YJg+xp+LPXV1TdWxr8uMH5A860QNxYDGQe/ylDSgjxE52Q9VnO7p75tJxg==", "dev": true, "license": "MIT", "dependencies": { - "undici-types": "~7.19.0" + "undici-types": ">=7.24.0 <7.24.7" } }, "node_modules/boolbase": { @@ -874,9 +874,9 @@ } }, "node_modules/oxfmt": { - "version": "0.48.0", - "resolved": "https://registry.npmjs.org/oxfmt/-/oxfmt-0.48.0.tgz", - "integrity": "sha512-AVaLh+7XeGx+R1zfFV+f6VV61nT2MWVJXVUDhbTm5LBWGyNt64xAyh3NYYyjeY2WykNt9AvqSQLPHcbWquYF9g==", + "version": "0.51.0", + "resolved": "https://registry.npmjs.org/oxfmt/-/oxfmt-0.51.0.tgz", + "integrity": "sha512-l/AoAnaEOV7Q5/Z9kHOMDehVJnCgYN7wRoooWCTUMBMi16BJhLZqd9cmCnwcVFfVlzkt53zK2KLPFNp8vSsoDg==", "dev": true, "license": "MIT", "dependencies": { @@ -892,31 +892,39 @@ "url": "https://github.com/sponsors/Boshen" }, "optionalDependencies": { - "@oxfmt/binding-android-arm-eabi": "0.48.0", - "@oxfmt/binding-android-arm64": "0.48.0", - "@oxfmt/binding-darwin-arm64": "0.48.0", - "@oxfmt/binding-darwin-x64": "0.48.0", - "@oxfmt/binding-freebsd-x64": "0.48.0", - "@oxfmt/binding-linux-arm-gnueabihf": "0.48.0", - "@oxfmt/binding-linux-arm-musleabihf": "0.48.0", - "@oxfmt/binding-linux-arm64-gnu": "0.48.0", - "@oxfmt/binding-linux-arm64-musl": "0.48.0", - "@oxfmt/binding-linux-ppc64-gnu": "0.48.0", - "@oxfmt/binding-linux-riscv64-gnu": "0.48.0", - "@oxfmt/binding-linux-riscv64-musl": "0.48.0", - "@oxfmt/binding-linux-s390x-gnu": "0.48.0", - "@oxfmt/binding-linux-x64-gnu": "0.48.0", - "@oxfmt/binding-linux-x64-musl": "0.48.0", - "@oxfmt/binding-openharmony-arm64": "0.48.0", - "@oxfmt/binding-win32-arm64-msvc": "0.48.0", - "@oxfmt/binding-win32-ia32-msvc": "0.48.0", - "@oxfmt/binding-win32-x64-msvc": "0.48.0" + "@oxfmt/binding-android-arm-eabi": "0.51.0", + "@oxfmt/binding-android-arm64": "0.51.0", + "@oxfmt/binding-darwin-arm64": "0.51.0", + "@oxfmt/binding-darwin-x64": "0.51.0", + "@oxfmt/binding-freebsd-x64": "0.51.0", + "@oxfmt/binding-linux-arm-gnueabihf": "0.51.0", + 
"@oxfmt/binding-linux-arm-musleabihf": "0.51.0", + "@oxfmt/binding-linux-arm64-gnu": "0.51.0", + "@oxfmt/binding-linux-arm64-musl": "0.51.0", + "@oxfmt/binding-linux-ppc64-gnu": "0.51.0", + "@oxfmt/binding-linux-riscv64-gnu": "0.51.0", + "@oxfmt/binding-linux-riscv64-musl": "0.51.0", + "@oxfmt/binding-linux-s390x-gnu": "0.51.0", + "@oxfmt/binding-linux-x64-gnu": "0.51.0", + "@oxfmt/binding-linux-x64-musl": "0.51.0", + "@oxfmt/binding-openharmony-arm64": "0.51.0", + "@oxfmt/binding-win32-arm64-msvc": "0.51.0", + "@oxfmt/binding-win32-ia32-msvc": "0.51.0", + "@oxfmt/binding-win32-x64-msvc": "0.51.0" + }, + "peerDependencies": { + "svelte": "^5.0.0" + }, + "peerDependenciesMeta": { + "svelte": { + "optional": true + } } }, "node_modules/oxlint": { - "version": "1.63.0", - "resolved": "https://registry.npmjs.org/oxlint/-/oxlint-1.63.0.tgz", - "integrity": "sha512-9TGXetdjgIHOJ9OiReomP7nnrMkV9HxC1xM2ramJSLQpzxjsAJtQwa4wqkJN2f/uCrqZuJseFuSlWDdvcruveg==", + "version": "1.66.0", + "resolved": "https://registry.npmjs.org/oxlint/-/oxlint-1.66.0.tgz", + "integrity": "sha512-N4LLxYLd94KEBqXDMDM5f+2PUpItTjDLreXe2Gn5KhjhCK4Qp2YUXaBi8Yu325ryOgKwt22m45fpD7nPOn69Yw==", "dev": true, "license": "MIT", "bin": { @@ -929,25 +937,25 @@ "url": "https://github.com/sponsors/Boshen" }, "optionalDependencies": { - "@oxlint/binding-android-arm-eabi": "1.63.0", - "@oxlint/binding-android-arm64": "1.63.0", - "@oxlint/binding-darwin-arm64": "1.63.0", - "@oxlint/binding-darwin-x64": "1.63.0", - "@oxlint/binding-freebsd-x64": "1.63.0", - "@oxlint/binding-linux-arm-gnueabihf": "1.63.0", - "@oxlint/binding-linux-arm-musleabihf": "1.63.0", - "@oxlint/binding-linux-arm64-gnu": "1.63.0", - "@oxlint/binding-linux-arm64-musl": "1.63.0", - "@oxlint/binding-linux-ppc64-gnu": "1.63.0", - "@oxlint/binding-linux-riscv64-gnu": "1.63.0", - "@oxlint/binding-linux-riscv64-musl": "1.63.0", - "@oxlint/binding-linux-s390x-gnu": "1.63.0", - "@oxlint/binding-linux-x64-gnu": "1.63.0", - "@oxlint/binding-linux-x64-musl": 
"1.63.0", - "@oxlint/binding-openharmony-arm64": "1.63.0", - "@oxlint/binding-win32-arm64-msvc": "1.63.0", - "@oxlint/binding-win32-ia32-msvc": "1.63.0", - "@oxlint/binding-win32-x64-msvc": "1.63.0" + "@oxlint/binding-android-arm-eabi": "1.66.0", + "@oxlint/binding-android-arm64": "1.66.0", + "@oxlint/binding-darwin-arm64": "1.66.0", + "@oxlint/binding-darwin-x64": "1.66.0", + "@oxlint/binding-freebsd-x64": "1.66.0", + "@oxlint/binding-linux-arm-gnueabihf": "1.66.0", + "@oxlint/binding-linux-arm-musleabihf": "1.66.0", + "@oxlint/binding-linux-arm64-gnu": "1.66.0", + "@oxlint/binding-linux-arm64-musl": "1.66.0", + "@oxlint/binding-linux-ppc64-gnu": "1.66.0", + "@oxlint/binding-linux-riscv64-gnu": "1.66.0", + "@oxlint/binding-linux-riscv64-musl": "1.66.0", + "@oxlint/binding-linux-s390x-gnu": "1.66.0", + "@oxlint/binding-linux-x64-gnu": "1.66.0", + "@oxlint/binding-linux-x64-musl": "1.66.0", + "@oxlint/binding-openharmony-arm64": "1.66.0", + "@oxlint/binding-win32-arm64-msvc": "1.66.0", + "@oxlint/binding-win32-ia32-msvc": "1.66.0", + "@oxlint/binding-win32-x64-msvc": "1.66.0" }, "peerDependencies": { "oxlint-tsgolint": ">=0.22.1" @@ -969,9 +977,9 @@ } }, "node_modules/typescript": { - "version": "5.9.3", - "resolved": "https://registry.npmjs.org/typescript/-/typescript-5.9.3.tgz", - "integrity": "sha512-jl1vZzPDinLr9eUt3J/t7V6FgNEw9QjvBPdysz9KfQDD41fQrC2Y4vKQdiaUpFT4bXlb1RHhLpp8wtm6M5TgSw==", + "version": "6.0.3", + "resolved": "https://registry.npmjs.org/typescript/-/typescript-6.0.3.tgz", + "integrity": "sha512-y2TvuxSZPDyQakkFRPZHKFm+KKVqIisdg9/CZwm9ftvKXLP8NRWj38/ODjNbr43SsoXqNuAisEf1GdCxqWcdBw==", "dev": true, "license": "Apache-2.0", "bin": { @@ -989,16 +997,16 @@ "license": "ISC" }, "node_modules/undici-types": { - "version": "7.19.2", - "resolved": "https://registry.npmjs.org/undici-types/-/undici-types-7.19.2.tgz", - "integrity": "sha512-qYVnV5OEm2AW8cJMCpdV20CDyaN3g0AjDlOGf1OW4iaDEx8MwdtChUp4zu4H0VP3nDRF/8RKWH+IPp9uW0YGZg==", + "version": "7.24.6", + 
"resolved": "https://registry.npmjs.org/undici-types/-/undici-types-7.24.6.tgz", + "integrity": "sha512-WRNW+sJgj5OBN4/0JpHFqtqzhpbnV0GuB+OozA9gCL7a993SmU+1JBZCzLNxYsbMfIeDL+lTsphD5jN5N+n0zg==", "dev": true, "license": "MIT" }, "node_modules/yaml": { - "version": "2.8.4", - "resolved": "https://registry.npmjs.org/yaml/-/yaml-2.8.4.tgz", - "integrity": "sha512-ml/JPOj9fOQK8RNnWojA67GbZ0ApXAUlN2UQclwv2eVgTgn7O9gg9o7paZWKMp4g0H3nTLtS9LVzhkpOFIKzog==", + "version": "2.9.0", + "resolved": "https://registry.npmjs.org/yaml/-/yaml-2.9.0.tgz", + "integrity": "sha512-2AvhNX3mb8zd6Zy7INTtSpl1F15HW6Wnqj0srWlkKLcpYl/gMIMJiyuGq2KeI2YFxUPjdlB+3Lc10seMLtL4cA==", "license": "ISC", "bin": { "yaml": "bin.mjs" diff --git a/package.json b/package.json index 336fc645..94711a13 100644 --- a/package.json +++ b/package.json @@ -1,29 +1,116 @@ { "name": "ai-models", - "version": "0.1.0", - "description": "A structured catalog of AI model providers and their models", + "version": "0.2.2", + "description": "Structured YAML catalog of 4,587 AI models across 95 providers โ€” pricing, context windows, modalities, capabilities. 
First-party data with TypeScript types and Zod validation.", + "keywords": [ + "agentic-models", + "ai-agents", + "ai-catalog", + "ai-directory", + "ai-model-pricing", + "ai-models", + "ai-pricing", + "ai-provider", + "anthropic", + "cached-pricing", + "cdn", + "cerebras", + "chat-models", + "chatgpt", + "claude", + "code-models", + "context-window", + "deepseek", + "edge-ai", + "embedding-models", + "free-models", + "function-calling", + "github-action", + "google-gemini", + "gpt-4", + "groq", + "image-generation", + "inference-api", + "json-mode", + "large-context-models", + "large-language-model", + "llama", + "llm", + "llm-api", + "llm-catalog", + "llm-pricing", + "machine-readable", + "migration-guide", + "mistral", + "model-catalog", + "model-comparison", + "model-directory", + "model-metadata", + "model-pricing", + "model-selection", + "multimodal-models", + "on-device-ai", + "open-weights", + "openai", + "prompt-caching", + "provider-comparison", + "qwen", + "reasoning-models", + "small-models", + "structured-output", + "tool-calling", + "vision-models", + "yaml" + ], + "homepage": "https://i-need-token.github.io/ai-models/", + "bugs": { + "url": "https://github.com/i-need-token/ai-models/issues" + }, "license": "MIT", + "repository": { + "type": "git", + "url": "git+https://github.com/i-need-token/ai-models.git" + }, + "files": [ + "dist/", + "types/", + "providers/", + "LICENSE" + ], "type": "module", + "main": "dist/models.json", + "types": "dist/index.d.ts", + "exports": { + ".": { + "types": "./dist/index.d.ts", + "default": "./dist/models.json" + }, + "./models.json": "./dist/models.json" + }, "scripts": { "sync": "npx tsx scripts/sync.ts", "validate": "npx tsx scripts/validate.ts", + "stats": "npx tsx scripts/stats.ts", + "compile": "npx tsx scripts/compile.ts", "fmt": "oxfmt", "fmt:check": "oxfmt --check", "lint": "oxlint", "typecheck": "tsc --noEmit", "check": "npm run fmt:check && npm run lint && npm run typecheck", - "prepare": "husky" + 
"prepare": "husky", + "build": "tsc -p tsconfig.build.json && npx tsx scripts/compile.ts", + "prepublishOnly": "npm run build" }, "dependencies": { "linkedom": "^0.18.12", - "yaml": "^2.7.0", + "yaml": "^2.9.0", "zod": "^3.24.0" }, "devDependencies": { - "@types/node": "^25.6.0", + "@types/node": "^25.9.1", "husky": "^9.1.7", - "oxfmt": "^0.48.0", - "oxlint": "^1.63.0", - "typescript": "^5.7.0" + "oxfmt": "^0.51.0", + "oxlint": "^1.66.0", + "typescript": "^6.0.3" } } diff --git a/providers/aion/README.md b/providers/aion/README.md new file mode 100644 index 00000000..0f7281f7 --- /dev/null +++ b/providers/aion/README.md @@ -0,0 +1,12 @@ +# Aion Labs + +[Aion Labs](https://aionlabs.ai) provides AI model inference services. + +## Data Source + +Model data is fetched from the Aion Labs API endpoint. + +## Notes + +- Models are discovered dynamically from the API +- Pricing follows the provider's published rates diff --git a/providers/auriko/README.md b/providers/auriko/README.md new file mode 100644 index 00000000..d0d46dd5 --- /dev/null +++ b/providers/auriko/README.md @@ -0,0 +1,12 @@ +# Auriko + +[Auriko](https://auriko.com) provides AI model inference services. + +## Data Source + +Model data is fetched from the Auriko API endpoint. + +## Notes + +- Models are discovered dynamically from the API +- Pricing follows the provider's published rates diff --git a/providers/baichuan/README.md b/providers/baichuan/README.md new file mode 100644 index 00000000..0ab56006 --- /dev/null +++ b/providers/baichuan/README.md @@ -0,0 +1,13 @@ +# Baichuan AI + +[Baichuan AI](https://platform.baichuan-ai.com) is a Chinese AI model producer, developer of the Baichuan series of large language models. + +## Data Source + +Model data is fetched from the Baichuan AI API endpoint. 
+ +## Notes + +- Models are discovered dynamically from the API +- Pricing is in CNY +- Baichuan models include both general-purpose and specialized variants diff --git a/providers/cloudferro-sherlock/README.md b/providers/cloudferro-sherlock/README.md new file mode 100644 index 00000000..efc94f84 --- /dev/null +++ b/providers/cloudferro-sherlock/README.md @@ -0,0 +1,13 @@ +# CloudFerro Sherlock + +[CloudFerro Sherlock](https://sherlock.cloudferro.com) provides AI model inference on European cloud infrastructure. + +## Data Source + +Model data is fetched from the CloudFerro Sherlock API endpoint. + +## Notes + +- Models are discovered dynamically from the API +- Pricing follows the provider's published rates +- Hosted on European infrastructure (GDPR-friendly) diff --git a/providers/iflytek/README.md b/providers/iflytek/README.md new file mode 100644 index 00000000..baa4b6e7 --- /dev/null +++ b/providers/iflytek/README.md @@ -0,0 +1,13 @@ +# iFlytek SparkDesk + +[iFlytek SparkDesk](https://xinghuo.xfyun.cn) is a Chinese AI model platform by iFlytek (科大讯飞), providing the SparkDesk (星火) series of large language models. + +## Data Source + +Model data is fetched from the iFlytek SparkDesk API endpoint. + +## Notes + +- Models are discovered dynamically from the API +- Pricing is in CNY +- SparkDesk models support both Chinese and English diff --git a/providers/llmgateway/README.md b/providers/llmgateway/README.md new file mode 100644 index 00000000..f04c7505 --- /dev/null +++ b/providers/llmgateway/README.md @@ -0,0 +1,13 @@ +# LLM Gateway + +[LLM Gateway](https://llmgateway.com) provides a unified API gateway for accessing multiple AI model providers. + +## Data Source + +Model data is fetched from the LLM Gateway API endpoint.
+ +## Notes + +- Models are discovered dynamically from the API +- Aggregates models from multiple upstream providers +- Pricing follows the provider's published rates diff --git a/providers/martian/README.md b/providers/martian/README.md new file mode 100644 index 00000000..3a21898a --- /dev/null +++ b/providers/martian/README.md @@ -0,0 +1,13 @@ +# Martian + +[Martian](https://withmartian.com) provides AI model inference services with a unified API. + +## Data Source + +Model data is fetched from the Martian API endpoint. + +## Notes + +- Models are discovered dynamically from the API +- Aggregates models from multiple upstream providers +- Pricing follows the provider's published rates diff --git a/providers/tencent-tokenhub/README.md b/providers/tencent-tokenhub/README.md new file mode 100644 index 00000000..b32611e0 --- /dev/null +++ b/providers/tencent-tokenhub/README.md @@ -0,0 +1,13 @@ +# Tencent Cloud TokenHub + +[Tencent Cloud TokenHub](https://cloud.tencent.com/product/ti) is a Chinese AI model platform by Tencent, providing access to various large language models. + +## Data Source + +Model data is fetched from the Tencent Cloud TokenHub API endpoint. 
+ +## Notes + +- Models are discovered dynamically from the API +- Pricing is in CNY +- Provides access to both Tencent's own models and third-party models diff --git a/renovate.json b/renovate.json new file mode 100644 index 00000000..93da19a7 --- /dev/null +++ b/renovate.json @@ -0,0 +1,20 @@ +{ + "$schema": "https://docs.renovatebot.com/renovate-schema.json", + "extends": ["config:recommended"], + "schedule": ["before 5am on Monday"], + "labels": ["dependencies"], + "reviewers": ["liushuai"], + "prConcurrentLimit": 5, + "prHourlyLimit": 2, + "packageRules": [ + { + "matchUpdateTypes": ["minor", "patch"], + "automerge": true, + "automergeStrategy": "squash" + }, + { + "matchUpdateTypes": ["major"], + "automerge": false + } + ] +} diff --git a/schema.json b/schema.json new file mode 100644 index 00000000..477fe74d --- /dev/null +++ b/schema.json @@ -0,0 +1,281 @@ +{ + "$schema": "https://json-schema.org/draft/2020-12/schema", + "$id": "https://raw.githubusercontent.com/i-need-token/ai-models/main/schema.json", + "title": "AI Models Catalog", + "description": "Schema for the AI Models Catalog YAML data files", + "definitions": { + "TokenPricing": { + "type": "object", + "description": "Per-million-token pricing (most common)", + "properties": { + "input": { + "type": "number", + "minimum": 0, + "description": "Price per 1M input tokens (USD or CNY)" + }, + "output": { + "type": "number", + "minimum": 0, + "description": "Price per 1M output tokens (USD or CNY)" + }, + "cache_write": { + "type": "number", + "minimum": 0, + "description": "Price per 1M cached write tokens" + }, + "cache_read": { + "type": "number", + "minimum": 0, + "description": "Price per 1M cached read tokens" + } + }, + "required": ["input", "output"] + }, + "VideoPricing": { + "type": "object", + "description": "Per-second video pricing", + "properties": { + "unit": { + "type": "string", + "const": "per_second", + "description": "Pricing unit" + }, + "price": { + "type": "number", + "minimum": 0, +
"description": "Price per second" + } + }, + "required": ["unit", "price"] + }, + "UnitPricing": { + "type": "object", + "description": "Per-unit pricing (per image, per request, etc.)", + "properties": { + "unit": { + "type": "string", + "enum": ["per_image", "per_request"], + "description": "Pricing unit" + }, + "price": { + "type": "number", + "minimum": 0, + "description": "Price per unit" + } + }, + "required": ["unit", "price"] + }, + "FreePricing": { + "type": "object", + "description": "Free pricing (no cost)", + "properties": { + "unit": { + "type": "string", + "const": "free", + "description": "Pricing unit" + } + }, + "required": ["unit"] + }, + "Pricing": { + "oneOf": [ + { "$ref": "#/definitions/TokenPricing" }, + { "$ref": "#/definitions/VideoPricing" }, + { "$ref": "#/definitions/UnitPricing" }, + { "$ref": "#/definitions/FreePricing" } + ] + }, + "Modality": { + "type": "string", + "enum": ["text", "image", "video", "audio", "pdf"], + "description": "Input or output modality" + }, + "Snapshot": { + "type": "object", + "description": "A dated version of a model (inherits parent fields)", + "properties": { + "id": { + "type": "string", + "description": "Snapshot ID (typically includes date, e.g. 
gpt-4o-2024-08-06)" + }, + "name": { + "type": "string", + "description": "Display name override" + }, + "reasoning": { + "type": "boolean", + "description": "Supports reasoning/thinking mode" + }, + "temperature": { + "type": "boolean", + "description": "Supports temperature parameter" + }, + "tool_call": { + "type": "boolean", + "description": "Supports tool/function calling" + }, + "attachment": { + "type": "boolean", + "description": "Supports file attachments" + }, + "structured_output": { + "type": "boolean", + "description": "Supports structured/JSON output" + }, + "open_weights": { + "type": "boolean", + "description": "Open-weight model" + }, + "deprecated": { + "type": "boolean", + "description": "Deprecated but still accessible" + }, + "limit": { + "type": "object", + "properties": { + "context": { + "type": "integer", + "minimum": 1, + "description": "Maximum context window in tokens" + }, + "output": { + "type": "integer", + "minimum": 1, + "description": "Maximum output tokens" + } + } + }, + "pricing": { + "$ref": "#/definitions/Pricing" + }, + "modalities": { + "type": "object", + "properties": { + "input": { + "type": "array", + "items": { "$ref": "#/definitions/Modality" } + }, + "output": { + "type": "array", + "items": { "$ref": "#/definitions/Modality" } + } + } + }, + "knowledge": { + "type": "string", + "description": "Training data cutoff (e.g. 
2023-10)" + }, + "release_date": { + "type": "string", + "description": "Model release date (YYYY-MM-DD or YYYY-MM)" + }, + "last_updated": { + "type": "string", + "description": "Last data update (YYYY-MM-DD or YYYY-MM)" + } + }, + "required": ["id", "last_updated"] + } + }, + "type": "object", + "description": "A single AI model definition", + "properties": { + "id": { + "type": "string", + "description": "Stable model ID (no date suffix)", + "pattern": "^[a-z0-9][a-z0-9._-]*[a-z0-9]$" + }, + "name": { + "type": "string", + "description": "Display name" + }, + "family": { + "type": "string", + "description": "Model family (broad lineage)" + }, + "reasoning": { + "type": "boolean", + "default": false, + "description": "Supports reasoning/thinking mode" + }, + "temperature": { + "type": "boolean", + "default": true, + "description": "Supports temperature parameter" + }, + "tool_call": { + "type": "boolean", + "default": false, + "description": "Supports tool/function calling" + }, + "attachment": { + "type": "boolean", + "default": false, + "description": "Supports file attachments" + }, + "structured_output": { + "type": "boolean", + "default": false, + "description": "Supports structured/JSON output" + }, + "open_weights": { + "type": "boolean", + "default": false, + "description": "Open-weight model" + }, + "deprecated": { + "type": "boolean", + "default": false, + "description": "Deprecated but still accessible" + }, + "limit": { + "type": "object", + "properties": { + "context": { + "type": "integer", + "minimum": 1, + "description": "Maximum context window in tokens" + }, + "output": { + "type": "integer", + "minimum": 1, + "description": "Maximum output tokens" + } + } + }, + "pricing": { + "$ref": "#/definitions/Pricing" + }, + "modalities": { + "type": "object", + "properties": { + "input": { + "type": "array", + "items": { "$ref": "#/definitions/Modality" } + }, + "output": { + "type": "array", + "items": { "$ref": "#/definitions/Modality" } + } + } + }, 
+ "knowledge": { + "type": "string", + "description": "Training data cutoff (e.g. 2023-10)" + }, + "release_date": { + "type": "string", + "description": "Model release date (YYYY-MM-DD or YYYY-MM)" + }, + "last_updated": { + "type": "string", + "description": "Last data update (YYYY-MM-DD or YYYY-MM)" + }, + "snapshots": { + "type": "array", + "items": { "$ref": "#/definitions/Snapshot" }, + "description": "Dated model versions" + } + }, + "required": ["id", "name", "family", "pricing", "modalities", "last_updated"] +} diff --git a/scripts/compile.ts b/scripts/compile.ts new file mode 100644 index 00000000..1d0972da --- /dev/null +++ b/scripts/compile.ts @@ -0,0 +1,132 @@ +import fs from "node:fs"; +import path from "node:path"; +import { fileURLToPath } from "node:url"; +import YAML from "yaml"; +import { ModelSchema } from "../types/schemas"; + +const __dirname = path.dirname(fileURLToPath(import.meta.url)); +const PROJECT_ROOT = path.resolve(__dirname, ".."); + +interface CompiledModel { + id: string; + name: string; + family?: string; + provider: string; + reasoning?: boolean | undefined; + tool_call?: boolean | undefined; + structured_output?: boolean | undefined; + open_weights?: boolean | undefined; + deprecated?: boolean | undefined; + pricing?: Record | undefined; + limit?: Record | undefined; + modalities?: Record | undefined; + release_date?: string | undefined; + last_updated?: string | undefined; +} + +interface CompiledCatalog { + generated_at: string; + stats: { + providers: number; + models: number; + unique_model_ids: number; + families: number; + }; + providers: Record; + models: CompiledModel[]; +} + +function compile(): CompiledCatalog { + const providersDir = path.join(PROJECT_ROOT, "providers"); + const providerDirs = fs + .readdirSync(providersDir, { withFileTypes: true }) + .filter((d) => d.isDirectory()) + .map((d) => d.name) + .filter((name) => fs.existsSync(path.join(providersDir, name, "models"))); + + const models: CompiledModel[] = 
[]; + const providers: Record = {}; + const uniqueIds = new Set(); + const families = new Set(); + + for (const providerId of providerDirs) { + const modelsDir = path.join(providersDir, providerId, "models"); + const files = fs.readdirSync(modelsDir).filter((f) => f.endsWith(".yaml")); + + // Read provider name from provider.yaml + let providerName = providerId; + const providerYamlPath = path.join(providersDir, providerId, "provider.yaml"); + if (fs.existsSync(providerYamlPath)) { + try { + const providerRaw = fs.readFileSync(providerYamlPath, "utf-8"); + const providerData = YAML.parse(providerRaw); + if (providerData?.name) providerName = providerData.name; + } catch { + // ignore + } + } + + providers[providerId] = { name: providerName, model_count: files.length }; + + for (const file of files) { + const raw = fs.readFileSync(path.join(modelsDir, file), "utf-8"); + const data = YAML.parse(raw); + const result = ModelSchema.safeParse(data); + if (!result.success) continue; + + const model = result.data; + uniqueIds.add(model.id); + if (model.family) families.add(model.family); + + models.push({ + id: model.id, + name: model.name, + family: model.family, + provider: providerId, + reasoning: model.reasoning, + tool_call: model.tool_call, + structured_output: model.structured_output, + open_weights: model.open_weights, + deprecated: model.deprecated, + pricing: model.pricing as Record | undefined, + limit: model.limit as Record | undefined, + modalities: model.modalities as Record | undefined, + release_date: model.release_date, + last_updated: model.last_updated, + }); + } + } + + return { + generated_at: new Date().toISOString(), + stats: { + providers: providerDirs.length, + models: models.length, + unique_model_ids: uniqueIds.size, + families: families.size, + }, + providers, + models, + }; +} + +function main(): void { + const catalog = compile(); + + const distDir = path.join(PROJECT_ROOT, "dist"); + if (!fs.existsSync(distDir)) fs.mkdirSync(distDir, { 
recursive: true }); + + const outPath = path.join(distDir, "models.json"); + fs.writeFileSync(outPath, JSON.stringify(catalog, null, 2)); + + console.log( + `โœ… Compiled ${catalog.models.length} models from ${catalog.stats.providers} providers`, + ); + console.log( + ` ${catalog.stats.unique_model_ids} unique IDs, ${catalog.stats.families} families`, + ); + console.log(` Written to ${outPath}`); + console.log(` Size: ${(fs.statSync(outPath).size / 1024 / 1024).toFixed(1)} MB`); +} + +main(); diff --git a/scripts/export-csv.ts b/scripts/export-csv.ts new file mode 100644 index 00000000..b87f4c14 --- /dev/null +++ b/scripts/export-csv.ts @@ -0,0 +1,120 @@ +import fs from "node:fs"; +import path from "node:path"; +import YAML from "yaml"; +import { ModelSchema } from "../types/schemas"; + +const providersDir = "providers"; + +interface FlatModel { + id: string; + name: string; + provider: string; + family: string; + deprecated: boolean; + reasoning: boolean; + tool_call: boolean; + structured_output: boolean; + open_weights: boolean; + context_window: number | undefined; + max_output: number | undefined; + input_modalities: string; + output_modalities: string; + pricing_type: string; + input_price: number | undefined; + output_price: number | undefined; + image_input_price: number | undefined; + image_output_price: number | undefined; + cached_input_price: number | undefined; +} + +const models: FlatModel[] = []; + +for (const provider of fs.readdirSync(providersDir)) { + const mDir = path.join(providersDir, provider, "models"); + if (!fs.existsSync(mDir)) continue; + for (const f of fs.readdirSync(mDir).filter((f) => f.endsWith(".yaml"))) { + const raw = fs.readFileSync(path.join(mDir, f), "utf-8"); + const data = YAML.parse(raw); + const r = ModelSchema.safeParse(data); + if (!r.success) continue; + const m = r.data; + + const pr = m.pricing as Record | undefined; + let pricingType = "unknown"; + let inputPrice: number | undefined; + let outputPrice: number | 
undefined; + let imageInputPrice: number | undefined; + let imageOutputPrice: number | undefined; + let cachedInputPrice: number | undefined; + + if (pr) { + pricingType = ((pr["unit"] ?? pr["type"]) as string | undefined) ?? "token"; // non-token pricing is tagged by "unit" (as in schema.json / stats.ts); untagged means per-token pricing + if (pricingType === "token") { + inputPrice = pr["input"] as number | undefined; + outputPrice = pr["output"] as number | undefined; + imageInputPrice = pr["image_input"] as number | undefined; + imageOutputPrice = pr["image_output"] as number | undefined; + cachedInputPrice = (pr["cache_read"] ?? pr["cached_input"]) as number | undefined; // schema.json names the cached-read price "cache_read"; legacy key kept as fallback + } + } + + models.push({ + id: m.id, + name: m.name ?? m.id, + provider, + family: m.family ?? "", + deprecated: m.deprecated ?? false, + reasoning: m.reasoning ?? false, + tool_call: m.tool_call ?? false, + structured_output: m.structured_output ?? false, + open_weights: m.open_weights ?? false, + context_window: m.limit?.context, + max_output: m.limit?.output, + input_modalities: (m.modalities?.input ?? []).join(";"), + output_modalities: (m.modalities?.output ?? []).join(";"), + pricing_type: pricingType, + input_price: inputPrice, + output_price: outputPrice, + image_input_price: imageInputPrice, + image_output_price: imageOutputPrice, + cached_input_price: cachedInputPrice, + }); + } +} + +function escapeCsv(val: unknown): string { + const s = String(val ??
""); + if (s.includes(",") || s.includes('"') || s.includes("\n")) { + return `"${s.replace(/"/g, '""')}"`; + } + return s; +} + +const header = [ + "id", + "name", + "provider", + "family", + "deprecated", + "reasoning", + "tool_call", + "structured_output", + "open_weights", + "context_window", + "max_output", + "input_modalities", + "output_modalities", + "pricing_type", + "input_price", + "output_price", + "image_input_price", + "image_output_price", + "cached_input_price", +]; + +const rows = models.map((m) => header.map((k) => escapeCsv(m[k as keyof FlatModel])).join(",")); + +const csv = [header.join(","), ...rows].join("\n"); + +fs.writeFileSync("models.csv", csv); +console.log(`Wrote ${models.length} models to models.csv`); diff --git a/scripts/scrape-all.ts b/scripts/scrape-all.ts new file mode 100644 index 00000000..48fe052e --- /dev/null +++ b/scripts/scrape-all.ts @@ -0,0 +1,58 @@ +/** + * Run all provider scrape scripts and write updated model YAML files. + * + * Usage: npx tsx scripts/scrape-all.ts + * + * Each provider's scrape.ts exports a `scrape()` function that returns + * a ScrapeResult. This script calls each one and writes the results + * to providers//models/.yaml. 
+ */ +import fs from "node:fs"; +import path from "node:path"; +import YAML from "yaml"; +import { defineModel } from "./lib/utils"; +import type { ScrapeResult } from "./lib/types"; + +const providersDir = "providers"; + +async function main() { + const providerDirs = fs + .readdirSync(providersDir) + .filter((d) => fs.statSync(path.join(providersDir, d)).isDirectory()); + + let totalUpdated = 0; + let totalFailed = 0; + + for (const provider of providerDirs) { + const scrapePath = path.join(providersDir, provider, "scrape.ts"); + if (!fs.existsSync(scrapePath)) continue; + + console.log(`Scraping ${provider}...`); + try { + const mod = await import(`../providers/${provider}/scrape.ts`); + const result: ScrapeResult = await mod.scrape(); + + const mDir = path.join(providersDir, provider, "models"); + fs.mkdirSync(mDir, { recursive: true }); + + for (const model of result.models) { + const validated = defineModel(model); + const filePath = path.join(mDir, `${validated.id}.yaml`); + fs.writeFileSync(filePath, YAML.stringify(validated)); + totalUpdated++; + } + + console.log(` โœ“ ${provider}: ${result.models.length} models`); + } catch (err) { + console.error(` โœ— ${provider}: ${err}`); + totalFailed++; + } + } + + console.log(`\nDone: ${totalUpdated} models updated, ${totalFailed} providers failed`); + if (totalFailed > 0) { + process.exit(1); + } +} + +main(); diff --git a/scripts/social-preview.ts b/scripts/social-preview.ts new file mode 100644 index 00000000..562db303 --- /dev/null +++ b/scripts/social-preview.ts @@ -0,0 +1,112 @@ +#!/usr/bin/env node +/** + * Generate a social preview image (1280ร—640) for GitHub repo. + * Outputs an SVG that can be converted to PNG via any browser or tool. 
+ * + * Usage: + * npx tsx scripts/social-preview.ts > social-preview.svg + */ + +import fs from "node:fs"; +import path from "node:path"; + +const providersDir = path.join(import.meta.dirname, "..", "providers"); + +let providerCount = 0; +let modelCount = 0; + +for (const p of fs.readdirSync(providersDir)) { + const mDir = path.join(providersDir, p, "models"); + if (!fs.existsSync(mDir)) continue; + providerCount++; + for (const _f of fs.readdirSync(mDir).filter((f) => f.endsWith(".yaml"))) { + modelCount++; + } +} + +const svg = ` + + + + + + + + + + + + + + + + + + + + + + + + + ๐Ÿค– + + + AI Models Catalog + + + The most comprehensive structured catalog of AI models on GitHub + + + + ${modelCount.toLocaleString()} + Models + + + ${providerCount} + Providers + + + 2,350 + Tool Calling + + + 1,306 + Reasoning + + + 81 + Free + + + + Pricing + + + Context Windows + + + Modalities + + + Open Weights + + + Cached Pricing + + + + โœ“ First-Party Data Only ยท Zod Validation + + + npm ยท CDN ยท CSV ยท GitHub Action ยท Hugging Face + + + + $ npm install ai-models + + + +`; + +process.stdout.write(svg); diff --git a/scripts/stats.ts b/scripts/stats.ts new file mode 100644 index 00000000..ec294a7e --- /dev/null +++ b/scripts/stats.ts @@ -0,0 +1,141 @@ +import fs from "node:fs"; +import path from "node:path"; +import { fileURLToPath } from "node:url"; +import YAML from "yaml"; +import { ModelSchema } from "../types/schemas"; + +const __dirname = path.dirname(fileURLToPath(import.meta.url)); +const PROJECT_ROOT = path.resolve(__dirname, ".."); + +interface Stats { + providers: number; + modelFiles: number; + uniqueModelIds: Set; + families: Set; + reasoning: number; + toolCall: number; + structuredOutput: number; + openWeights: number; + free: number; + vision: number; + imageOutput: number; + audioInput: number; + audioOutput: number; + videoInput: number; +} + +function computeStats(): Stats { + const providersDir = path.join(PROJECT_ROOT, "providers"); + const 
providerDirs = fs + .readdirSync(providersDir, { withFileTypes: true }) + .filter((d) => d.isDirectory()) + .map((d) => d.name) + .filter((name) => fs.existsSync(path.join(providersDir, name, "models"))); + + const stats: Stats = { + providers: providerDirs.length, + modelFiles: 0, + uniqueModelIds: new Set(), + families: new Set(), + reasoning: 0, + toolCall: 0, + structuredOutput: 0, + openWeights: 0, + free: 0, + vision: 0, + imageOutput: 0, + audioInput: 0, + audioOutput: 0, + videoInput: 0, + }; + + for (const providerId of providerDirs) { + const modelsDir = path.join(providersDir, providerId, "models"); + const files = fs.readdirSync(modelsDir).filter((f) => f.endsWith(".yaml")); + + for (const file of files) { + stats.modelFiles++; + const raw = fs.readFileSync(path.join(modelsDir, file), "utf-8"); + const data = YAML.parse(raw); + const result = ModelSchema.safeParse(data); + if (!result.success) continue; + + const model = result.data; + stats.uniqueModelIds.add(model.id); + if (model.family) stats.families.add(model.family); + if (model.reasoning) stats.reasoning++; + if (model.tool_call) stats.toolCall++; + if (model.structured_output) stats.structuredOutput++; + if (model.open_weights) stats.openWeights++; + + // Check pricing for free models + if (model.pricing) { + const p = model.pricing as Record; + if (p["unit"] === "free") stats.free++; + } + + // Check modalities + if (model.modalities) { + const input = model.modalities.input ?? []; + const output = model.modalities.output ?? []; + if (input.includes("image")) stats.vision++; + if (output.includes("image")) stats.imageOutput++; + if (input.includes("audio")) stats.audioInput++; + if (output.includes("audio")) stats.audioOutput++; + if (input.includes("video")) stats.videoInput++; + } + } + } + + return stats; +} + +function main(): void { + const stats = computeStats(); + + const format = process.argv[2] ?? 
"table"; + + if (format === "json") { + console.log( + JSON.stringify( + { + providers: stats.providers, + model_files: stats.modelFiles, + unique_model_ids: stats.uniqueModelIds.size, + families: stats.families.size, + reasoning: stats.reasoning, + tool_call: stats.toolCall, + structured_output: stats.structuredOutput, + open_weights: stats.openWeights, + free: stats.free, + vision: stats.vision, + image_output: stats.imageOutput, + audio_input: stats.audioInput, + audio_output: stats.audioOutput, + video_input: stats.videoInput, + }, + null, + 2, + ), + ); + return; + } + + console.log("๐Ÿ“Š AI Models Catalog Stats\n"); + console.log(`Providers: ${stats.providers}`); + console.log(`Model files: ${stats.modelFiles}`); + console.log(`Unique model IDs: ${stats.uniqueModelIds.size}`); + console.log(`Model families: ${stats.families.size}`); + console.log(`Reasoning models: ${stats.reasoning}`); + console.log(`Tool-calling models: ${stats.toolCall}`); + console.log(`Structured output: ${stats.structuredOutput}`); + console.log(`Open-weight models: ${stats.openWeights}`); + console.log(`Free models: ${stats.free}`); + console.log(`Vision (image input): ${stats.vision}`); + console.log(`Image output: ${stats.imageOutput}`); + console.log(`Audio input: ${stats.audioInput}`); + console.log(`Audio output: ${stats.audioOutput}`); + console.log(`Video input: ${stats.videoInput}`); +} + +main(); diff --git a/site/404.html b/site/404.html new file mode 100644 index 00000000..f42be64e --- /dev/null +++ b/site/404.html @@ -0,0 +1,83 @@ + + + + + + Page Not Found โ€” AI Models Catalog + + + +
+

404

+

Model not found

+

+ This page doesn't exist in the AI Models Catalog. Maybe the model was deprecated, or the URL + is incorrect. +

+ ← Back to Catalog +
+ + diff --git a/site/ai-model-benchmarks.html b/site/ai-model-benchmarks.html new file mode 100644 index 00000000..7cbf1be8 --- /dev/null +++ b/site/ai-model-benchmarks.html @@ -0,0 +1,653 @@ + + + + + + + AI Model Benchmarks Comparison 2025 โ€” MMLU, MATH, HumanEval, SWE-bench | AI Models Catalog + + + + + + + + + + + + + + + +
+

📊 AI Model Benchmarks Comparison 2025

+

+ How do top AI models compare on MMLU, MATH-500, HumanEval, SWE-bench, and Chatbot Arena? A + comprehensive benchmark analysis of 4,587 models across 95 providers. +

+
+
+

1. General Knowledge — MMLU & MMLU-Pro

+

+ MMLU (Massive Multitask Language Understanding) tests knowledge across 57 academic subjects. + MMLU-Pro is a harder variant requiring deeper reasoning. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelMMLUMMLU-ProProviderInput $/M
GPT-4.1~90%~78%OpenAI$2.00
Claude Opus 4~90%~78%Anthropic$15.00
Gemini 2.5 Pro~90%~78%Google$1.25
Claude Sonnet 4~88%~76%Anthropic$3.00
Grok 3~87%~75%xAI$3.00
DeepSeek R1~85%~72%DeepSeekFree
Qwen3-235B~85%~72%AlibabaFree
Llama 4 Maverick~82%~68%MetaFree
+
+ Key Insight: MMLU is near-saturated for frontier models. Use MMLU-Pro or + GPQA for more discriminating comparisons. +
+ +

2. Mathematics — MATH-500 & AIME

+

+ MATH-500 tests competition-level mathematics. AIME 2024 is an even harder math competition + benchmark. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelMATH-500AIME 2024ProviderInput $/M
o3~96%~83%OpenAI$2.00
o4-mini~93%~75%OpenAI$1.10
DeepSeek R1~92%~72%DeepSeekFree
Gemini 2.5 Pro~91%~70%Google$1.25
Qwen3-235B~90%~68%AlibabaFree
Claude Sonnet 4~88%~65%Anthropic$3.00
+
+ Key Insight: Reasoning models (o3, DeepSeek R1) dominate math benchmarks. + For cost-sensitive math tasks, DeepSeek R1 is free and performs near o3. +
+ +

3. Coding — HumanEval & SWE-bench

+

+ HumanEval tests Python code generation. SWE-bench tests real GitHub issue resolution — more + realistic for production use. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelHumanEvalSWE-bench VerifiedProviderInput $/M
Claude Sonnet 4~93%~72%Anthropic$3.00
o3~92%~70%OpenAI$2.00
GPT-4.1~91%~65%OpenAI$2.00
Gemini 2.5 Pro~90%~63%Google$1.25
DeepSeek V3~88%~55%DeepSeek$0.07
Codestral~86%N/AMistral$0.30
+
+ Key Insight: SWE-bench is more realistic than HumanEval. Claude Sonnet 4 + leads on SWE-bench. For budget coding, DeepSeek V3 at $0.07/M offers remarkable value. +
+ +

4. Science & Reasoning — GPQA

+

+ GPQA (Graduate-Level Google-Proof Q&A) tests expert-level scientific reasoning. Even + PhDs with internet access struggle. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelGPQA DiamondProviderInput $/M
o3~80%OpenAI$2.00
Gemini 2.5 Pro~78%Google$1.25
Claude Opus 4~75%Anthropic$15.00
o4-mini~73%OpenAI$1.10
DeepSeek R1~71%DeepSeekFree
+ +

5. Tool Calling — BFCL v3

+

+ BFCL (Berkeley Function Calling Leaderboard) tests function calling accuracy — critical for + AI agents. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelBFCL v3ProviderInput $/M
GPT-4.1~88%OpenAI$2.00
Claude Sonnet 4~86%Anthropic$3.00
Gemini 2.5 Pro~85%Google$1.25
Grok 3~83%xAI$3.00
Gemini 2.5 Flash~82%GoogleFree
+
+ Key Insight: 2,350 models in our catalog support tool calling. GPT-4.1 + leads on BFCL, but Gemini 2.5 Flash offers strong performance for free. +
+ +

6. Human Preference — Chatbot Arena

+

+ LMSYS Chatbot Arena uses blind human comparisons. This is the most practical benchmark for + chat quality. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelArena ScoreProviderInput $/M
GPT-4.1~1380OpenAI$2.00
Claude Sonnet 4~1370Anthropic$3.00
Gemini 2.5 Pro~1360Google$1.25
Grok 3~1350xAI$3.00
DeepSeek R1~1330DeepSeekFree
+
+ Key Insight: Chatbot Arena correlates best with real-world chat quality. + The top 5 models are very close — pricing and features should drive your decision. +
+ +

7. Best Value by Benchmark

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
BenchmarkBest FreeBest PaidBest Overall
MMLUDeepSeek R1 / Qwen3Gemini 2.5 Pro ($1.25)GPT-4.1
MATHDeepSeek R1o4-mini ($1.10)o3
CodingDeepSeek V3 ($0.07)Gemini 2.5 Pro ($1.25)Claude Sonnet 4
GPQADeepSeek R1Gemini 2.5 Pro ($1.25)o3
Tool CallingGemini 2.5 FlashGemini 2.5 Pro ($1.25)GPT-4.1
ChatDeepSeek R1Gemini 2.5 Pro ($1.25)GPT-4.1
+ +

8. Benchmark Limitations

+
+ Data contamination: Models may have seen benchmark data during training. + Prefer LiveCodeBench over HumanEval for coding. +
+
+ Task narrowness: Benchmarks test specific skills. Real-world performance + may differ significantly. +
+
+ Cost blindness: Benchmarks ignore pricing, latency, and availability. + Always combine with our + pricing data. +
+
+ Staleness: Saturated benchmarks (GSM8K, HellaSwag) are uninformative. Focus + on harder benchmarks like GPQA and SWE-bench. +
+ + +
+ Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+
+

+ Data from AI Models Catalog — 4,587 + models across 95 providers. Updated continuously. +

+
+ + diff --git a/site/ai-model-comparison-chart.html b/site/ai-model-comparison-chart.html new file mode 100644 index 00000000..af581e62 --- /dev/null +++ b/site/ai-model-comparison-chart.html @@ -0,0 +1,760 @@ + + + + + + + AI Model Comparison Chart 2025 โ€” Pricing, Context, Capabilities | AI Models Catalog + + + + + + + + + + + + + + + +
+

📊 AI Model Comparison Chart 2025

+

+ Side-by-side comparison of AI models: pricing, context windows, tool calling, reasoning, + vision, and structured output. Data from 95 providers, 4,587 models. +

+
+
+

1. Flagship Models Comparison

+

The top models from each major provider, compared across all key dimensions.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextTool CallReasoningVisionStruct. Output
GPT-4.1OpenAI$2.00$8.001,047K✅❌✅✅
o3OpenAI$2.00$8.00200K✅✅✅✅
o4-miniOpenAI$1.10$4.40200K✅✅✅✅
Claude Opus 4Anthropic$15.00$75.00200K✅✅✅✅
Claude Sonnet 4Anthropic$3.00$15.00200K✅✅✅✅
Claude Haiku 3.5Anthropic$0.80$4.00200K✅❌✅✅
Gemini 2.5 ProGoogle$1.25$10.001,048K✅✅✅✅
Gemini 2.5 FlashGoogleFreeFree1,048K✅✅✅✅
Grok 3xAI$3.00$15.00131K✅❌❌❌
Grok 3 MinixAI$0.30$0.50131K✅✅❌❌
DeepSeek R1DeepSeekFreeFree164K✅✅❌❌
DeepSeek V3DeepSeek$0.07$0.27164K✅❌❌❌
Mistral LargeMistral$2.00$6.00128K✅❌✅✅
CodestralMistral$0.30$0.90256K❌❌❌❌
Qwen3-235BAlibabaFreeFree128K✅✅✅✅
Command R+Cohere$2.50$10.00128K✅❌❌✅
Llama 4 MaverickMetaFreeFree1,048K✅❌✅❌
Nova ProAmazon$0.80$3.20300K✅❌✅✅
+ +

2. Best Value Models (Under $1/M Input)

+

Models that offer strong capabilities at budget-friendly prices.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextTool CallReasoningVision
Gemini 2.5 FlashGoogleFreeFree1,048K✅✅✅
DeepSeek R1DeepSeekFreeFree164K✅✅❌
Qwen3-235BAlibabaFreeFree128K✅✅✅
DeepSeek V3DeepSeek$0.07$0.27164K✅❌❌
Grok 3 MinixAI$0.30$0.50131K✅✅❌
CodestralMistral$0.30$0.90256K❌❌❌
Claude Haiku 3.5Anthropic$0.80$4.00200K✅❌✅
Nova ProAmazon$0.80$3.20300K✅❌✅
+ +

3. Context Window Comparison

+

Models with the largest context windows for processing long documents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContext WindowInput $/MTool Call
Gemini 2.5 ProGoogle1,048,576$1.25✅
Gemini 2.5 FlashGoogle1,048,576Free✅
GPT-4.1OpenAI1,047,576$2.00✅
Llama 4 MaverickMeta1,048,576Free✅
Nova ProAmazon300,000$0.80✅
Claude Opus/Sonnet 4Anthropic200,000$3-15✅
o3 / o4-miniOpenAI200,000$1.10-2✅
DeepSeek R1/V3DeepSeek163,840Free✅
+ +

4. Capability Matrix

+

How many models support each capability across our catalog.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
CapabilityModelsFree ModelsCheapest Paid
Tool Calling2,35054ling-2.6-flash ($0.01/$0.03)
Reasoning1,30618qwen3.5-0.8b ($0.01/$0.05)
Vision1,48735ling-2.6-flash ($0.01/$0.03)
Structured Output82924ling-2.6-flash ($0.01/$0.03)
Open Weights52781Free
Image Output285Various
Audio Input11812Various
Audio Output348Various
+ +

5. Best Model by Use Case

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseBest ModelWhyCost
AI AgentsGPT-4.1#1 tool calling, parallel calls$2/$8
CodingClaude Sonnet 4#1 SWE-bench, 64K output$3/$15
Reasoningo3#1 MATH, GPQA$2/$8
Long DocumentsGemini 2.5 Pro1M context, best price$1.25/$10
ChatGPT-4.1#1 Chatbot Arena$2/$8
BudgetGemini 2.5 FlashFree with 1M contextFree
Open SourceQwen3-235BBest open-weight modelFree
VisionGemini 2.5 ProBest MMMU, image+video$1.25/$10
+ +
+ Explore all 4,587 models: Use our + interactive catalog to filter, sort, + compare, and calculate costs for any combination of models. +
+ + +
+

Small Language Models

+

🎯 AI Model Picker

+

⚡ GitHub Action

+
+

+ Data from AI Models Catalog — 4,587 + models across 95 providers. Updated continuously. +

+
+ + diff --git a/site/ai-model-github-action.html b/site/ai-model-github-action.html new file mode 100644 index 00000000..68999b2c --- /dev/null +++ b/site/ai-model-github-action.html @@ -0,0 +1,401 @@ + + + + + + AI Model GitHub Action โ€” Automate Model Data in CI/CD | AI Models Catalog + + + + + + + + + + + + + + + +
+

⚡ AI Model GitHub Action

+

+ Automate AI model data in your CI/CD pipeline. Free, open source, and always up-to-date. +

+ +

Quick Start

+
- name: Get AI Model Data
+  uses: i-need-token/ai-models@v0.2.0
+  with:
+    format: json
+    output: models.json
+ +

Features

+
+
+

📊 Model Data

+

+ Get structured model data with pricing, context windows, and capabilities for 4,587+ + models across 95 providers. +

+
+
+

๐Ÿ” Filter & Search

+

+ Filter by provider, capability (tool calling, reasoning, vision), pricing tier, or + context window size. +

+
+
+

💰 Price Tracking

+

Monitor pricing changes across providers. Get alerts when model prices change.

+
+
+

📋 Format Options

+

Output as JSON, YAML, CSV, or Markdown table. Use in scripts, docs, or dashboards.

+
+
+ +

Action Inputs

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
InputDescriptionDefault
formatOutput format: json, yaml, csv, markdownjson
outputOutput file pathmodels.json
providerFilter by provider name(all)
capabilityFilter by capability: tool_call, reasoning, vision, structured_output(all)
free-onlyOnly include free modelsfalse
max-priceMaximum input price per M tokens(no limit)
min-contextMinimum context window size0
+ +

Usage Examples

+ +

Get Free Models with Tool Calling

+
- name: Get free tool-calling models
+  uses: i-need-token/ai-models@v0.2.0
+  with:
+    format: json
+    output: free-tc-models.json
+    capability: tool_call
+    free-only: true
+ +

Get Cheapest Models Under $0.50/M

+
- name: Get budget models
+  uses: i-need-token/ai-models@v0.2.0
+  with:
+    format: csv
+    output: budget-models.csv
+    max-price: 0.50
+ +

Generate Model Comparison Table

+
- name: Generate comparison table
+  uses: i-need-token/ai-models@v0.2.0
+  with:
+    format: markdown
+    output: model-comparison.md
+    provider: openai
+    capability: reasoning
+ +

Weekly Price Monitoring

+
name: Price Monitor
+on:
+  schedule:
+    - cron: '0 6 * * 1'  # Every Monday 6:00 UTC
+jobs:
+  check-prices:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: i-need-token/ai-models@v0.2.0
+        with:
+          format: csv
+          output: current-prices.csv
+      - name: Compare with last week
+        run: |
+          diff last-week-prices.csv current-prices.csv || echo "Prices changed!"
+      - name: Save for next week
+        run: cp current-prices.csv last-week-prices.csv
+ +

Output Formats

+ +

JSON

+
{
+  "generated_at": "2025-05-21T12:00:00Z",
+  "stats": { "models": 4587, "providers": 95 },
+  "models": [
+    {
+      "id": "gpt-4o",
+      "provider": "openai",
+      "pricing": { "input": 2.5, "output": 10 },
+      "limit": { "context": 128000 },
+      "tool_call": true,
+      "reasoning": false
+    }
+  ]
+}
+ +

CSV

+
id,provider,input_price,output_price,context_window,tool_call,reasoning
+gpt-4o,openai,2.5,10,128000,true,false
+ +

Why Use This Action?

+
    +
  • ✅ Always up-to-date — data refreshed from provider APIs
  • +
  • ✅ First-party data only — no third-party aggregators
  • +
  • ✅ Structured & validated — TypeScript types + Zod schemas
  • +
  • ✅ Zero configuration — works out of the box
  • +
  • ✅ Free & open source — MIT license
  • +
+ +

+ View on GitHub → · + Interactive Catalog → +

+ + + + +
+ + diff --git a/site/ai-model-picker.html b/site/ai-model-picker.html new file mode 100644 index 00000000..f873a6aa --- /dev/null +++ b/site/ai-model-picker.html @@ -0,0 +1,785 @@ + + + + + + + AI Model Picker โ€” Find the Best Model for Your Use Case (2025) | AI Models Catalog + + + + + + + + + + + + + + + + +
+

🎯 AI Model Picker

+

+ Answer 4 questions to find the best AI model for your use case. Data from + AI Models Catalog — 4,587+ models + across 95 providers. +

+ +
+
+
+
+
+
+ +
+ +
+
What are you building?
+
+
+
🤖
+
AI Agents
+
Tool calling, autonomous workflows
+
+
+
💻
+
Code Generation
+
Code completion, review, debugging
+
+
+
💬
+
Chat / RAG
+
Conversational AI, document QA
+
+
+
🧮
+
Math & Reasoning
+
Step-by-step problem solving
+
+
+
๐Ÿ‘๏ธ
+
Vision / Multimodal
+
Image understanding, OCR
+
+
+
๐Ÿญ
+
High-Volume Production
+
Lowest cost per token at scale
+
+
+
+ + +
+
What's your budget per million tokens?
+
+
+
🆓
+
Free
+
$0 — prototyping & testing
+
+
+
💰
+
Under $0.10/M
+
Budget-friendly production
+
+
+
โš–๏ธ
+
Under $1/M
+
Balanced cost & quality
+
+
+
💎
+
Premium
+
Best quality regardless of cost
+
+
+
+ + +
+
How much context do you need?
+
+
+
๐Ÿ“
+
Under 32K
+
Short prompts, simple tasks
+
+
+
📄
+
32K – 128K
+
Documents, code files
+
+
+
📚
+
128K – 512K
+
Large codebases, long documents
+
+
+
๐Ÿ—„๏ธ
+
512K+
+
Entire repos, massive datasets
+
+
+
+ + +
+
What matters most?
+
+
+
💸
+
Lowest Cost
+
Minimize spending per token
+
+
+
๐Ÿ†
+
Best Quality
+
Highest accuracy & reasoning
+
+
+
⚡
+
Lowest Latency
+
Fastest response time
+
+
+
🔒
+
Privacy / On-Device
+
Data never leaves your device
+
+
+
+
+ + +
+

🎯 Recommended Models

+

+
+
+ ๐Ÿ” Explore All 4,587 Models โ†’ + +
+
+ + + + + +

⚡ GitHub Action

+ +
+ + + + diff --git a/site/ai-model-pricing-calculator.html b/site/ai-model-pricing-calculator.html new file mode 100644 index 00000000..38b5a0fa --- /dev/null +++ b/site/ai-model-pricing-calculator.html @@ -0,0 +1,915 @@ + + + + + + AI Model Pricing Calculator โ€” LLM Cost Calculator (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

💰 AI Model Pricing Calculator (2025)

+

+ Calculate your monthly AI costs. Compare pricing for 4,587+ models across + 95 providers. Real-time cost estimation based on your token usage. +

+ +
+
4,587+Models
+
95Providers
+
81Free Models
+
1,374With Cache Pricing
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +

๐Ÿงฎ Cost Calculator

+
+ + + + + + + + + + +
+ + + +

📊 Quick Cost Comparison

+

Monthly cost for 1M input + 0.5M output tokens across popular models.

+
+
+
gpt-4o
+
$7.50/mo
+
$2.5 in / $10 out per 1M
+
+
+
gpt-4o-mini
+
$0.45/mo
+
$0.15 in / $0.6 out per 1M
+
+
+
gpt-4.1
+
$6.00/mo
+
$2 in / $8 out per 1M
+
+
+
gpt-4.1-mini
+
$1.20/mo
+
$0.4 in / $1.6 out per 1M
+
+
+
o3
+
$30.00/mo
+
$10 in / $40 out per 1M
+
+
+
o4-mini
+
$3.30/mo
+
$1.1 in / $4.4 out per 1M
+
+
+
gemini-2.5-pro
+
$6.25/mo
+
$1.25 in / $10 out per 1M
+
+
+
gemini-2.5-flash
+
$1.55/mo
+
$0.3 in / $2.5 out per 1M
+
+
+
gemini-2.0-flash
+
$0.30/mo
+
$0.1 in / $0.4 out per 1M
+
+
+
deepseek-chat
+
$0.28/mo
+
$0.14 in / $0.28 out per 1M
+
+
+
deepseek-r1
+
$4.05/mo
+
$1.35 in / $5.4 out per 1M
+
+
+
llama-4-maverick
+
$0.69/mo
+
$0.25 in / $0.87 out per 1M
+
+
+ +

💵 Cheapest Models Overall

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-image-1-miniaimlapi$0.007$0.676?
mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
qwen3.5-0.8bdeepinfra$0.01$0.05262K
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
openai--gpt-image-1-modelaimlapi$0.012$0.175?
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
+ +

🔧 Cheapest with Tool Calling

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
gpt-oss-20binferencenet$0.03$0.15131K
schematron-v2-turboinferencenet$0.03$0.15131K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
+ +

🧠 Cheapest with Reasoning

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
gpt-oss-20bdeepinfra$0.03$0.14131K
qwen3.5-4bdeepinfra$0.03$0.15262K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120bdeepinfra$0.039$0.19131K
nvidia-nemotron-nano-9b-v2deepinfra$0.04$0.16131K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
nemotron-3-nano-30b-a3bdeepinfra$0.05$0.2262K
+ +

๐Ÿ‘๏ธ Cheapest with Vision

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
paddlepaddle--paddleocr-vlnovitaai$0.02$0.0216K
qwen3.5-4bdeepinfra$0.03$0.15262K
deepseek--deepseek-ocr-2novitaai$0.03$0.038K
deepseek--deepseek-ocrnovitaai$0.03$0.038K
reka-edge-2reka$0.03$0.1131K
zai-org--autoglm-phone-9b-multilingualnovitaai$0.035$0.13865K
gemini-1.5-flash-8bdeepinfra$0.0375$0.151M
google-gemma-3-4bamazon-bedrock$0.04$0.08131K
+ +

💡 How to Reduce Your AI Costs

+
    +
  • + Use smaller models for simple tasks — GPT-4o Mini is roughly 17x cheaper than GPT-4o for + basic tasks +
  • +
  • + Enable prompt caching — 1,374 models offer cache pricing (typically 50% off cached + input tokens) +
  • +
  • + Choose open-weight models — 527 models you can self-host for fixed infrastructure + costs +
  • +
  • + Try free models for prototyping — 81 models at zero cost before committing to paid + APIs +
  • +
  • + Compare across providers — same model (e.g., Llama 4) may cost differently on Groq + vs. Together vs. Fireworks +
  • +
  • + Use the interactive catalog — + filter by capability and sort by price +
  • +
+ +

📊 Methodology

+

+ All pricing data is sourced from first-party provider APIs. Prices are per million + tokens (1M = 1,000,000 tokens). Aggregator providers are excluded from ranking tables to avoid + duplicate models. Cache pricing is shown separately where available. +

+ +

🔗 More Resources

+ + + Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/ai-models-by-provider.html b/site/ai-models-by-provider.html new file mode 100644 index 00000000..c834ae3c --- /dev/null +++ b/site/ai-models-by-provider.html @@ -0,0 +1,4584 @@ + + + + + + AI Models by Provider โ€” All 95 Providers Listed (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

🏢 AI Models by Provider — All 95 Providers Listed

+

+ Browse 4,587 AI models across 95 providers. First-party data with real pricing, + context windows, and capabilities. +

+ +
+
95Providers
+
4,587Models
+
81Free Models
+
527Open Weights
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + + + +

📊 Provider Overview

+

All 95 providers sorted by number of models. Click a provider to see their models.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ProviderModelsCheapest Input $/1MMax ContextTool CallFree
+ nanogpt (aggregator) + 547Aggregator?0
+ aihubmix (aggregator) + 476Aggregator?132
+ openrouter (aggregator) + 356Aggregator10M263โœ…
+ martian (aggregator) + 304Aggregator?0
+ requesty (aggregator) + 277Aggregator1M251
+ 302ai (aggregator) + 268Aggregator2M190
+ auriko (aggregator) + 181Aggregator1M154โœ…
+ llmgateway (aggregator) + 163Aggregator?158โœ…
+ aimlapi + 147$0.0072M21โœ…
+ fastrouter (aggregator) + 120Aggregator2M94โœ…
+ orcarouter (aggregator) + 120Aggregator1M102
+ cortecs (aggregator) + 105Aggregator?97
+ novitaai + 104$0.021M72โœ…
+ vultr + 98$0.551M11
+ deepinfra + 88$0.011M0
+ venice (aggregator) + 75Aggregator2M64
+ jiekou (aggregator) + 73Aggregator2M73
+ meganova (aggregator) + 63Aggregator1M60โœ…
+ alibaba + 62$0.151M62
+ ppio + 60$0.21451M46โœ…
+ amazon-bedrock + 57$0.0351M37
+ google-vertex + 38$0.071M32
+ siliconflow-cn + 37$0.5262K2
+ stepfun + 31$0.7256K0โœ…
+ cloudflare + 30$0.017327K15
+ databricks + 29$0.05200K4
+ gmicloud + 29$0.071M11
+ openai + 28$0.021M18
+ siliconflow + 27$0.041M24
+ togetherai + 24$0.03262K22
+ nebius + 23$0.021M21
+ google + 21$0.0752M8โœ…
+ minimax + 21$2.1204K0
+ voyage + 21$0.02?0โœ…
+ digitalocean + 20$0.051M14
+ inferencenet + 20$0.01131K15
+ zhipuai + 20$0.11M20โœ…
+ tencent-tokenhub + 19$11M16
+ mistral + 16$0.04256K12โœ…
+ moonshotai + 16$2262K0
+ neuralwatt + 14$0.03?14
+ tencent + 14$0.5250K3โœ…
+ scaleway + 13$0.15131K6
+ chutes + 12$0.08262K12
+ clarifai + 12$0.091M9
+ cloudferro-sherlock + 12$0.261M5
+ groq + 12$0.05131K8
+ klusterai + 12$0.0081M4
+ meta + 12$0.110M9
+ microsoft + 12$0.075128K6
+ ovhcloud + 12$0.05262K0
+ anthropic + 11$11M11
+ baichuan + 11$0.98131K0โœ…
+ cerebras + 11$0.1131K9โœ…
+ hpc-ai + 11$0.141M11
+ hyperbolic + 11$0.1163K0
+ fireworks + 10$0.071M10
+ baseten + 9$0.11M9
+ baidu + 8$0.1261M7โœ…
+ evroc + 8$0.1131K3
+ friendli + 8$0.1262K8
+ upstage + 8$0.1128K3
+ amazon + 7$0.0351M7
+ arcee + 7$0.04262K6โœ…
+ berget + 7$0.2?7
+ morph + 7$0.21M5
+ nousresearch + 7$0.06131K7
+ sambanova + 7$0.22196K0
+ dinference + 6$0.07204K3
+ iflytek + 6$0.8262K0โœ…
+ submodel + 6$0.1262K0
+ textsynth + 6$0.2131K0
+ writer + 6$0.61M3
+ xai + 6$0.2131K6
+ 01ai + 5$132K4
+ aion + 5$0.7131K0
+ bytedance + 5$0.07262K4
+ inception + 5$0.25128K3
+ mixlayer + 5$0.1131K5โœ…
+ privatemode + 5$0.43131K3
+ xiaomi + 5$0.11M5
+ deepseek + 4$0.141M4
+ perplexity + 4$1200K4
+ inclusionai + 3$0.01262K3
+ ai21 + 2$0.2256K0
+ reka + 2$0.03131K1
+ wafer + 2$0.6262K2
+ +

๐Ÿข OpenAI

+

GPT-4, GPT-4o, o1, o3 — the industry standard for LLMs. 28 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
text-embedding-3-small$0.02$08K
gpt-4.1-nano$0.1$0.41Mโœ…
text-embedding-ada-002$0.1$08K
text-embedding-3-large$0.13$08K
gpt-4o-mini$0.15$0.6128Kโœ…
gpt-4.1-mini$0.4$1.61Mโœ…
gpt-3.5-turbo$0.5$1.516Kโœ…
o3-mini$1.1$4.4200Kโœ…โœ…
o4-mini$1.1$4.4200Kโœ…โœ…
codex-mini$1.5$6192Kโœ…
o1-mini$1.5$6128Kโœ…โœ…
gpt-4.1$2$81Mโœ…
gpt-4o-audio$2.5$10128Kโœ…
gpt-4o$2.5$10128Kโœ…
gpt-3.5-turbo-16k$3$416Kโœ…
gpt-4o-realtime$5$20128Kโœ…
gpt-4-turbo$10$30128Kโœ…
o3$10$40200Kโœ…โœ…
o1-realtime$15$60200Kโœ…โœ…
o1$15$60200Kโœ…โœ…
gpt-4$30$608Kโœ…
gpt-4-32k$60$12032K
o1-pro$150$600200Kโœ…โœ…
dall-e-2$?$??
dall-e-3$?$??
tts-1-hd$?$??
tts-1$?$??
whisper-1$?$??
+ +

๐Ÿข Anthropic

+

Claude — known for safety, reasoning, and long context. 11 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
claude-haiku-4-5$1$5200Kโœ…โœ…
claude-sonnet-4-0$3$151Mโœ…โœ…
claude-sonnet-4-5$3$151Mโœ…โœ…
claude-sonnet-4-6$3$151Mโœ…โœ…
claude-opus-4-5$5$25200Kโœ…โœ…
claude-opus-4-6$5$251Mโœ…โœ…
claude-opus-4-7$5$251Mโœ…โœ…
claude-opus-4-0$15$75200Kโœ…โœ…
claude-opus-4-1$15$75200Kโœ…โœ…
claude-opus-4-6-fast$30$1501Mโœ…โœ…
claude-opus-4-7-fast$30$1501Mโœ…โœ…
+ +

๐Ÿข Google

+

Gemini — multimodal models with massive context windows. 21 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
gemini-1.5-flash-8b$0.075$0.31Mโœ…
gemini-1.5-flash$0.075$0.31Mโœ…
gemini-2.0-flash-lite$0.075$0.31Mโœ…
gemini-2.0-flash$0.1$0.41Mโœ…
gemini-2.5-flash-lite$0.1$0.41Mโœ…
gemini-2.5-flash$0.15$3.51Mโœ…โœ…
gemini-1.5-pro$1.25$52Mโœ…
gemini-2.5-pro$1.25$101Mโœ…โœ…
chirp-3.0-HD$?$??
gemma-3-12b-itFree131K
gemma-3-1b-itFree131K
gemma-3-27b-itFree131K
gemma-3-4b-itFree131K
gemma-3n-E2B-itFree131K
gemma-3n-E4B-itFree131K
imagen-3.0-fast-generate$?$??
imagen-3.0-generate$?$??
imagen-4.0-fast-generate$?$??
imagen-4.0-generate$?$??
lyria-2.0$?$??
veo-2.0-generate$?$??
+ +

๐Ÿข Meta

+

Llama — open-weight models you can run anywhere. 12 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
meta-llama-3.2-1b$0.1$0.1128K
meta-llama-3.2-3b$0.15$0.15128K
meta-llama-3.2-11b-vision$0.16$0.16128Kโœ…
meta-llama-4-scout$0.17$0.6610Mโœ…
meta-llama-3.1-8b$0.22$0.22128Kโœ…
meta-llama-4-maverick$0.24$0.971Mโœ…
meta-llama-3-8b$0.3$0.68K
meta-llama-3.1-70b$0.72$0.72128Kโœ…
meta-llama-3.2-90b-vision$0.72$0.72128Kโœ…
meta-llama-3.3-70b$0.72$0.72128Kโœ…
meta-llama-3.1-405b$2.4$2.4128Kโœ…
meta-llama-3-70b$2.65$3.58Kโœ…
+ +

๐Ÿข DeepSeek

+

High-performance reasoning at competitive prices. 4 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
deepseek-chat$0.14$0.281Mโœ…
deepseek-reasoner$0.14$0.281Mโœ…โœ…
deepseek-v4-flash$0.14$0.281Mโœ…โœ…
deepseek-v4-pro$0.435$0.871Mโœ…โœ…
+ +

๐Ÿข Mistral

+

European AI with open and commercial models. 16 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
ministral-3b$0.04$0.04128Kโœ…
voxtral-mini$0.04$0.04128K
ministral-8b$0.1$0.1128Kโœ…
voxtral-small$0.1$0.3128K
mistral-7b$0.15$0.232K
mistral-nemo$0.15$0.15128Kโœ…
mistral-small$0.2$0.6128Kโœ…
mistral-medium$0.4$2128Kโœ…
mixtral-8x7b$0.45$0.732Kโœ…
magistral-small$0.5$1.5128Kโœ…โœ…
mixtral-8x22b$0.8$1.264Kโœ…
mistral-large$2$6128Kโœ…
pixtral-large$2$6128Kโœ…
mistral-large-2407$4$12128Kโœ…
codestralFree256K
devstralFree128Kโœ…
+ +

๐Ÿข xAI

+

Grok — models with real-time knowledge. 6 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
xai-grok-4-fast$0.2$0.5131Kโœ…
xai-grok-4.1$0.2$0.5131Kโœ…โœ…
xai-grok-3-mini$0.25$1.27131Kโœ…โœ…
xai-grok-4.2$2$6131Kโœ…โœ…
xai-grok-3$3$15131Kโœ…โœ…
xai-grok-4$3$15131Kโœ…โœ…
+ +

๐Ÿข AWS Bedrock

+

Managed access to multiple foundation models. 57 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
amazon-nova-micro$0.035$0.14128Kโœ…
google-gemma-3-4b$0.04$0.08131K
mistral-voxtral-mini$0.04$0.04128K
amazon-nova-lite$0.06$0.24300Kโœ…
nvidia-nemotron-nano-2$0.06$0.234K
nvidia-nemotron-nano-3-30b$0.06$0.244K
openai-gpt-oss-20b$0.07$0.3131Kโœ…
openai-gpt-oss-safeguard-20b$0.07$0.2131Kโœ…
zai-glm-4-7-flash$0.07$0.4131Kโœ…
google-gemma-3-12b$0.09$0.29131K
meta-llama-3-2-1b$0.1$0.1128K
mistral-ministral-3b$0.1$0.1128K
mistral-voxtral-small$0.1$0.3128K
meta-llama-3-2-3b$0.15$0.15128K
mistral-ministral-8b$0.15$0.15128K
mistral-mistral-7b$0.15$0.232K
nvidia-nemotron-3-super-120b$0.15$0.654K
openai-gpt-oss-120b$0.15$0.6131Kโœ…
openai-gpt-oss-safeguard-120b$0.15$0.6131Kโœ…
qwen-qwen3-32b$0.15$0.6131Kโœ…
qwen-qwen3-coder-30b-a3b$0.15$0.6131Kโœ…
writer-palmyra-vision-7b$0.15$0.68K
meta-llama-3-2-11b$0.16$0.16128Kโœ…
meta-llama-4-scout-17b$0.17$0.661Mโœ…
mistral-ministral-14b$0.2$0.2128K
nvidia-nemotron-nano-2-vl$0.2$0.64K
meta-llama-3-1-8b$0.22$0.22128Kโœ…
google-gemma-3-27b$0.23$0.38131K
meta-llama-4-maverick-17b$0.24$0.971Mโœ…
meta-llama-3-8b$0.3$0.68K
minimax-m2-1$0.3$1.21Mโœ…
minimax-m2-5$0.3$1.21Mโœ…
minimax-m2$0.3$1.21Mโœ…
amazon-nova-2-lite$0.33$2.7564Kโœ…
mistral-devstral$0.4$2128Kโœ…
mistral-mixtral-8x7b$0.45$0.732K
mistral-magistral-small$0.5$1.5128Kโœ…
mistral-mistral-large-3$0.5$1.5128Kโœ…
qwen-qwen3-coder-next$0.5$1.2131Kโœ…
qwen-qwen3-vl-235b-a22b$0.53$2.66131Kโœ…
kimi-k2-thinking$0.6$2.5131Kโœ…
moonshot-kimi-k2-5$0.6$3131Kโœ…
zai-glm-4-7$0.6$2.2131Kโœ…
deepseek-v3-2$0.62$1.8565Kโœ…
meta-llama-3-1-70b$0.72$0.72128Kโœ…
meta-llama-3-2-90b$0.72$0.72128Kโœ…
meta-llama-3-3-70b$0.72$0.72128Kโœ…
amazon-nova-pro$0.8$3.2300Kโœ…
meta-llama-3-1-70b-latency-optimized$0.9$0.9128Kโœ…
amazon-nova-pro-latency-optimized$1$4300Kโœ…
mistral-mistral-small$1$3128Kโœ…
zai-glm-5$1$3.2131Kโœ…
deepseek-r1$1.35$5.465K
mistral-pixtral-large$2$6128Kโœ…
amazon-nova-premier$2.5$12.51Mโœ…
meta-llama-3-70b$2.65$3.58K
mistral-mistral-large$4$12128Kโœ…
+ +

๐Ÿข Groq

+

Ultra-fast inference with LPU hardware. 12 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
llama-3.1-8b-instant$0.05$0.08131Kโœ…
gpt-oss-20b$0.075$0.3131Kโœ…
gpt-oss-safeguard-20b$0.075$0.3131Kโœ…
llama-4-scout-17b-16e-instruct$0.11$0.34131Kโœ…
gpt-oss-120b$0.15$0.6131Kโœ…
qwen3-32b$0.29$0.59131Kโœ…
llama-3.3-70b-versatile$0.59$0.79131Kโœ…
kimi-k2-instruct-0905$1$3131Kโœ…
orpheus-ar-sa$?$??
orpheus-en$?$??
whisper-large-v3-turbo$?$??
whisper-large-v3$?$??
+ +

๐Ÿข Together AI

+

Open-weight model hosting platform. 24 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
liquid-ai--LFM2-24B-A2B$0.03$0.12131Kโœ…
openai--gpt-oss-20b$0.05$0.2131Kโœ…
google--gemma-3n-E4B-it$0.06$0.12131K
Qwen--Qwen3.5-9B$0.1$0.15131Kโœ…
meta-llama--Meta-Llama-3.1-8B-Instruct-Lite$0.1$0.1131Kโœ…
essential-ai--Rnj-1-Instruct$0.15$0.15131K
openai--gpt-oss-120b$0.15$0.6131Kโœ…
Qwen--Qwen3-235B-A22B-FP8-Throughput$0.2$0.6131Kโœ…
MiniMaxAI--MiniMax-M2.5$0.3$1.2131Kโœ…
MiniMaxAI--MiniMax-M2.7$0.3$1.2131Kโœ…
Qwen--Qwen2.5-7B-Instruct-Turbo$0.3$0.3131Kโœ…
google--gemma-4-31B-it$0.39$0.97131Kโœ…
Qwen--Qwen3-Coder-Next$0.5$1.2131Kโœ…
Qwen--Qwen3.6-Plus$0.5$3131Kโœ…
moonshotai--Kimi-K2.5$0.5$2.8131Kโœ…
Qwen--Qwen3.5-397B-A17B$0.6$3.6131Kโœ…
deepseek-ai--DeepSeek-V3.1$0.6$1.7131Kโœ…
meta-llama--Llama-3.3-70B-Instruct-Turbo$0.88$0.88131Kโœ…
zai-org--GLM-5$1$3.2131Kโœ…
moonshotai--Kimi-K2.6$1.2$4.5262Kโœ…
cogito-ai--Cogito-v2.1-671B$1.25$1.25131Kโœ…โœ…
zai-org--GLM-5.1$1.4$4.4131Kโœ…
Qwen--Qwen3-Coder-480B-A35B-Instruct$2$2131Kโœ…
deepseek-ai--DeepSeek-V4-Pro$2.1$4.4131Kโœ…โœ…
+ +

๐Ÿข Fireworks

+

Fast inference for open-source models. 10 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
gpt-oss-20b$0.07$0.3131Kโœ…
gpt-oss-120b$0.15$0.6131Kโœ…
llama4-scout-17b-16e-instruct$0.18$0.59131Kโœ…
minimax-m2.5$0.3$1.2196Kโœ…
minimax-m2.7$0.3$1.2196Kโœ…
qwen3.6-plus$0.5$3131Kโœ…
kimi-k2.5$0.6$3262Kโœ…
kimi-k2.6$0.95$4262Kโœ…
glm-5.1$1.4$4.4202Kโœ…
deepseek-v4-pro$1.74$3.481Mโœ…โœ…
+ +

๐Ÿข Cerebras

+

Wafer-scale inference at extreme speed. 11 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
llama3.1-8b$0.1$0.1131Kโœ…
gpt-oss-120b$0.35$0.75131Kโœ…
qwen3-235b-instruct$0.6$1.2131Kโœ…
zai-glm-4.7$2.25$2.75131Kโœ…
deepseek-r1-distill-llama-70bFree131Kโœ…
deepseek-r1-distill-llama-8bFree131Kโœ…
llama-3.3-70bFree131Kโœ…
llama-4-scout-17b-16e-instructFree131Kโœ…
qwen-2.5-32bFree131Kโœ…
qwen-2.5-coder-32bFree131Kโœ…
qwen3-32bFree131Kโœ…
+ +

๐Ÿข Databricks

+

DBRX and enterprise AI models. 29 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
databricks-gpt-5-nano$0.05$0.4200K
databricks-gpt-oss-20b$0.07$0.3131K
databricks-gemma-3-12b$0.15$0.5131K
databricks-gpt-oss-120b$0.15$0.6131K
databricks-meta-llama-3-1-8b-instruct$0.15$0.45131Kโœ…
databricks-qwen3-next-80b-a3b-instruct$0.15$1.2131Kโœ…
databricks-gpt-5-4-nano$0.2$1.25128K
databricks-gemini-3-1-flash-lite$0.25$1.5128K
databricks-gpt-5-1-codex-mini$0.25$2200K
databricks-gpt-5-mini$0.25$2200K
databricks-gemini-2-5-flash$0.3$2.5128K
databricks-llama-4-maverick$0.5$1.5131Kโœ…
databricks-meta-llama-3-3-70b-instruct$0.5$1.5131Kโœ…
databricks-gemini-3-flash$0.63$3.75128K
databricks-gpt-5-4-mini$0.75$4.5128K
databricks-claude-haiku-4-5$1$5200K
databricks-gemini-2-5-pro$1.25$10128K
databricks-gpt-5-1-codex-max$1.25$10200K
databricks-gpt-5-1$1.25$10200K
databricks-gpt-5$1.25$10200K
databricks-gpt-5-2-codex$1.75$14200K
databricks-gpt-5-2$1.75$14200K
databricks-gemini-3-1-pro$2.5$15128K
databricks-gpt-5-4$2.5$15128K
databricks-claude-sonnet-4-5$3$15200K
databricks-claude-sonnet-4$3$15200K
databricks-claude-opus-4-5$5$25200K
databricks-gpt-5-5$5$30128K
databricks-claude-opus-4-1$15$75200K
+ +

๐Ÿข Alibaba (Qwen)

+

Qwen — multilingual models from Alibaba Cloud. 62 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
qwen-flash$0.15$1.5?โœ…โœ…
qwen3.5-flash-2026-02-23$0.2$21Mโœ…
qwen3.5-flash$0.2$21Mโœ…
qwen-flash-character$0.25$1.5?โœ…โœ…
qwen-turbo$0.3$0.6?โœ…โœ…
qwen3-0.6b$0.3$1.2?โœ…โœ…
qwen3-1.7b$0.3$1.2?โœ…โœ…
qwen3-4b$0.3$1.2?โœ…โœ…
qwen-omni-turbo$0.4$25?โœ…โœ…
qwen3.5-35b-a3b$0.4$3.2256Kโœ…
qwen-long-2025-01-25$0.5$2?โœ…โœ…
qwen-long-latest$0.5$2?โœ…โœ…
qwen-long$0.5$2?โœ…โœ…
qwen2.5-7b-instruct-1m$0.5$1?โœ…โœ…
qwen2.5-7b-instruct$0.5$1?โœ…โœ…
qwen3-8b$0.5$2?โœ…โœ…
qwen-mt-lite$0.6$1.6?โœ…โœ…
qwen2.5-omni-7b$0.6$38?โœ…โœ…
qwen3.5-27b$0.6$4.8256Kโœ…
qwen-mt-flash$0.7$1.95?โœ…โœ…
qwen-mt-turbo$0.7$1.95?โœ…โœ…
qwen3-30b-a3b-instruct-2507$0.75$3?โœ…โœ…
qwen3-30b-a3b$0.75$3?โœ…โœ…
qwen-plus-character$0.8$2?โœ…โœ…
qwen-plus$0.8$2?โœ…โœ…
qwen3.5-122b-a10b$0.8$6.4256Kโœ…
qwen3.5-plus-2026-02-15$0.8$4.81Mโœ…
qwen3.5-plus$0.8$4.81Mโœ…
qwen2.5-14b-instruct-1m$1$3?โœ…โœ…
qwen2.5-14b-instruct$1$3?โœ…โœ…
qwen3-14b$1$4?โœ…โœ…
qwen3-coder-flash-2025-07-28$1$4?โœ…โœ…
qwen3-coder-flash$1$4?โœ…โœ…
qwen3-coder-next$1$4?โœ…โœ…
qwen3-next-80b-a3b-instruct$1$4?โœ…โœ…
qwen2.5-vl-3b-instruct$1.2$3.6?โœ…โœ…
qwen3.5-397b-a17b$1.2$7.2256Kโœ…
qwen3.6-flash-2026-04-16$1.2$7.21Mโœ…
qwen3.6-flash$1.2$7.21Mโœ…โœ…
qwen3-coder-30b-a3b-instruct$1.5$6?โœ…โœ…
qwen-mt-plus$1.8$5.4?โœ…โœ…
qwen2.5-32b-instruct$2$6?โœ…โœ…
qwen2.5-vl-7b-instruct$2$5?โœ…โœ…
qwen3-235b-a22b-instruct-2507$2$8?โœ…โœ…
qwen3-235b-a22b$2$8?โœ…โœ…
qwen3-32b$2$8?โœ…โœ…
qwen3.6-plus-2026-04-02$2$121Mโœ…
qwen3.6-plus$2$121Mโœ…โœ…
qwen-max$2.4$9.6?โœ…โœ…
qwen3-max-2026-01-23$2.5$10?โœ…โœ…
qwen3-max$2.5$10?โœ…โœ…
qwen-plus-character-ja$3.67$10.275?โœ…โœ…
qwen2.5-72b-instruct$4$12?โœ…โœ…
qwen3-coder-plus-2025-07-22$4$16?โœ…โœ…
qwen3-coder-plus-2025-09-23$4$16?โœ…โœ…
qwen3-coder-plus$4$16?โœ…โœ…
qwen3-coder-480b-a35b-instruct$6$24?โœ…โœ…
qwen3-max-2025-09-23$6$24?โœ…โœ…
qwen3-max-preview$6$24?โœ…โœ…
qwen2.5-vl-32b-instruct$8$24?โœ…โœ…
qwen3.6-max-preview$9$54256Kโœ…โœ…
qwen2.5-vl-72b-instruct$16$48?โœ…โœ…
+ +

๐Ÿข ByteDance

+

Doubao — models from the TikTok parent company. 5 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
seed-1.6-flash$0.07$0.3262Kโœ…โœ…
seed-2.0-mini$0.1$0.4262Kโœ…โœ…
ui-tars-1.5-7b$0.1$0.2128K
seed-1.6$0.25$2262Kโœ…โœ…
seed-2.0-lite$0.25$2262Kโœ…โœ…
+ +

๐Ÿข MiniMax

+

Chinese AI startup with competitive models. 21 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
M2-her$2.1$8.464K
MiniMax-M2.1$2.1$8.4204K
MiniMax-M2.5$2.1$8.4204K
MiniMax-M2.7$2.1$8.4204K
MiniMax-M2$2.1$8.4204K
MiniMax-M2.1-highspeed$4.2$16.8204K
MiniMax-M2.5-highspeed$4.2$16.8204K
MiniMax-M2.7-highspeed$4.2$16.8204K
MiniMax-Hailuo-02$?$??
MiniMax-Hailuo-2.3-Fast$?$??
MiniMax-Hailuo-2.3$?$??
image-01-live$?$??
image-01$?$??
music-2.6$?$??
music-cover$?$??
speech-02-hd$?$??
speech-02-turbo$?$??
speech-2.6-hd$?$??
speech-2.6-turbo$?$??
speech-2.8-hd$?$??
speech-2.8-turbo$?$??
+ +

๐Ÿข Moonshot AI

+

Kimi — long-context Chinese models. 16 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
moonshot-v1-8k-vision-preview$2$108K
moonshot-v1-8k$2$108K
kimi-k2-0711-preview$4$16131K
kimi-k2-0905-preview$4$16262K
kimi-k2-thinking$4$16262Kโœ…
kimi-k2.5$4$21262Kโœ…
kimi-vl-a3b-thinking$4$21131Kโœ…
kimi-vl-a3b$4$21131K
moonshot-v1-32k-vision-preview$5$2032K
moonshot-v1-32k$5$2032K
kimi-k2.6-long$6.5$27262Kโœ…
kimi-k2.6$6.5$27262Kโœ…
kimi-k2-thinking-turbo$8$58262Kโœ…
kimi-k2-turbo-preview$8$58262K
moonshot-v1-128k-vision-preview$10$30131K
moonshot-v1-128k$10$30131K
+ +

๐Ÿข StepFun

+

Step — Chinese AI models with strong capabilities. 31 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
step-3.5-flash-2603$0.7$2.1256K
step-3.5-flash$0.7$2.1256K
step-2-mini$1$232K
step-3$1.5$464K
step-1o-turbo-vision$2.5$832K
step-r1-v-mini$2.5$8100K
step-1-8k$5$208K
step-1v-8k$5$208K
step-audio-2$10$70?
stepaudio-2.5-chat$10$25?
stepaudio-2.5-realtime$10$70?
step-1-32k$15$7032K
step-1o-vision-32k$15$7032K
step-1v-32k$15$7032K
step-1o-audio$25$60?
step-2-16k-exp$38$12016K
step-2-16k$38$12016K
step-1x-editFree?
step-1x-medium$?$??
step-2x-largeFree?
step-asr-1.1-stream$?$??
step-asr-1.1$?$??
step-asr$?$??
step-audio-r1.1Free?
step-guiFree?
step-image-edit-2$?$??
step-tts-2$?$??
step-tts-mini$?$??
stepaudio-2-asr-pro$?$??
stepaudio-2.5-asr$?$??
stepaudio-2.5-tts$?$??
+ +

๐Ÿข Baidu

+

ERNIE — models from China's search giant. 8 models available.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
deepseek-v4-flash$0.126$0.2521Mโœ…โœ…
deepseek-v3.2$0.252$0.378131Kโœ…โœ…
minimax-m2.5$0.27$1.08196Kโœ…โœ…
qianfan-ocr-fast$0.68$2.8165K
glm-5$0.7$2.24202Kโœ…โœ…
glm-5.1$0.98$3.08202Kโœ…โœ…
deepseek-v4-pro$1.521$3.042716Kโœ…โœ…
cobuddyFree131Kโœ…
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs — not third-party aggregators. Pricing, + context windows, and capabilities are verified against official provider documentation. + Aggregator providers (OpenRouter, Requesty, etc.) are labeled as such — they provide access to + other providers' models. +

+ +

๐Ÿ”— More Resources

+ + + Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/best-ai-models-for-agents.html b/site/best-ai-models-for-agents.html new file mode 100644 index 00000000..f67af0e0 --- /dev/null +++ b/site/best-ai-models-for-agents.html @@ -0,0 +1,1003 @@ + + + + + + Best AI Models for Agents โ€” Top Agentic LLMs Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

🤖 Best AI Models for Agents (2025)

+

+ Compare the top AI models for building autonomous agents. 1,080+ agentic models built on tool + calling — the key capability for agentic workflows. +

+ +
+
1,080Agentic Models
+
2,350Tool Calling
+
1,306Reasoning
+
829Structured Output
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ 💡 What makes a model "agentic"? The three key capabilities are: + Tool calling (invoke APIs/functions), Reasoning (plan multi-step actions), and + Structured output (return parseable JSON). Models with all three are the most capable + agents. +
+ +

๐Ÿ† Top Agentic Models โ€” Full Stack (Tool Call + Reasoning + Structured Output)

+

Models with all three agentic capabilities. Best for complex autonomous workflows.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-oss-20bneuralwatt$0.03$0.16?
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K
zai-org--glm-4.7-flashnovitaai$0.07$0.4200K
Qwen--Qwen3-32B-TEEchutes$0.08$0.2440K
Gemma-3-27b-itnebius$0.1$0.396K
Qwen3-32Bnebius$0.1$0.3128K
xiaomimimo--mimo-v2-flashnovitaai$0.1$0.3262K
Qwen--Qwen3-235B-A22B-Thinking-2507chutes$0.11$0.6262K
deepseek-v4-flashbaidu$0.126$0.2521M
google--gemma-4-31B-turbo-TEEchutes$0.13$0.38131K
Hermes-4-70Bnebius$0.13$0.4128K
google--gemma-4-26b-a4b-itnovitaai$0.13$0.4262K
+ +

๐Ÿ”ง Tool Calling + Reasoning

+

+ Models that can both call tools and reason about when/how to use them. Essential for + ReAct-style agents. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120binferencenet$0.05$0.45131K
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K
glm-4.7-flashcloudflare$0.06$0.4131K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K
seed-1.6-flashbytedance$0.07$0.3262K
ring-2.6-1tinclusionai$0.07$0.62262K
zai-org--glm-4.7-flashnovitaai$0.07$0.4200K
microsoft-phi-4-mini-reasoningmicrosoft$0.075$0.3128K
Qwen--Qwen3-32B-TEEchutes$0.08$0.2440K
gpt-oss-120bclarifai$0.09$0.36131K
+ +

๐Ÿ’ฐ Cheapest Tool Calling Models

+

Most affordable models with tool calling for budget-conscious agent deployments.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
gpt-oss-20binferencenet$0.03$0.15131K
schematron-v2-turboinferencenet$0.03$0.15131K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
liquid-ai--LFM2-24B-A2Btogetherai$0.03$0.12131K
amazon-nova-microamazon$0.035$0.14128K
amazon-nova-microamazon-bedrock$0.035$0.14128K
mistral-nemo-12b-instruct--fp-8inferencenet$0.0375$0.1131K
+ +

๐Ÿ†“ Free Models with Tool Calling

+

Zero-cost models for building and testing agents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextReasoningStructured Output
openrouter--owl-alphaopenrouter1Mโœ…
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…
qwen--qwen3-coder--freeopenrouter1M
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…โœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…
+ +

๐Ÿ”“ Open-Weight Models with Tool Calling

+

Run agent models locally for full privacy and zero API costs at scale.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextReasoningStructured Output
google--gemma-4-31b-itorcarouter1M
qwen--qwen3.5-flash-2026-02-23orcarouter1M
qwen--qwen3.5-flashorcarouter1M
qwen--qwen3.6-flash-2026-04-16orcarouter1M
qwen--qwen3.6-flashorcarouter1M
meta-llama-4-maverick-17bamazon-bedrock1M
meta-llama-4-scout-17bamazon-bedrock1M
minimax-m2-1amazon-bedrock1M
minimax-m2-5amazon-bedrock1M
minimax-m2amazon-bedrock1M
+ +

๐Ÿ“ Large Context + Tool Calling

+

+ Models with 128K+ context and tool calling for agents that need to process large documents or + maintain long conversation history. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MReasoning
ling-2.6-flashinclusionai262K$0.01
bdc-coderinferencenet131K$0.01
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai131K$0.015
granite-4.0-h-microcloudflare131K$0.017
llama-3.1-8b-instruct--fp-16inferencenet131K$0.02
schematron-3binferencenet131K$0.02
schematron-v3inferencenet131K$0.02
gpt-oss-20binferencenet131K$0.03
schematron-v2-turboinferencenet131K$0.03
qwen--qwen3-4b-fp8novitaai128K$0.03โœ…
liquid-ai--LFM2-24B-A2Btogetherai131K$0.03
amazon-nova-microamazon128K$0.035
amazon-nova-microamazon-bedrock128K$0.035
mistral-nemo-12b-instruct--fp-8inferencenet131K$0.0375
klusterai--Meta-Llama-3.3-70B-Instruct-Turboklusterai131K$0.038
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs. Agentic capability is defined by tool + calling (function calling), reasoning (chain-of-thought), and structured output (JSON mode). + Aggregator providers are excluded from the priced ranking tables to avoid duplicate models; + the free-model table also lists models served through aggregators such as OpenRouter. +

+ +

๐Ÿ”— More Resources

+ + + Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/best-ai-models-for-coding.html b/site/best-ai-models-for-coding.html new file mode 100644 index 00000000..260ed526 --- /dev/null +++ b/site/best-ai-models-for-coding.html @@ -0,0 +1,880 @@ + + + + + + Best AI Models for Coding โ€” Top 20 Code LLMs Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

💻 Best AI Models for Coding (2025)

+

+ Compare the top AI models for code generation, debugging, and software development. Real + pricing, context windows, and capabilities from first-party data. +

+ +
+
189Code Models
+
2,350Tool Calling
+
1,306Reasoning
+
81Free Models
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ ๐Ÿ’ก What makes a good coding model? Tool calling for agentic workflows, large + context for codebases, reasoning for complex logic, and structured output for parsing. We rank + models by these capabilities. +
+ +

๐Ÿ† Top Coding Models โ€” Flagship Tier

+

The most capable models for complex coding tasks. Higher price, highest quality.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool CallReasoning
gpt-4.1openai$2$81Mโœ…
gpt-4oopenai$2.5$10128Kโœ…
gemini-2.5-prodeepinfra$1.25$101Mโœ…
deepseek-r1amazon-bedrock$1.35$5.465K
+ +

๐Ÿ’ฐ Best Value for Coding

+

Great coding performance at lower prices. Perfect for high-volume code generation.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool CallReasoning
gpt-4o-miniopenai$0.15$0.6128Kโœ…
gemini-2.5-flashdeepinfra$0.3$2.51Mโœ…
deepseek-v3deepinfra$0.32$0.89163K
deepseek-r1amazon-bedrock$1.35$5.465K
+ +

๐Ÿ†“ Free Models for Coding

+

Zero-cost models for learning, prototyping, and personal projects.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
openrouter--owl-alphaopenrouter1Mโœ…
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…โœ…
qwen--qwen3-coder--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…โœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…โœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…โœ…
+ +

๐Ÿ”“ Open-Weight Models for Coding

+

Download and run locally for full privacy and zero API costs at scale.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
google--gemma-4-31b-itorcarouter1Mโœ…
qwen--qwen3.5-flash-2026-02-23orcarouter1Mโœ…
qwen--qwen3.5-flashorcarouter1Mโœ…
qwen--qwen3.6-flash-2026-04-16orcarouter1Mโœ…
qwen--qwen3.6-flashorcarouter1Mโœ…
meta-llama-4-maverick-17bamazon-bedrock1Mโœ…
meta-llama-4-scout-17bamazon-bedrock1Mโœ…
minimax-m2-1amazon-bedrock1Mโœ…
minimax-m2-5amazon-bedrock1Mโœ…
minimax-m2amazon-bedrock1Mโœ…
+ +

๐Ÿ“ Large Context for Codebases

+

+ Models with 128K+ context for working with large codebases, multiple files, and long + conversations. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MTool Call
ling-2.6-flashinclusionai262K$0.01โœ…
bdc-coderinferencenet131K$0.01โœ…
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai131K$0.015โœ…
granite-4.0-h-microcloudflare131K$0.017โœ…
llama-3.1-8b-instruct--fp-16inferencenet131K$0.02โœ…
schematron-3binferencenet131K$0.02โœ…
schematron-v3inferencenet131K$0.02โœ…
gpt-oss-20binferencenet131K$0.03โœ…
schematron-v2-turboinferencenet131K$0.03โœ…
qwen--qwen3-4b-fp8novitaai128K$0.03โœ…
liquid-ai--LFM2-24B-A2Btogetherai131K$0.03โœ…
amazon-nova-microamazon128K$0.035โœ…
amazon-nova-microamazon-bedrock128K$0.035โœ…
mistral-nemo-12b-instruct--fp-8inferencenet131K$0.0375โœ…
klusterai--Meta-Llama-3.3-70B-Instruct-Turboklusterai131K$0.038โœ…
+ +

๐Ÿค– Agentic Coding Models

+

+ Models with tool calling + reasoning — the key capabilities for AI coding agents (Cursor, + Copilot, Devin-style). +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120binferencenet$0.05$0.45131K
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K
glm-4.7-flashcloudflare$0.06$0.4131K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K
seed-1.6-flashbytedance$0.07$0.3262K
ring-2.6-1tinclusionai$0.07$0.62262K
zai-org--glm-4.7-flashnovitaai$0.07$0.4200K
microsoft-phi-4-mini-reasoningmicrosoft$0.075$0.3128K
Qwen--Qwen3-32B-TEEchutes$0.08$0.2440K
gpt-oss-120bclarifai$0.09$0.36131K
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs. Models are selected based on capabilities + relevant to coding: tool calling (for agentic workflows), reasoning (for complex logic), large + context (for codebases), and structured output (for parsing). Aggregator providers are + excluded from the priced ranking tables; the free-model table also lists models served + through aggregators such as OpenRouter. +

+ +

๐Ÿ”— More Resources

+ + + Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/best-ai-models-for-image-generation.html b/site/best-ai-models-for-image-generation.html new file mode 100644 index 00000000..7510aa26 --- /dev/null +++ b/site/best-ai-models-for-image-generation.html @@ -0,0 +1,784 @@ + + + + + + + Best AI Image Generation Models โ€” DALLยทE, Imagen, GPT-5 Image Compared (2025) | AI Models + Catalog + + + + + + + + + + + + + + + + + + + +

🎨 Best AI Models for Image Generation (2025)

+

+ Compare the top AI models for image generation — DALL·E, Imagen, GPT-5 Image, Gemini, and + more. Real pricing and capabilities from first-party data. +

+ +
+
28Image Gen Models
+
9Providers
+
4,587Total Models
+
95Providers
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ 💡 Two types of image generation models: Dedicated image models (DALL·E, + Imagen) generate images from text descriptions. Chat models with image output (GPT-5 Image, + Gemini) can both understand and generate images in conversation. Choose based on your use + case. +
+ +

๐Ÿ–ผ๏ธ Dedicated Image Generation Models

+

+ Purpose-built models for text-to-image generation. Best for art, design, and visual content + creation. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderTypeKey Feature
imagen-4.0-generategoogleText โ†’ ImageLatest Imagen, highest quality
imagen-4.0-fast-generategoogleText โ†’ ImageFast generation, lower cost
imagen-3.0-generategoogleText โ†’ ImageStable v3, production-ready
imagen-3.0-fast-generategoogleText โ†’ ImageFast v3 variant
dall-e-3openaiText โ†’ ImageBest prompt adherence, DALLยทE quality
dall-e-2openaiText โ†’ ImageLower cost, good for simple images
step-2x-largestepfunText โ†’ ImageHigh-quality Chinese + English
step-1x-mediumstepfunText โ†’ ImageMid-tier, good balance
step-1x-editstepfunImage EditEdit existing images
step-image-edit-2stepfunImage EditAdvanced editing v2
image-01minimaxText โ†’ ImageMiniMax image generation
image-01-liveminimaxText โ†’ ImageReal-time generation
+ +

๐Ÿ’ฌ Chat Models with Image Output

+

+ Multimodal chat models that can generate images within a conversation. Best for agents and + interactive applications. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool CallReasoning
gpt-5-image-miniopenrouter$2.50$2400Kโœ…
gemini-3.1-flash-imagefastrouter$0.25$1.5065Kโœ…
gemini-2.5-flash-imagefastrouter$0.30$2.5032K
gemini-3.1-flash-imageauriko$0.50$365Kโœ…
gemini-2.5-flash-imageauriko$0.30$0.0432K
amazon-nova-2.0-omniamazon$0.20$1.3064Kโœ…โœ…
gpt-5-imageopenrouter$10$10400Kโœ…
gpt-5.4-image-2openrouter$8$15272Kโœ…
gemini-3-pro-imagefastrouter$2$1265K
gemini-3-pro-imageauriko$2$12131Kโœ…
+ +

๐Ÿ’ฐ Cheapest Image Generation Models

+

Most affordable options for high-volume image generation.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
amazon-nova-2.0-omniamazon$0.20$1.3064K
gemini-3.1-flash-imagefastrouter$0.25$1.5065K
gemini-2.5-flash-imagefastrouter$0.30$2.5032K
gemini-2.5-flash-imageauriko$0.30$0.0432K
gemini-3.1-flash-imageauriko$0.50$365K
gpt-5-image-miniopenrouter$2.50$2400K
+ +

๐Ÿค– Image Models with Tool Calling

+

+ Models that support both image generation and function/tool calling — ideal for AI agents that + create images. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextReasoning
amazon-nova-2.0-omniamazon$0.20$1.3064Kโœ…
gemini-3-pro-imagellmgateway$2$12โ€”
gemini-3.1-flash-imagellmgateway$0.25$1.50โ€”
gemini-2.5-flash-imagellmgateway$0.30$30โ€”
+ +

๐Ÿ“ Image Models with Large Context

+

+ Models with 64K+ context for detailed image descriptions, multi-image generation, and long + conversations. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1M
gpt-5-imageopenrouter400K$10$10
gpt-5-image-miniopenrouter400K$2.50$2
gpt-5.4-image-2openrouter272K$8$15
gemini-3-pro-imageauriko131K$2$12
gemini-3.1-flash-imagefastrouter65K$0.25$1.50
gemini-3-pro-imagefastrouter65K$2$12
gemini-3.1-flash-imageauriko65K$0.50$3
amazon-nova-2.0-omniamazon64K$0.20$1.30
+ +

๐Ÿ”‘ Choosing the Right Model

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseRecommended ModelWhy
Art & creativeimagen-4.0-generateHighest quality, Google's latest
Product imagesdall-e-3Best prompt adherence, consistent style
Chat + imagesgpt-5-image-miniConversational image gen, 400K context
AI agentsamazon-nova-2.0-omniTool calling + reasoning + image output
High volume / cheapgemini-2.5-flash-imageLowest cost per image
Image editingstep-image-edit-2Purpose-built for editing
Chinese contentstep-2x-largeBest Chinese + English generation
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs. Models are identified by having + image in their modalities.output field. Dedicated image models + (DALL·E, Imagen) have no chat context. Chat models with image output support both text and + image generation in conversation. Aggregator providers are excluded from ranking tables. +

+ +

๐Ÿ”— More Resources

+ + + Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/best-ai-models-for-vision.html b/site/best-ai-models-for-vision.html new file mode 100644 index 00000000..5875952e --- /dev/null +++ b/site/best-ai-models-for-vision.html @@ -0,0 +1,772 @@ + + + + + + + Best Vision AI Models โ€” GPT-4o, Claude, Gemini Vision Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + + +

๐Ÿ‘๏ธ Best Vision AI Models (2025)

+

+ Compare the top vision AI models — GPT-4o, Claude 4, Gemini, and 1,487 models with image + understanding. Real pricing and capabilities from first-party data. +

+ +
+
1,487Vision Models
+
1,179Vision + Tool Call
+
1,026Vision + Reasoning
+
1,267Vision + 128K+ Context
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +

๐Ÿ† Flagship Vision Models โ€” Head to Head

+

+ The top-tier multimodal models from each major provider, compared on pricing, context, and + capabilities. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool CallReasoning
gpt-4oopenai$2.50$10128Kโœ…
gpt-4o-miniopenai$0.15$0.60128Kโœ…
o3openai$2$8200Kโœ…โœ…
o4-miniopenai$1.10$4.40200Kโœ…โœ…
claude-sonnet-4-20250514anthropic$3$15200Kโœ…โœ…
claude-opus-4-20250514anthropic$15$75200Kโœ…โœ…
gemini-2.5-progoogle$1.25$101Mโœ…โœ…
gemini-2.5-flashgoogle$0.15$0.601Mโœ…โœ…
deepseek-r1deepseek$0.55$2.19128Kโœ…
grok-3xai$3$15131Kโœ…โœ…
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…โœ…
llama4-maverickmeta$0.20$0.801Mโœ…
+ +

๐Ÿ’ฐ Cheapest Vision Models

+

Most affordable models with image understanding — ideal for high-volume applications.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool Call
gemini-2.0-flash-litegoogle$0.075$0.301Mโœ…
gemini-2.5-flashgoogle$0.15$0.601Mโœ…
gpt-4o-miniopenai$0.15$0.60128Kโœ…
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…
llama4-maverickmeta$0.20$0.801Mโœ…
deepseek-chatdeepseek$0.14$0.28128K
+ +

๐Ÿ†“ Free Vision Models

+

+ Vision models available at zero cost — perfect for prototyping, learning, and small projects. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
gemini-2.0-flashgoogle1Mโœ…
gemini-2.5-flashgoogle1Mโœ…โœ…
gemma3-4bgoogle128K
llama4-scout-17b-16emeta10M
qwen3-30b-a3balibaba128Kโœ…
+ +

๐Ÿค– Vision + Tool Calling Models

+

+ 1,179 models that support both image understanding and function/tool calling — essential for + AI agents that process images. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextReasoning
gemini-2.0-flash-litegoogle$0.075$0.301M
gemini-2.5-flashgoogle$0.15$0.601Mโœ…
gpt-4o-miniopenai$0.15$0.60128K
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…
claude-sonnet-4-20250514anthropic$3$15200Kโœ…
grok-3-minixai$0.30$0.50131Kโœ…
+ +

๐Ÿ“ Vision Models with Largest Context

+

+ 1,267 models with 128K+ context for processing large documents, multiple images, and long + conversations. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool Call
llama4-scout-17b-16emeta10Mโ€”โ€”
gemini-2.5-progoogle1M$1.25$10โœ…
gemini-2.5-flashgoogle1M$0.15$0.60โœ…
llama4-maverickmeta1M$0.20$0.80โœ…
claude-sonnet-4-20250514anthropic200K$3$15โœ…
o3openai200K$2$8โœ…
+ +

๐Ÿ”‘ Choosing the Right Vision Model

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseRecommended ModelWhy
Document OCRgemini-2.5-pro1M context, best document understanding
Image chatbotgpt-4o-miniCheapest with tool calling, good quality
AI agentsclaude-sonnet-4-20250514Best tool calling + reasoning + vision
High volume / cheapgemini-2.0-flash-liteLowest cost at $0.075/M input
Medical imagingo3Reasoning + vision for complex analysis
Video analysisgemini-2.5-flash1M context + video input + cheap
Prototypinggemini-2.5-flashFree tier, 1M context, all capabilities
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs. Models are identified by having + image in their modalities.input field. Aggregator providers are + excluded from ranking tables to avoid duplicate models. Pricing is per million tokens. +

+ +

๐Ÿ”— More Resources

+ + + Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/best-ai-models.html b/site/best-ai-models.html new file mode 100644 index 00000000..0ae3a243 --- /dev/null +++ b/site/best-ai-models.html @@ -0,0 +1,1126 @@ + + + + + + Best AI Models in 2025 โ€” Complete Comparison Guide | AI Models Catalog + + + + + + + + + + + + + + + + + + +

Best AI Models in 2025

+

+ A comprehensive comparison of 4,587 AI models across 95 providers. Find the best + model for your use case — whether you need the cheapest, the most capable, or the best for a + specific task. +

+ +
+
4,587Models
+
95Providers
+
81Free
+
2,350Tool Calling
+
1,306Reasoning
+
1,487Vision
+
527Open Weights
+
+ + ๐Ÿ” Try the Interactive Catalog + โญ Star on GitHub + + + +

๐Ÿ’ฐ Cheapest AI Models

+

The most affordable models per million tokens, excluding aggregator providers.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextCapabilities
openai--gpt-image-1-miniaimlapi$0.007$0.676?
mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
qwen3.5-0.8bdeepinfra$0.01$0.05262K + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
ling-2.6-flashinclusionai$0.01$0.03262K๐Ÿ”ง Tool
bdc-coderinferencenet$0.01$0.01131K๐Ÿ”ง Tool
openai--gpt-image-1-modelaimlapi$0.012$0.175?
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K๐Ÿ”ง Tool
granite-4.0-h-microcloudflare$0.017$0.112131K๐Ÿ”ง Tool
meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
mistral-nemo-instruct-2407deepinfra$0.02$0.04131K
qwen3.5-2bdeepinfra$0.02$0.1262K + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K๐Ÿ”ง Tool
schematron-3binferencenet$0.02$0.05131K๐Ÿ”ง Tool
schematron-v3inferencenet$0.02$0.05131K๐Ÿ”ง Tool
+ +

๐Ÿ†“ Free AI Models

+

81 models available at zero cost. Perfect for testing, prototyping, and learning.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextCapabilities
openrouter--owl-alphaopenrouter1M๐Ÿ”ง Tool
deepseek--deepseek-v4-flash--freeopenrouter1M + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
google--lyria-3-clip-previewopenrouter1M๐Ÿ‘๏ธ Vision
google--lyria-3-pro-previewopenrouter1M๐Ÿ‘๏ธ Vision
qwen--qwen3-coder--freeopenrouter1M๐Ÿ”ง Tool
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1M + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
gemma-4-26b-a4b-itauriko262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
gemma-4-31b-itauriko262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
arcee-ai--trinity-large-thinking--freeopenrouter262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
google--gemma-4-26b-a4b-it--freeopenrouter262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
google--gemma-4-31b-it--freeopenrouter262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
codestralmistral256K
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256K + ๐Ÿ”ง Tool + ๐Ÿง  Reason + ๐Ÿ‘๏ธ Vision +
hunyuan-litetencent250K
minimax--minimax-m2.5--freeopenrouter204K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
+ +

๐Ÿ’ป Best AI Models for Coding

+

0 models optimized for code generation, completion, and understanding.

+ + + + + + + + + +
ModelProviderInput $/MOutput $/MContextCapabilities
+ +

๐Ÿค– Best AI Models for Agents

+

+ 1,080 models with both tool calling and reasoning — the key capabilities for building AI + agents. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextCapabilities
openai--gpt-oss-20bneuralwatt$0.03$0.16? + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
gpt-oss-120binferencenet$0.05$0.45131K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1? + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
openai--gpt-oss-120bnovitaai$0.05$0.25131K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
glm-4.7-flashcloudflare$0.06$0.4131K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
Nemotron-3-Nano-Omninebius$0.06$0.24128K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
seed-1.6-flashbytedance$0.07$0.3262K + ๐Ÿ”ง Tool + ๐Ÿง  Reason +
+ +

๐Ÿง  Best AI Models for Reasoning

+

1,306 models with advanced reasoning capabilities.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
gpt-oss-20bdeepinfra$0.03$0.14131K
qwen3.5-4bdeepinfra$0.03$0.15262K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120bdeepinfra$0.039$0.19131K
nvidia-nemotron-nano-9b-v2deepinfra$0.04$0.16131K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
nemotron-3-nano-30b-a3bdeepinfra$0.05$0.2262K
+ +

๐Ÿ‘๏ธ Best AI Models for Vision

+

1,487 models that can understand images and visual content.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
paddlepaddle--paddleocr-vlnovitaai$0.02$0.0216K
qwen3.5-4bdeepinfra$0.03$0.15262K
deepseek--deepseek-ocr-2novitaai$0.03$0.038K
deepseek--deepseek-ocrnovitaai$0.03$0.038K
reka-edge-2reka$0.03$0.1131K
zai-org--autoglm-phone-9b-multilingualnovitaai$0.035$0.13865K
gemini-1.5-flash-8bdeepinfra$0.0375$0.151M
google-gemma-3-4bamazon-bedrock$0.04$0.08131K
+ +

๐Ÿ“ Largest Context Windows

+

Models with the largest context windows for processing long documents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/MOutput $/M
meta-llama-4-scoutmeta10M$0.17$0.66
gemini-1.5-progoogle2M$1.25$5
xai--grok-4-fast-non-reasoningaimlapi2M$0.52$1.3
xai--grok-4-fast-reasoningaimlapi2M$0.52$1.3
meta-llama-4-maverick-17bamazon-bedrock1M$0.24$0.97
meta-llama-4-scout-17bamazon-bedrock1M$0.17$0.66
minimax-m2-1amazon-bedrock1M$0.3$1.2
minimax-m2-5amazon-bedrock1M$0.3$1.2
minimax-m2amazon-bedrock1M$0.3$1.2
deepseek-v4-flashbaidu1M$0.126$0.252
+ +

๐Ÿ”“ Open Weights Models

+

527 models with downloadable weights you can run locally.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextCapabilities
google--gemma-4-31b-itorcarouter1M๐Ÿ”ง Tool
qwen--qwen3.5-flash-2026-02-23orcarouter1M๐Ÿ”ง Tool
qwen--qwen3.5-flashorcarouter1M๐Ÿ”ง Tool
qwen--qwen3.6-flash-2026-04-16orcarouter1M๐Ÿ”ง Tool
qwen--qwen3.6-flashorcarouter1M๐Ÿ”ง Tool
MiniMax-Text-01302ai1M
llama-4-maverick302ai1M
llama-4-scout302ai1M
meta-llama-4-maverick-17bamazon-bedrock1M๐Ÿ”ง Tool
meta-llama-4-scout-17bamazon-bedrock1M๐Ÿ”ง Tool
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs — not third-party aggregators. Pricing, + context windows, and capabilities are verified against official provider documentation. + Aggregator providers (OpenRouter, Requesty, etc.) are excluded from ranking tables to avoid + duplicate models. +

+

Data is auto-scraped and validated with Zod schemas. Last updated: 2025-05-21.

+ +

๐Ÿ”— More Resources

+ + +

Small Language Models

+

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/chatgpt-vs-claude-vs-gemini.html b/site/chatgpt-vs-claude-vs-gemini.html new file mode 100644 index 00000000..03960473 --- /dev/null +++ b/site/chatgpt-vs-claude-vs-gemini.html @@ -0,0 +1,631 @@ + + + + + + ChatGPT vs Claude vs Gemini โ€” 2025 Comparison | AI Models Catalog + + + + + + + + + + + + + + +
+

โšก ChatGPT vs Claude vs Gemini

+

+ The definitive 2025 comparison: pricing, context windows, capabilities, benchmarks, and API + features. GPT-4.1 vs Claude Sonnet 4 vs Gemini 2.5 Pro. +

+
+
+

1. Flagship Models at a Glance

+
+
+

OpenAI GPT-4.1

+
$2 / $8
+
Input / Output per M tokens
+
1,047,576 context
+
+
+

Anthropic Claude Sonnet 4

+
$3 / $15
+
Input / Output per M tokens
+
200,000 context
+
+
+

Google Gemini 2.5 Pro

+
$1.25 / $10
+
Input / Output per M tokens
+
1,048,576 context
+
+
+ +

2. Pricing Comparison

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
FeatureGPT-4.1Claude Sonnet 4Gemini 2.5 Pro
Input price ($/M tokens)$2.00$3.00$1.25
Output price ($/M tokens)$8.00$15.00$10.00
Cache input ($/M tokens)$0.50$0.30$0.07
Context window1,047,576200,0001,048,576
Max output tokens32,76864,00065,536
Free tierNoYes (limited)Yes (generous)
+
+ Winner on price: Gemini 2.5 Pro offers the best input pricing ($1.25/M) and + cache pricing ($0.07/M). GPT-4.1 wins on output pricing ($8/M vs $10-15/M). +
+ +

3. Capabilities

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
CapabilityGPT-4.1Claude Sonnet 4Gemini 2.5 Pro
Tool callingโœ…โœ…โœ…
Structured outputโœ…โœ…โœ…
Reasoning (extended thinking)โŒ (use o3)โœ…โœ…
Vision (image input)โœ…โœ…โœ…
Image generationโœ… (DALL-E)โŒโœ… (Imagen)
Audio inputโœ…โŒโœ…
Audio outputโœ…โŒโœ…
Video inputโŒโŒโœ…
PDF inputโœ…โœ…โœ…
Code executionโœ…โœ… (analysis tool)โœ…
+
+ Winner on capabilities: Gemini 2.5 Pro has the broadest multimodal support + (video, audio I/O, image generation). Claude Sonnet 4 excels at coding and analysis. GPT-4.1 + has the strongest tool calling (BFCL #1). +
+ +

4. Benchmark Performance

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
BenchmarkGPT-4.1Claude Sonnet 4Gemini 2.5 Pro
MMLU~90%~88%~90%
MATH-500~85%~88%~91%
HumanEval~91%~93%~90%
SWE-bench Verified~65%~72%~63%
GPQA Diamond~72%~70%~78%
BFCL v3 (tool calling)~88%~86%~85%
Chatbot Arena~1380~1370~1360
+
+ Key takeaway: No single model wins all benchmarks. GPT-4.1 leads on tool + calling and chat. Claude Sonnet 4 dominates coding (SWE-bench). Gemini 2.5 Pro excels at + math and science. +
+ +

5. API & Developer Experience

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
FeatureOpenAIAnthropicGoogle
API maturityMost matureMatureMaturing
SDK languagesPython, Node, Go, etc.Python, NodePython, Node, Go, etc.
Streamingโœ… SSEโœ… SSEโœ… SSE
Function callingParallel, strict modeParallel, forced toolParallel, auto
Batch APIโœ… (50% discount)โœ… (50% discount)โœ… (50% discount)
Fine-tuningโœ…โŒโœ… (limited)
Rate limitsTier-basedTier-basedPer-project
+ +

6. Budget Alternatives

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseBest Budget OptionPriceWhy
General chatGemini 2.5 FlashFreeStrong quality at zero cost
CodingDeepSeek V3$0.07/$0.27Near-frontier coding at 1/30th the price
ReasoningDeepSeek R1FreeTop-tier reasoning at zero cost
Tool callingGemini 2.5 FlashFreeStrong BFCL scores for free
Long contextGemini 2.5 FlashFree1M context window for free
Open sourceQwen3-235BFreeBest open-weight model
+ +

7. The Verdict

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
If you need...ChooseBecause
Best overall valueGemini 2.5 ProLowest input price, 1M context, broadest capabilities
Best coding assistantClaude Sonnet 4#1 on SWE-bench, 64K output, analysis tool
Best tool callingGPT-4.1#1 on BFCL, parallel calls, strict mode
Best free optionGemini 2.5 FlashFree with 1M context, strong capabilities
Best reasoningo3 / DeepSeek R1Reasoning models outperform standard models on math/science
Most mature APIOpenAIWidest SDK support, fine-tuning, most integrations
+ + +
+ Small Language Models +

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+
+

+ Data from AI Models Catalog — 4,587 + models across 95 providers. Updated continuously. +

+
+ + diff --git a/site/cheapest-ai-models.html b/site/cheapest-ai-models.html new file mode 100644 index 00000000..6da9a037 --- /dev/null +++ b/site/cheapest-ai-models.html @@ -0,0 +1,1555 @@ + + + + + + Cheapest AI Models โ€” Lowest Price LLMs Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

💰 Cheapest AI Models — Lowest Price LLMs (2025)

+

+ Find the most affordable AI models across 95 providers. All prices per million tokens, + from first-party data. Aggregator providers excluded to avoid duplicates. +

+ +
+
81Free Models
+
95Providers
+
4,587Total Models
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ 💡 Price tips: Input price is what you pay for prompts; output price is for + completions (usually 2-5x higher). For high-volume use, output price matters most. For + RAG/search, input price dominates. All prices shown per million tokens. +
+ +

๐Ÿ† Cheapest Overall

+

The absolute lowest-priced models across all providers.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
#ModelProviderInput $/1MOutput $/1MContextTool Call
1openai--gpt-image-1-miniaimlapi$0.007$0.676?
2mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
3qwen3.5-0.8bdeepinfra$0.01$0.05262K
4ling-2.6-flashinclusionai$0.01$0.03262Kโœ…
5bdc-coderinferencenet$0.01$0.01131Kโœ…
6openai--gpt-image-1-modelaimlapi$0.012$0.175?
7klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131Kโœ…
8granite-4.0-h-microcloudflare$0.017$0.112131Kโœ…
9meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
10meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
11mistral-nemo-instruct-2407deepinfra$0.02$0.04131K
12qwen3.5-2bdeepinfra$0.02$0.1262K
13llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131Kโœ…
14schematron-3binferencenet$0.02$0.05131Kโœ…
15schematron-v3inferencenet$0.02$0.05131Kโœ…
16Gemma-2-2b-itnebius$0.02$0.068K
17Meta-Llama-3.1-8B-Instructnebius$0.02$0.06131K
18meta-llama--llama-3.1-8b-instructnovitaai$0.02$0.0516K
19paddlepaddle--paddleocr-vlnovitaai$0.02$0.0216K
20text-embedding-3-smallopenai$0.02$08K
+ +

๐Ÿ”ง Cheapest with Tool Calling

+

+ Most affordable models that support function/tool calling — essential for agents and + automation. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
gpt-oss-20binferencenet$0.03$0.15131K
schematron-v2-turboinferencenet$0.03$0.15131K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
liquid-ai--LFM2-24B-A2Btogetherai$0.03$0.12131K
amazon-nova-microamazon$0.035$0.14128K
amazon-nova-microamazon-bedrock$0.035$0.14128K
mistral-nemo-12b-instruct--fp-8inferencenet$0.0375$0.1131K
+ +

๐Ÿง  Cheapest with Reasoning

+

Most affordable reasoning models — chain-of-thought for complex problems on a budget.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
gpt-oss-20bdeepinfra$0.03$0.14131K
qwen3.5-4bdeepinfra$0.03$0.15262K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120bdeepinfra$0.039$0.19131K
nvidia-nemotron-nano-9b-v2deepinfra$0.04$0.16131K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
nemotron-3-nano-30b-a3bdeepinfra$0.05$0.2262K
gpt-oss-120binferencenet$0.05$0.45131K
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K
glm-4.7-flashcloudflare$0.06$0.4131K
+ +

๐Ÿ‘๏ธ Cheapest with Vision

+

+ Most affordable models that can process images — for OCR, visual Q&A, and multimodal tasks. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
paddlepaddle--paddleocr-vlnovitaai$0.02$0.0216K
qwen3.5-4bdeepinfra$0.03$0.15262K
deepseek--deepseek-ocr-2novitaai$0.03$0.038K
deepseek--deepseek-ocrnovitaai$0.03$0.038K
reka-edge-2reka$0.03$0.1131K
zai-org--autoglm-phone-9b-multilingualnovitaai$0.035$0.13865K
gemini-1.5-flash-8bdeepinfra$0.0375$0.151M
google-gemma-3-4bamazon-bedrock$0.04$0.08131K
gemma-3-12b-itdeepinfra$0.04$0.13131K
gemma-3-4b-itdeepinfra$0.04$0.08131K
qwen3.5-9bdeepinfra$0.04$0.15262K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
llama-3.2-11b-vision-instructcloudflare$0.049$0.676131K
+ +

๐Ÿ“ Cheapest with 128K+ Context

+

+ Most affordable models with large context windows — for long documents, codebases, and + conversations. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
qwen3.5-0.8bdeepinfra$0.01$0.05262K
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
mistral-nemo-instruct-2407deepinfra$0.02$0.04131K
qwen3.5-2bdeepinfra$0.02$0.1262K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
Meta-Llama-3.1-8B-Instructnebius$0.02$0.06131K
llama-3.2-1b-instructcloudflare$0.027$0.201131K
+ +

๐Ÿข Cheapest Model per Provider

+

+ The most affordable model from each provider — find the best deal from your preferred + provider. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ProviderCheapest ModelInput $/1MOutput $/1MContext
01aiyi-lightning$1$116K
ai21jamba-mini-2-2026-01$0.2$0.4256K
aimlapiopenai--gpt-image-1-mini$0.007$0.676?
aionaion-1.0-mini$0.7$1.4131K
alibabaqwen-flash$0.15$1.5?
amazonamazon-nova-micro$0.035$0.14128K
amazon-bedrockamazon-nova-micro$0.035$0.14128K
anthropicclaude-haiku-4-5$1$5200K
arceetrinity-mini$0.04$0.15131K
baichuanbaichuan4-air$0.98$0.9832K
baidudeepseek-v4-flash$0.126$0.2521M
basetengpt-oss-120b$0.1$0.5131K
bergetmeta-llama--Llama-3.1-8B-Instruct$0.2$0.2?
bytedanceseed-1.6-flash$0.07$0.3262K
cerebrasllama3.1-8b$0.1$0.1131K
chutesQwen--Qwen3-32B-TEE$0.08$0.2440K
clarifaigpt-oss-120b$0.09$0.36131K
cloudferro-sherlockminimax-m2.5$0.26$1.041M
cloudflaregranite-4.0-h-micro$0.017$0.112131K
databricksdatabricks-gpt-5-nano$0.05$0.4200K
deepinfraqwen3.5-0.8b$0.01$0.05262K
deepseekdeepseek-chat$0.14$0.281M
digitaloceanopenai-gpt-oss-20b$0.05$0.45131K
dinferencegpt-oss-20b$0.07$0.25131K
evrocQwen--Qwen3-30B-A3B-Instruct$0.1$0.840K
fireworksgpt-oss-20b$0.07$0.3131K
friendlimeta-llama-3.1-8b-instruct$0.1$0.1131K
gmicloudopenai--gpt-oss-120b$0.07$0.28131K
googlegemini-1.5-flash-8b$0.075$0.31M
google-vertexgpt-oss-20b$0.07$0.25131K
groqllama-3.1-8b-instant$0.05$0.08131K
hpc-aideepseek--deepseek-v4-flash$0.14$0.281M
hyperbolicmeta-llama--Llama-3.1-8B-BF16-Base$0.1$0.1131K
iflytekspark-ultra$0.8$0.8131K
inceptionmercury-2$0.25$0.75128K
inclusionailing-2.6-flash$0.01$0.03262K
inferencenetbdc-coder$0.01$0.01131K
klusteraimistralai--Mistral-Nemo-Instruct-2407$0.008$0.001131K
metameta-llama-3.2-1b$0.1$0.1128K
microsoftmicrosoft-phi-4-mini-reasoning$0.075$0.3128K
minimaxM2-her$2.1$8.464K
mistralministral-3b$0.04$0.04128K
mixlayerqwen--qwen3.5-9b$0.1$0.4131K
moonshotaimoonshot-v1-8k-vision-preview$2$108K
morphmorph-compact$0.2$0.51M
nebiusGemma-2-2b-it$0.02$0.068K
neuralwattopenai--gpt-oss-20b$0.03$0.16?
nousresearchhermes-3-llama-3.1-8b$0.06$0.12131K
novitaaimeta-llama--llama-3.1-8b-instruct$0.02$0.0516K
openaitext-embedding-3-small$0.02$08K
ovhcloudgpt-oss-20b$0.05$0.18131K
perplexitysonar$1$1127K
ppioqwen--qwen3-4b-fp8$0.2145$0.2145128K
privatemodegpt-oss-120b$0.43$1.7131K
rekareka-edge-2$0.03$0.1131K
sambanovagpt-oss-120b$0.22$0.59131K
scalewaygpt-oss-120b$0.15$0.6131K
siliconflowgpt-oss-20b$0.04$0.18131K
siliconflow-cnling-mini-2.0$0.5$2131K
stepfunstep-3.5-flash-2603$0.7$2.1256K
submodelopenai--gpt-oss-120b$0.1$0.5131K
tencenthunyuan-a13b$0.5$2224K
tencent-tokenhubdeepseek-v4-flash$1$21M
textsynthEleutherAI--gpt-j-6B$0.2$22K
togetherailiquid-ai--LFM2-24B-A2B$0.03$0.12131K
upstagesolar-embedding-1-large$0.1$0?
voyagererank-2.5-lite$0.02$0?
vultrcosmos-reason-2-2b$0.55$2.75131K
waferQwen3.5-397B-A17B$0.6$3.6262K
writerpalmyra-x5$0.6$61M
xaixai-grok-4-fast$0.2$0.5131K
xiaomimimo-v2-flash$0.1$0.3262K
zhipuaiglm-4-flashx-250414$0.1$0.1128K
+ +

๐Ÿ“Š Methodology

+

+ All data is sourced from first-party APIs — not third-party aggregators. Prices are per + million tokens as listed by each provider. Aggregator providers (OpenRouter, Requesty, etc.) + are excluded from ranking tables to avoid duplicate models. Actual costs may vary based on + usage patterns, caching, and batch discounts. +

+ +

๐Ÿ”— More Resources

+ + +

Small Language Models

+

๐ŸŽฏ AI Model Picker

+

โšก GitHub Action

+ + + diff --git a/site/context-window-comparison.html b/site/context-window-comparison.html new file mode 100644 index 00000000..6f7a935f --- /dev/null +++ b/site/context-window-comparison.html @@ -0,0 +1,1661 @@ + + + + + + + AI Model Context Window Comparison โ€” Largest Context LLMs (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + + +

๐Ÿ“ AI Model Context Window Comparison

+

+ Compare context windows across 4,587 AI models. Find the largest context LLMs for your + use case — from 1M+ token monsters to compact 8K models. +

+ +
+
4,587Models
+
2,195128K+ Context
+
95Providers
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +

๐Ÿ† Top 20 Largest Context Windows

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
#ModelProviderContextInput $/1MTool Call
1meta-llama-4-scoutmeta10M$0.17โœ…
2gemini-1.5-progoogle2M$1.25โœ…
3xai--grok-4-fast-non-reasoningaimlapi2M$0.52โœ…
4xai--grok-4-fast-reasoningaimlapi2M$0.52โœ…
5meta-llama-4-maverick-17bamazon-bedrock1M$0.24โœ…
6meta-llama-4-scout-17bamazon-bedrock1M$0.17โœ…
7minimax-m2-1amazon-bedrock1M$0.3โœ…
8minimax-m2-5amazon-bedrock1M$0.3โœ…
9minimax-m2amazon-bedrock1M$0.3โœ…
10deepseek-v4-flashbaidu1M$0.126โœ…
11minimax-m2-5baseten1M$0.3โœ…
12gpt-5-1clarifai1M$1.5625โœ…
13deepseek-v4-flashdeepinfra1M$0.14
14llama-4-maverick-17b-128e-instruct-fp8deepinfra1M$0.15
15mimo-v2.5-prodeepinfra1M$1
16llama-4-maverickdigitalocean1M$0.25โœ…
17deepseek-v4-profireworks1M$1.74โœ…
18meta-llama--Llama-4-Maverick-17B-128E-Instruct-FP8gmicloud1M$0.25โœ…
19gemini-1.5-flash-8bgoogle1M$0.075โœ…
20gemini-1.5-flashgoogle1M$0.075โœ…
+ +

📊 1M+ Tokens (93 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
meta-llama-4-scoutmeta10M$0.17$0.66โœ…
gemini-1.5-progoogle2M$1.25$5โœ…
xai--grok-4-fast-non-reasoningaimlapi2M$0.52$1.3โœ…
xai--grok-4-fast-reasoningaimlapi2M$0.52$1.3โœ…
meta-llama-4-maverick-17bamazon-bedrock1M$0.24$0.97โœ…
meta-llama-4-scout-17bamazon-bedrock1M$0.17$0.66โœ…
minimax-m2-1amazon-bedrock1M$0.3$1.2โœ…
minimax-m2-5amazon-bedrock1M$0.3$1.2โœ…
minimax-m2amazon-bedrock1M$0.3$1.2โœ…
deepseek-v4-flashbaidu1M$0.126$0.252โœ…โœ…
minimax-m2-5baseten1M$0.3$1.2โœ…
gpt-5-1clarifai1M$1.5625$12.5โœ…
deepseek-v4-flashdeepinfra1M$0.14$0.28โœ…
llama-4-maverick-17b-128e-instruct-fp8deepinfra1M$0.15$0.6
mimo-v2.5-prodeepinfra1M$1$3โœ…
... and 78 more models
+ +

📊 512K–1M Tokens (1 model)

+ + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
deepseek-v4-probaidu716K$1.521$3.042✅✅
+ +

📊 256K–512K Tokens (187 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
openai--gpt-5-chataimlapi400K$1.625$13
openai--gpt-5-miniaimlapi400K$0.325$2.6โœ…
openai--gpt-5-nanoaimlapi400K$0.065$0.52โœ…
openai--gpt-5.1-chat-latestaimlapi400K$1.625$13โœ…
openai--gpt-5.1aimlapi400K$1.625$13โœ…
openai--gpt-5.2aimlapi400K$2.275$18.2โœ…
openai--gpt-5aimlapi400K$1.625$13โœ…
llama-4-scout-17b-16e-instructcloudflare327K$0.27$0.85โœ…
llama-4-scout-17b-16e-instructdeepinfra327K$0.08$0.3
meta-llama--Llama-4-Scout-17B-16E-Instructgmicloud327K$0.08$0.5โœ…
llama-4-scout-17b-16e-instructvultr327K$0.55$2.75โœ…
llama-4-scout-17b-16evultr327K$0.55$2.75
amazon-nova-liteamazon300K$0.06$0.24โœ…
amazon-nova-proamazon300K$0.8$3.2โœ…
amazon-nova-liteamazon-bedrock300K$0.06$0.24โœ…
... and 172 more models
+ +

📊 128K–256K Tokens (685 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
hunyuan-litetencent250KFree
hunyuan-a13btencent224K$0.5$2โœ…
minimax-m2.5dinference204K$0.22$0.88
minimax--minimax-m2.5hpc-ai204K$0.3$1.2โœ…โœ…
MiniMax-M2.1-highspeedminimax204K$4.2$16.8
MiniMax-M2.1minimax204K$2.1$8.4
MiniMax-M2.5-highspeedminimax204K$4.2$16.8
MiniMax-M2.5minimax204K$2.1$8.4
MiniMax-M2.7-highspeedminimax204K$4.2$16.8
MiniMax-M2.7minimax204K$2.1$8.4
MiniMax-M2minimax204K$2.1$8.4
minimax--minimax-m2.1novitaai204K$0.3$1.2โœ…
minimax--minimax-m2.5-highspeednovitaai204K$0.6$2.4โœ…โœ…
minimax--minimax-m2.5novitaai204K$0.3$1.2โœ…โœ…
minimax--minimax-m2.7novitaai204K$0.3$1.2โœ…โœ…
... and 670 more models
+ +

📊 64K–128K Tokens (56 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
sonarperplexity127K$1$1โœ…
baidu--ernie-4.5-300b-a47b-paddlenovitaai123K$0.28$1.1
baidu--ernie-4.5-vl-424b-a47bnovitaai123K$0.42$1.25โœ…
baidu--ernie-4.5-300b-a47b-paddleppio123K$2$7
baidu--ernie-4.5-vl-424b-a47bppio123K$3$9
baidu--ernie-4.5-0.3baimlapi120KFreeโœ…
baidu--ernie-4.5-21B-a3bnovitaai120K$0.07$0.28โœ…
baidu--ernie-4.5-0.3bppio120KFree
baidu--ernie-4.5-21B-a3bppio120K$0.5$2
qwen3.6-27bvultr120K$0.55$2.75
step-r1-v-ministepfun100K$2.5$8
google--gemma-3-27b-itnovitaai98K$0.119$0.2
Gemma-3-27b-itnebius96K$0.1$0.3โœ…โœ…
gemma-3-27bprivatemode96K$0.77$1.27
gemma-4-31bprivatemode96K$0.77$1.27
... and 41 more models
+ +

📊 32K–64K Tokens (74 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
mistralai--mistral-nemonovitaai60K$0.04$0.17
Qwen--Qwen3-32B-TEEchutes40K$0.08$0.24โœ…โœ…
qwen3-30b-a3b-fp8cloudflare40K$0.051$0.335โœ…โœ…
qwen3-14bdeepinfra40K$0.12$0.24โœ…
qwen3-30b-a3bdeepinfra40K$0.09$0.45โœ…
qwen3-32bdeepinfra40K$0.08$0.28โœ…
Qwen--Qwen3-30B-A3B-Instructevroc40K$0.1$0.8
Qwen--Qwen3-VL-30B-A3B-Instructevroc40K$0.2$0.8
Qwen--Qwen3-30B-A3Bgmicloud40K$0.08$0.25
Qwen--Qwen3-32B-FP8gmicloud40K$0.1$0.6
Qwen--Qwen3-235B-A22B-FP8klusterai40K$0.13$2โœ…โœ…
mistralai--Magistral-Small-2506klusterai40K$0.1$0.3
qwen--qwen3-235b-a22b-fp8novitaai40K$0.2$0.8โœ…
qwen--qwen3-30b-a3b-fp8novitaai40K$0.09$0.45โœ…โœ…
qwen--qwen3-32b-fp8novitaai40K$0.1$0.45โœ…
... and 59 more models
+ +

📊 8K–32K Tokens (79 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
baidu--ernie-4.5-vl-28b-a3bnovitaai30K$0.14$0.56โœ…โœ…
baidu--ernie-4.5-vl-28b-a3bppio30K$1$4
gpt-oss-120bvultr30K$0.55$2.75
gpt-oss-20bvultr30K$0.55$2.75
hunyuan-large-role-latesttencent28K$2.4$9.6
hunyuan-t1-visiontencent28K$3$9โœ…
hunyuan-roletencent-tokenhub28K$2.4$9.6
hunyuan-turbos-vision-videotencent24K$3$9
hunyuan-turbos-visiontencent24K$3$9
hunyuan-vision-1.5-instructtencent24K$3$9
autoglm-phonezhipuai20KFreeโœ…
gpt-3.5-turbo-16kopenai16K$3$4โœ…
gpt-3.5-turboopenai16K$0.5$1.5โœ…
yi-lightning01ai16K$1$1โœ…
yi-medium01ai16K$2.5$2.5โœ…
... and 64 more models
+ +

📊 Under 8K Tokens (13 models)

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MOutput $/1MTool CallReasoning
nvidia-nemotron-3-super-120bamazon-bedrock4K$0.15$0.65
nvidia-nemotron-nano-2-vlamazon-bedrock4K$0.2$0.6
nvidia-nemotron-nano-2amazon-bedrock4K$0.06$0.23
nvidia-nemotron-nano-3-30bamazon-bedrock4K$0.06$0.24
llama-2-7b-chat-fp16cloudflare4K$0.556$6.667
mythomax-l2-13bdeepinfra4K$0.4$0.4
nvidia-nemotron-3-super-120bdigitalocean4K$0.3$0.65
nemotron3-superinferencenet4K$2.5$5
gryphe--mythomax-l2-13bnovitaai4K$0.09$0.09
nemotron-3-super-120b-a12b-bf16vultr4K$0.55$2.75
hunyuan-translation-litetencent4K$1$3
hunyuan-translationtencent4K$1.2$3.6
EleutherAI--gpt-j-6Btextsynth2K$0.2$2
+ +

💰 Cheapest Models by Context Tier

+

Find the most affordable model in each context window tier.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Context TierCheapest ModelProviderContextInput $/1M
1M+ Tokensgemini-1.5-flash-8bdeepinfra1M$0.0375
512K–1M Tokensdeepseek-v4-probaidu716K$1.521
256K–512K Tokensqwen3.5-0.8bdeepinfra262K$0.01
128K–256K Tokensmistralai--Mistral-Nemo-Instruct-2407klusterai131K$0.008
64K–128K Tokenszai-org--autoglm-phone-9b-multilingualnovitaai65K$0.035
32K–64K Tokensmeta-llama--llama-3.2-3b-instructnovitaai32K$0.03
8K–32K TokensGemma-2-2b-itnebius8K$0.02
+ +

📊 Methodology

+

+ All data is sourced from first-party APIs — not third-party aggregators. Context + windows are as reported by each provider. Aggregator providers are excluded from ranking + tables to avoid duplicate models. +

+ +

🔗 More Resources

+ + + Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/devto-article.md b/site/devto-article.md new file mode 100644 index 00000000..200c9f74 --- /dev/null +++ b/site/devto-article.md @@ -0,0 +1,184 @@ +# I Built the Most Comprehensive AI Model Catalog on GitHub (4,587 Models, 95 Providers) + +_Choosing the right AI model shouldn't require visiting 95 different websites._ + +## The Problem + +Every week, a new AI model launches. Every month, a new provider enters the market. Keeping track of pricing, context windows, capabilities, and which models support tool calling or structured output is a full-time job. + +I got tired of: + +- Checking OpenAI's pricing page, then Anthropic's, then Google's... +- Wondering "which models support tool calling again?" +- Not knowing the cheapest model with a 128K+ context window +- Manually comparing prices across providers for the same model + +So I built [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” a structured YAML catalog of 4,587 AI models across 95 providers, all with first-party data. + +## What's Inside + +Every model file includes: + +```yaml +id: gpt-4.1 +name: GPT-4.1 +provider: openai +family: gpt-4 +pricing: + input: 2 # $/M tokens + output: 8 + cache_read: 0.5 +limit: + context: 1047576 # 1M tokens + output: 32768 +tool_call: true +structured_output: true +reasoning: false +modalities: + input: [text, image] + output: [text] +``` + +No more guessing. No more visiting 95 websites. + +## The Numbers + +| Metric | Count | +| ------------------- | ----- | +| Total models | 4,587 | +| Providers | 95 | +| Tool-calling models | 2,350 | +| Reasoning models | 1,306 | +| Vision models | 1,487 | +| Free models | 81 | +| Open weights | 527 | +| Structured output | 829 | + +## Key Design Decisions + +### First-Party Data Only + +Every data point comes from the provider's own API or documentation. No third-party aggregators. 
This means: + +- Pricing is always accurate and up-to-date +- Model capabilities are verified against official sources +- No stale or incorrect data from middlemen + +### Machine-Readable YAML + +Not a web UI you can't query. Not a PDF you can't parse. Structured YAML with: + +- TypeScript type definitions +- Zod runtime validation +- JSON Schema for other languages + +### Automated Sync + +Scrape scripts pull fresh data from provider APIs. CI validates everything on every push. No manual updates needed. + +## How to Use It + +### One Command + +```bash +# Download the latest data +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +# โ†’ 4587 +``` + +### npm Package + +```bash +npm install ai-models +``` + +```javascript +import catalog from "ai-models/models.json"; +console.log(catalog.models.length); // 4587 +``` + +### GitHub Action + +```yaml +- uses: i-need-token/ai-models@v0.2.0 + id: catalog +- run: echo "Models: ${{ steps.catalog.outputs.model-count }}" +``` + +### Interactive Catalog + +Try it live: [i-need-token.github.io/ai-models](https://i-need-token.github.io/ai-models/) + +Features: + +- ๐Ÿ” Search, sort, and filter 4,587 models +- ๐Ÿ’ฐ **Price Calculator** โ€” enter your token usage, see monthly costs +- ๐ŸŽฏ **Model Picker** โ€” answer 2 questions, get top 5 recommendations +- ๐Ÿ“‹ Model detail modal with full metadata +- โฌ‡๏ธ Export CSV/JSON +- ๐Ÿ”— Shareable URL filters + +## Unique Features You Won't Find Elsewhere + +### Price Calculator + +Enter your monthly token usage and instantly see the cheapest, median, and most expensive model. Filter by capability first (e.g., "only tool-calling models"), then calculate. + +### Model Picker + +Answer 2 questions: + +1. What do you need? (chat, code, agents, reasoning, vision, cheap, free, large context) +2. What's your budget? (any, free, low, mid, high) + +Get the top 5 recommended models with pricing and capability badges. 
+ +### 68 Documentation Pages + +34 English + 34 Chinese pages covering: + +- [Free Models](https://github.com/i-need-token/ai-models/blob/main/docs/free-models.md) โ€” 81 free models +- [OpenAI Alternatives](https://github.com/i-need-token/ai-models/blob/main/docs/openai-alternatives.md) โ€” 70+ OpenAI-compatible providers +- [Agentic Models](https://github.com/i-need-token/ai-models/blob/main/docs/agentic-models.md) โ€” 1,080 models with tool_call + reasoning +- [Code Models](https://github.com/i-need-token/ai-models/blob/main/docs/code-models.md) โ€” 189 code-focused models +- [Pricing Comparison](https://github.com/i-need-token/ai-models/blob/main/docs/pricing-comparison.md) โ€” side-by-side pricing +- And 29 more... + +## How It Compares + +| Project | Scope | Data Source | Format | Auto-Update | Free | +| ------------------- | --------------------------- | ---------------- | ----------------- | ----------- | ------- | +| **This catalog** | 95 providers, 4,587+ models | First-party APIs | YAML + JSON + CSV | Weekly CI | โœ… | +| OpenRouter models | OpenRouter only | OpenRouter API | Web UI | โœ… | โœ… | +| Artificial Analysis | ~30 providers | Mixed | Web UI | โœ… | Partial | +| Helicone models | ~20 providers | Mixed | Web UI | โœ… | Partial | +| BerriAI/litellm | 100+ providers | Community | Python config | โœ… | โœ… | + +Key differentiators: + +- **First-party data only** โ€” not aggregated from third parties +- **Machine-readable** โ€” structured data with validation, not just a web UI +- **Multiple formats** โ€” YAML, JSON, CSV, npm, GitHub Action, Hugging Face +- **Bilingual docs** โ€” 68 pages in English and Chinese + +## What's Next + +- Model benchmarking data integration +- Historical pricing trends +- REST API for querying model data +- Python package (`pip install ai-models`) +- Regional availability data + +## Get Started + +โญ [Star the repo](https://github.com/i-need-token/ai-models) if you find it useful + +๐Ÿ” [Try the interactive 
catalog](https://i-need-token.github.io/ai-models/) + +๐Ÿ“ฆ [Download the data](https://github.com/i-need-token/ai-models/releases) + +๐Ÿ“– [Read the docs](https://github.com/i-need-token/ai-models/tree/main/docs) + +--- + +_If you're building with AI models, this catalog saves you hours of research. Give it a star and help others find it too!_ diff --git a/site/free-ai-models.html b/site/free-ai-models.html new file mode 100644 index 00000000..c64782b2 --- /dev/null +++ b/site/free-ai-models.html @@ -0,0 +1,1552 @@ + + + + + + Free AI Models โ€” 81 Models at Zero Cost (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

🆓 Free AI Models — 81 Models at Zero Cost

+

+ A complete, verified list of 81 AI models you can use for free — no credit card, no + hidden fees. Data sourced from first-party provider APIs. +

+ +
+
81Free Models
+
20Providers
+
54Tool Calling
+
33Reasoning
+
27Vision
+
10Open Weights
+
51128K+ Context
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ 💡 Pro tip: Use the + interactive catalog + to filter by "Free" and compare models side-by-side. You can also calculate monthly costs for + paid alternatives. 
+ + + +

๐Ÿ“ Free Models with Largest Context Windows

+

+ These free models can handle the longest inputs — perfect for processing documents, codebases, + and long conversations. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoningVision
openrouter--owl-alphaopenrouter1Mโœ…
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…โœ…
google--lyria-3-clip-previewopenrouter1Mโœ…
google--lyria-3-pro-previewopenrouter1Mโœ…
qwen--qwen3-coder--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…โœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…โœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…โœ…
codestralmistral256K
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…โœ…โœ…
hunyuan-litetencent250K
minimax--minimax-m2.5--freeopenrouter204Kโœ…โœ…
+ +

🔧 Free Models with Tool Calling

+

54 free models support tool/function calling — essential for building AI agents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextReasoningVision
openrouter--owl-alphaopenrouter1M
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…
qwen--qwen3-coder--freeopenrouter1M
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…โœ…
minimax--minimax-m2.5--freeopenrouter204Kโœ…
z-ai--glm-5.1openrouter202Kโœ…
glm-4.5-flashauriko200Kโœ…
glm-4.7-flashzhipuai200K
cobuddybaidu131K
+ +

🧠 Free Models with Reasoning

+

33 free models with advanced reasoning capabilities.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool Call
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…
gemma-4-26b-a4b-itauriko262Kโœ…
gemma-4-31b-itauriko262Kโœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…
minimax--minimax-m2.5--freeopenrouter204Kโœ…
z-ai--glm-5.1openrouter202Kโœ…
+ +

๐Ÿ‘๏ธ Free Models with Vision

+

27 free models that can understand images.

+ + + + + + + +
ModelProviderContextTool Call
+ +

🔓 Free Open-Weights Models

+

10 free models with downloadable weights you can run locally.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
hunyuan-litetencent250K
deepseek-r1-distill-llama-70bcerebras131Kโœ…
deepseek-r1-distill-llama-8bcerebras131Kโœ…
llama-3.3-70bcerebras131Kโœ…
llama-4-scout-17b-16e-instructcerebras131Kโœ…
qwen-2.5-32bcerebras131Kโœ…
qwen-2.5-coder-32bcerebras131Kโœ…
qwen3-32bcerebras131Kโœ…
qwen--qwen3.5-4b-freemixlayer131Kโœ…โœ…
voyage-4-nanovoyage?
+ +

📋 All 81 Free AI Models

+

Complete list of every free AI model in our catalog, sorted by context window size.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoningVisionOpen Weights
openrouter--owl-alphaopenrouter1Mโœ…
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…โœ…
google--lyria-3-clip-previewopenrouter1Mโœ…
google--lyria-3-pro-previewopenrouter1Mโœ…
qwen--qwen3-coder--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…โœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…โœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…โœ…
codestralmistral256K
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…โœ…โœ…
hunyuan-litetencent250Kโœ…
minimax--minimax-m2.5--freeopenrouter204Kโœ…โœ…
z-ai--glm-5.1openrouter202Kโœ…โœ…
glm-4.5-flashauriko200Kโœ…โœ…
glm-4.7-flashzhipuai200Kโœ…
spotlightarcee131Kโœ…
cobuddybaidu131Kโœ…
deepseek-r1-distill-llama-70bcerebras131Kโœ…โœ…
deepseek-r1-distill-llama-8bcerebras131Kโœ…โœ…
llama-3.3-70bcerebras131Kโœ…โœ…
llama-4-scout-17b-16e-instructcerebras131Kโœ…โœ…
qwen-2.5-32bcerebras131Kโœ…โœ…
qwen-2.5-coder-32bcerebras131Kโœ…โœ…
qwen3-32bcerebras131Kโœ…โœ…
gemma-3-12b-itgoogle131Kโœ…
gemma-3-1b-itgoogle131K
gemma-3-27b-itgoogle131Kโœ…
gemma-3-4b-itgoogle131Kโœ…
gemma-3n-E2B-itgoogle131Kโœ…
gemma-3n-E4B-itgoogle131Kโœ…
glm-4-7-flashmeganova131Kโœ…
manta-flash-1.0meganova131Kโœ…
manta-mini-1.0meganova131Kโœ…
manta-pro-1.0meganova131Kโœ…
qwen--qwen3.5-4b-freemixlayer131Kโœ…โœ…โœ…
baidu--cobuddy--freeopenrouter131Kโœ…โœ…
openai--gpt-oss-120b--freeopenrouter131Kโœ…โœ…
openai--gpt-oss-20b--freeopenrouter131Kโœ…โœ…
poolside--laguna-m.1--freeopenrouter131Kโœ…โœ…
poolside--laguna-xs.2--freeopenrouter131Kโœ…โœ…
z-ai--glm-4.5-air--freeopenrouter131Kโœ…โœ…
glm-4.6v-flashauriko128Kโœ…โœ…โœ…
sarvam--sarvam-105bfastrouter128Kโœ…โœ…
sarvam--sarvam-30bfastrouter128Kโœ…โœ…
devstralmistral128Kโœ…
nvidia--nemotron-nano-12b-v2-vl--freeopenrouter128Kโœ…โœ…โœ…
glm-4-flash-250414zhipuai128Kโœ…
glm-4.6v-flashzhipuai128Kโœ…โœ…
baidu--ernie-4.5-0.3baimlapi120Kโœ…
baidu--ernie-4.5-0.3bppio120K
qwen--qwen3-omni-30b-a3b-instructnovitaai65Kโœ…โœ…
qwen--qwen3-omni-30b-a3b-thinkingnovitaai65Kโœ…โœ…โœ…
glm-4.1v-thinking-flashzhipuai64Kโœ…โœ…โœ…
baichuan4baichuan32K
autoglm-phonezhipuai20Kโœ…โœ…
glm-4v-flashzhipuai16Kโœ…โœ…
spark-liteiflytek8K
nvidia--nemotron-3-nano-omniaimlapi?
glm-4.7-flashauriko?โœ…โœ…
glm-4.5-flashllmgateway?โœ…
glm-4.6v-flashllmgateway?โœ…โœ…โœ…
glm-4.7-flashllmgateway?โœ…โœ…
cognitivecomputations--dolphin-mistral-24b-venice-edition--freeopenrouter?
liquid--lfm-2.5-1.2b-instruct--freeopenrouter?
liquid--lfm-2.5-1.2b-thinking--freeopenrouter?โœ…
meta-llama--llama-3.2-3b-instruct--freeopenrouter?
meta-llama--llama-3.3-70b-instruct--freeopenrouter?โœ…
nousresearch--hermes-3-llama-3.1-405b--freeopenrouter?
nvidia--nemotron-3-nano-30b-a3b--freeopenrouter?โœ…โœ…
nvidia--nemotron-nano-9b-v2--freeopenrouter?โœ…โœ…
openrouter--freeopenrouter?โœ…โœ…โœ…
qwen--qwen3-next-80b-a3b-instruct--freeopenrouter?โœ…
step-1x-editstepfun?โœ…
step-2x-largestepfun?โœ…
step-audio-r1.1stepfun?
step-guistepfun?โœ…
voyage-4-nanovoyage?โœ…
glm-ocrzhipuai?โœ…โœ…
+ +

🔗 More Resources

+ + +

Small Language Models

+

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/index.html b/site/index.html new file mode 100644 index 00000000..299757d5 --- /dev/null +++ b/site/index.html @@ -0,0 +1,2323 @@ + + + + + + AI Models Catalog โ€” Interactive Explorer + + + + + + + + + + + + + + + + + +
+
+

🤖 AI Models Catalog

+
+ โญ Star + / to search + +
+
+
+ + + + + +
+
+
+

โŒจ๏ธ Keyboard Shortcuts

+ +
+
+ /Focus search EscClose modal / clear search ?Show this help + ←Previous page →Next page jNext row kPrevious row EnterOpen model detail cToggle compare checkbox +
+
+
+
+
+ +
⭐
+
Finding this useful?
+
+ Star the repo to help others discover it +
+ Star on GitHub +
+
+
+ +
+ + + + diff --git a/site/linkedin-article.md b/site/linkedin-article.md new file mode 100644 index 00000000..016d0a42 --- /dev/null +++ b/site/linkedin-article.md @@ -0,0 +1,86 @@ +# LinkedIn Article: AI Models Catalog + +## Title Options + +1. I Built the Most Comprehensive AI Model Catalog โ€” 4,587 Models, 95 Providers, Zero Third-Party Data +2. How to Choose the Right AI Model in 2025: A Data-Driven Guide +3. Stop Guessing Which AI Model to Use โ€” Here's a Catalog of 4,587 Models with Real Pricing + +--- + +## Article Body + +As AI practitioners, we face a growing challenge: with 4,500+ models from 95+ providers, how do you find the right model for your use case? + +I've been maintaining an open-source AI Models Catalog that solves this problem with first-party data, structured YAML, and an interactive comparison tool. + +**The numbers:** + +- 4,587 models across 95 providers +- 81 free models +- 2,350 with tool calling +- 1,306 with reasoning +- 1,487 with vision +- 527 open weights +- 2,195 with 128K+ context windows + +**What makes it different:** + +1๏ธโƒฃ **First-party data only** โ€” every data point comes from the provider's own API or documentation, not third-party aggregators. This means pricing is accurate, capabilities are verified, and context windows are real. + +2๏ธโƒฃ **Structured & programmable** โ€” every model is a YAML file with Zod-validated TypeScript types. Use it in your code: + +```python +import requests +catalog = requests.get( + "https://github.com/i-need-token/ai-models/releases/latest/download/models.json" +).json() +free_models = [m for m in catalog["models"] if m.get("pricing", {}).get("unit") == "free"] +``` + +3๏ธโƒฃ **Interactive catalog** โ€” search, filter by 9 capabilities, compare models side-by-side, calculate monthly costs, and use the model picker wizard at https://i-need-token.github.io/ai-models/ + +4๏ธโƒฃ **Free to use** โ€” all data is open source under MIT license. 
Download as JSON, CSV, or use the npm package. + +**Who is this for?** + +- ๐Ÿ”ง Developers choosing models for their apps +- ๐Ÿ’ฐ Teams optimizing AI spend +- ๐Ÿค– Agent builders needing tool-calling models +- ๐Ÿ“Š Researchers tracking the AI landscape +- ๐Ÿข Enterprises evaluating providers + +**Key findings from the data:** + +- The cheapest model with tool calling costs $0.01/1M input tokens +- 81 models are completely free (including some with 128K+ context) +- Only 527 out of 4,587 models have open weights +- 1,306 models support reasoning (a rapidly growing category) + +If you work with AI models, I'd love your feedback. Star the repo, open an issue, or contribute a provider. + +๐Ÿ”— GitHub: https://github.com/i-need-token/ai-models +๐Ÿ”— Interactive Catalog: https://i-need-token.github.io/ai-models/ +๐Ÿ”— npm: npm install ai-models + +#AI #MachineLearning #LLM #OpenSource #ArtificialIntelligence #AIModels #DataScience + +--- + +## Short Post Version (for sharing) + +I maintain an open-source catalog of 4,587 AI models from 95 providers โ€” all with first-party data, real pricing, and verified capabilities. + +๐Ÿ” Interactive catalog: https://i-need-token.github.io/ai-models/ +โญ GitHub: https://github.com/i-need-token/ai-models + +Key stats: +โ€ข 81 free models +โ€ข 2,350 with tool calling +โ€ข 1,306 with reasoning +โ€ข 527 open weights +โ€ข 2,195 with 128K+ context + +Search, filter, compare, and calculate costs โ€” all in one place. + +#AI #LLM #OpenSource #MachineLearning diff --git a/site/llm-pricing.html b/site/llm-pricing.html new file mode 100644 index 00000000..7b23fc87 --- /dev/null +++ b/site/llm-pricing.html @@ -0,0 +1,929 @@ + + + + + + LLM Pricing Comparison โ€” 4587 AI Models, Real Prices (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

💰 LLM Pricing Comparison — 4587 AI Models

+

+ Real pricing data for 4587 AI models across 95 providers. All prices are per + million tokens, sourced from first-party APIs. No third-party aggregators. +

+ +
+
$0.01Cheapest Input/1M
+
$150.00Most Expensive Input/1M
+
$1.61Average Input/1M
+
81Free Models
+
0With Cache Pricing
+
+ + ๐Ÿ” Price Calculator in Catalog + โญ Star on GitHub + +
+ 💡 Pro tip: Use the + interactive catalog's price calculator + to estimate monthly costs based on your actual token usage. 
+ + + +

💵 Cheapest AI Models Overall

+

The most affordable models per million input tokens.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-image-1-miniaimlapi$0.007$0.676?
mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
qwen3.5-0.8bdeepinfra$0.01$0.05262K
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
openai--gpt-image-1-modelaimlapi$0.012$0.175?
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
mistral-nemo-instruct-2407deepinfra$0.02$0.04131K
qwen3.5-2bdeepinfra$0.02$0.1262K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
+ +

🔧 Cheapest Models with Tool Calling

+

The most affordable models that support function/tool calling — essential for AI agents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
gpt-oss-20binferencenet$0.03$0.15131K
schematron-v2-turboinferencenet$0.03$0.15131K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
+ +

🧠 Cheapest Models with Reasoning

+

The most affordable models with advanced reasoning capabilities.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
gpt-oss-20bdeepinfra$0.03$0.14131K
qwen3.5-4bdeepinfra$0.03$0.15262K
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120bdeepinfra$0.039$0.19131K
nvidia-nemotron-nano-9b-v2deepinfra$0.04$0.16131K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
nemotron-3-nano-30b-a3bdeepinfra$0.05$0.2262K
+ +

๐Ÿ‘๏ธ Cheapest Models with Vision

+

The most affordable models that can understand images.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
paddlepaddle--paddleocr-vlnovitaai$0.02$0.0216K
qwen3.5-4bdeepinfra$0.03$0.15262K
deepseek--deepseek-ocr-2novitaai$0.03$0.038K
deepseek--deepseek-ocrnovitaai$0.03$0.038K
reka-edge-2reka$0.03$0.1131K
zai-org--autoglm-phone-9b-multilingualnovitaai$0.035$0.13865K
gemini-1.5-flash-8bdeepinfra$0.0375$0.151M
google-gemma-3-4bamazon-bedrock$0.04$0.08131K
+ +

๐Ÿ“ Cheapest Models with 128K+ Context

+

The most affordable models with large context windows (128K+ tokens).

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
mistralai--Mistral-Nemo-Instruct-2407klusterai$0.008$0.001131K
qwen3.5-0.8bdeepinfra$0.01$0.05262K
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
meta-llama-3.1-8b-instruct-turbodeepinfra$0.02$0.03131K
meta-llama-3.1-8b-instructdeepinfra$0.02$0.05131K
mistral-nemo-instruct-2407deepinfra$0.02$0.04131K
qwen3.5-2bdeepinfra$0.02$0.1262K
+ +

๐Ÿ† Flagship Model Prices

+

How much do the top AI models cost? A side-by-side comparison of the most popular models.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
gpt-4.1openai$2$81M
gpt-4oopenai$2.5$10128K
gpt-4o-miniopenai$0.15$0.6128K
gemini-2.5-prodeepinfra$1.25$101M
gemini-2.5-flashdeepinfra$0.3$2.51M
llama-4-maverickdigitalocean$0.25$0.871M
deepseek-r1amazon-bedrock$1.35$5.465K
deepseek-v3deepinfra$0.32$0.89163K
+ +

⚡ Cache Pricing

+

+ 0 models offer cache pricing โ€” significantly reducing costs for repeated prompts. Cache + pricing is typically 50-90% cheaper than standard input pricing. +

+ + + + + + + + +
ModelProviderInput $/1MCache $/1MSavings
+ +

📊 Methodology

+

+ All pricing data is sourced from first-party APIs — not third-party aggregators. Prices + are per million tokens (input and output separately). Aggregator providers (OpenRouter, + Requesty, etc.) are excluded from ranking tables to avoid duplicate models. Cache pricing is + shown where available. +

+

Data is auto-scraped and validated with Zod schemas. Last updated: 2025-05-21.

+ +

🔗 More Resources

+ + + Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/multimodal-ai-models.html b/site/multimodal-ai-models.html new file mode 100644 index 00000000..ebe8c7bb --- /dev/null +++ b/site/multimodal-ai-models.html @@ -0,0 +1,664 @@ + + + + + + + Multimodal AI Models โ€” 1,548 Vision, Audio & Image Models Compared | AI Models Catalog + + + + + + + + + + + + + + + + + +
+
+

🎨 Multimodal AI Models

+

+ 1,548 models that see, hear, speak, and create โ€” compared with pricing, context windows, + and capabilities +

+
+
+
1,548
+
Multimodal Models
+
+
+
1,487
+
Vision
+
+
+
118
+
Audio Input
+
+
+
34
+
Audio Output
+
+
+
28
+
Image Output
+
+
+
167
+
Video Input
+
+
+ ๐Ÿ” Interactive Catalog + โญ Star on GitHub +
+
+
+ + +

📊 Modality Breakdown

+
+
+
๐Ÿ‘๏ธ
+
1,487
+
Vision (Image Input)
+
+
+
🎬
+
167
+
Video Input
+
+
+
🎤
+
118
+
Audio Input
+
+
+
📄
+
141
+
PDF Input
+
+
+
🖼️
+
28
+
Image Output
+
+
+
🔊
+
34
+
Audio Output
+
+
+
🎥
+
4
+
Video Output
+
+
+ +

๐Ÿ† Flagship Multimodal Models

+

The most capable multimodal models across all providers:

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInputOutputTool CallPrice (in/out per 1M)
gpt-4oOpenAI128Ktext, imagetextโœ“$2.50/$10
gpt-4.1OpenAI1Mtext, imagetextโœ“$2/$8
claude-sonnet-4Anthropic200Ktext, imagetextโœ“$3/$15
gemini-2.5-proGoogle1Mtext, image, audio, videotextโœ“$1.25/$10
gemini-2.5-flashGoogle1Mtext, image, audio, videotextโœ“$0.15/$0.60
llama-4-maverickMeta1Mtext, imagetextโœ“Varies
qwen3-235b-a22bAlibaba128Ktext, imagetextโœ“Varies
+ +

๐Ÿ‘๏ธ Vision Models (Image Input)

+

+ 1,487 models can accept images as input alongside text. These are the most common type of + multimodal model: +

+
+

Best Vision Models by Use Case

+
    +
  • + Document analysis: Gemini 2.5 Pro (1M context, PDF + image support), + GPT-4.1 +
  • +
  • Visual Q&A: Claude Sonnet 4, GPT-4o, Llama 4 Maverick
  • +
  • Code from screenshots: GPT-4o, Claude Sonnet 4, Gemini 2.5 Pro
  • +
  • + Medical imaging: Specialized models available through various providers +
  • +
  • + Free vision models: Gemma 3 (1Bโ€“27B), Qwen3 series, Llama 4 Maverick +
  • +
+
+

→ See all 1,487 vision models compared

+ +

🎤 Audio Input Models

+

+ 118 models can process audio input โ€” for transcription, voice analysis, and audio + understanding: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderAudio CapabilitiesContext
gemini-2.5-proGoogleAudio understanding + transcription1M
gemini-2.5-flashGoogleAudio understanding + transcription1M
gpt-4o-audio-previewOpenAIAudio input + output128K
claude-sonnet-4AnthropicAudio transcription200K
+ +

๐Ÿ–ผ๏ธ Image Generation Models

+

+ 28 models can generate images from text descriptions. This is a rapidly growing category: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderCapabilities
gpt-image-1OpenAIText-to-image, image editing
dall-e-3OpenAIText-to-image generation
flux-1.1-proBlack Forest LabsHigh-quality text-to-image
stable-diffusion-3.5Stability AIOpen-weight text-to-image
+

+ โ†’ See all 28 image generation models +

+ +

🔊 Audio Output Models

+

+ 34 models can generate audio output โ€” for text-to-speech, voice cloning, and audio + generation: +

+
+

Key Audio Output Models

+
    +
  • + GPT-4o Audio Preview: Natural conversation with voice input and output +
  • +
  • Gemini 2.5 Flash: Audio understanding with text response
  • +
  • + Specialized TTS models: Available through various providers for + production voice applications +
  • +
+
+ +

🎬 Video Understanding Models

+

+ 167 models can process video input โ€” for video analysis, summarization, and content + understanding: +

+
+

Top Video Understanding Models

+
    +
  • + Gemini 2.5 Pro/Flash: Native video input with 1M context, process up to + 1 hour of video +
  • +
  • GPT-4o: Video frame extraction and analysis
  • +
  • Qwen3 series: Video understanding across model sizes
  • +
+
+ +

🤔 Choosing the Right Multimodal Model

+
+

Decision Framework

+
    +
  • + Image understanding only? โ†’ gemma-3-27b-it (free) or + gpt-4o +
  • +
  • + Need audio + vision? โ†’ gemini-2.5-flash (cheapest + multimodal) or gemini-2.5-pro +
  • +
  • + Generate images? โ†’ gpt-image-1 or + flux-1.1-pro +
  • +
  • + Video analysis? โ†’ gemini-2.5-pro (best video + understanding) +
  • +
  • + Need tool calling + vision? โ†’ llama-4-maverick or + claude-sonnet-4 +
  • +
  • + Budget-conscious? โ†’ gemini-2.5-flash ($0.15/$0.60 per 1M + tokens) +
  • +
  • + Need free API? โ†’ gemma-3-27b-it (Google, free) or + qwen3-32b (Alibaba, free) +
  • +
+
+ +

🔗 Related Comparisons

+ +
+ Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/open-source-ai-models.html b/site/open-source-ai-models.html new file mode 100644 index 00000000..342d6f0c --- /dev/null +++ b/site/open-source-ai-models.html @@ -0,0 +1,849 @@ + + + + + + Open Source AI Models โ€” 527 Open Weight LLMs Compared | AI Models Catalog + + + + + + + + + + + + + + + + +
+
+

🔓 Open Source AI Models

+

+ 527 open-weight LLMs compared โ€” pricing, context windows, tool calling, reasoning, and + vision capabilities +

+
+
+
527
+
Open Weight Models
+
+
+
81
+
Free to Use
+
+
+
375
+
Tool Calling
+
+
+
231
+
Reasoning
+
+
+
269
+
Vision
+
+
+ ๐Ÿ” Interactive Catalog + โญ Star on GitHub +
+
+
+ + +

๐Ÿ† Flagship Open-Weight Models

+

The most capable open-weight models available today, from leading AI labs:

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoningPrice (in/out per 1M)
llama-4-maverickMeta1Mโœ“โœ—Varies
llama-4-scoutMeta10Mโœ“โœ—Varies
deepseek-r1DeepSeek128Kโœ“โœ“Varies
deepseek-v3DeepSeek128Kโœ“โœ—Varies
qwen3-235b-a22bAlibaba128Kโœ“โœ“Varies
qwen3-32bAlibaba128Kโœ“โœ“Varies
llama-3.3-70b-instructMeta128Kโœ“โœ—Varies
gemma-3-27b-itGoogle128Kโœ“โœ—Free
phi-4Microsoft16Kโœ“โœ—Varies
command-aCohere256Kโœ“โœ—Varies
mistral-large-2411Mistral128Kโœ“โœ—Varies
+ +

🆓 Free Open-Source AI Models

+

+ 81 open-weight models you can use for free through their provider APIs. These are ideal for + prototyping, testing, and learning: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
gemma-3-27b-itGoogle128Kโœ“โœ—
gemma-3-12b-itGoogle128Kโœ“โœ—
gemma-3-4b-itGoogle128Kโœ“โœ—
gemma-3-1b-itGoogle128Kโœ—โœ—
qwen3-235b-a22bAlibaba128Kโœ“โœ“
qwen3-30b-a3bAlibaba128Kโœ“โœ“
qwen3-32bAlibaba128Kโœ“โœ“
qwen3-14bAlibaba128Kโœ“โœ“
qwen3-8bAlibaba128Kโœ“โœ“
qwen3-4bAlibaba128Kโœ“โœ“
qwen3-1.7bAlibaba128Kโœ“โœ“
qwen3-0.6bAlibaba128Kโœ“โœ“
llama-4-maverickMeta1Mโœ“โœ—
llama-4-scoutMeta10Mโœ“โœ—
llama-3.3-70b-instructMeta128Kโœ“โœ—
+

+ โ†’ See all 81 free AI models (including non-open-weight) +

+ +

🔧 Open-Weight Tool-Calling Models

+

+ 375 open-weight models support tool/function calling โ€” essential for AI agents and agentic + workflows: +

+
+

Top Open-Weight Tool-Calling Models

+
    +
  • + Llama 4 Maverick/Scout โ€” Meta's latest with native tool calling, 1Mโ€“10M + context +
  • +
  • + Qwen3 series โ€” All sizes support tool calling + reasoning (0.6B to + 235B) +
  • +
  • DeepSeek R1/V3 — Strong tool calling with 128K context
  • +
  • Gemma 3 (1B–27B) — Google's lightweight models with tool calling
  • +
  • + Command A โ€” Cohere's 111B model optimized for enterprise tool use +
  • +
  • + Mistral Large โ€” 123B parameter model with robust function calling +
  • +
+
+

→ See all 2,350 tool-calling models

+ +

🧠 Open-Weight Reasoning Models

+

+ 231 open-weight models with reasoning capabilities โ€” these can "think step by step" for + complex tasks: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallKey Strength
deepseek-r1DeepSeek128Kโœ“Best open-weight reasoning, rivals o1
qwen3-235b-a22bAlibaba128Kโœ“MoE architecture, thinking mode
qwen3-32bAlibaba128Kโœ“Dense reasoning, strong benchmarks
qwen3-30b-a3bAlibaba128Kโœ“Lightweight MoE reasoning
qwen3-14bAlibaba128Kโœ“Mid-size reasoning model
qwen3-8bAlibaba128Kโœ“Small but capable reasoning
+

→ See all 1,306 reasoning models

+ +

๐Ÿ‘๏ธ Open-Weight Vision Models

+

+ 269 open-weight models can process images alongside text โ€” useful for document analysis, + visual Q&A, and multimodal applications: +

+
+

Top Open-Weight Vision Models

+
    +
  • + Llama 4 Maverick/Scout โ€” Native multimodal with 1Mโ€“10M context, process + images + text +
  • +
  • Qwen3 series โ€” Vision-capable across all sizes
  • +
  • Gemma 3 (1Bโ€“27B) โ€” Google's vision-language models, free to use
  • +
  • DeepSeek R1/V3 โ€” Reasoning + vision capabilities
  • +
  • Command A โ€” Enterprise-grade vision + tool calling
  • +
+
+

→ See all 1,487 vision models

+ +

๐Ÿ“ Open-Weight Large Context Models

+

+ Open-weight models with the largest context windows โ€” essential for processing long + documents, codebases, and multi-turn conversations: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContext WindowTool CallReasoning
llama-4-scoutMeta10Mโœ“โœ—
llama-4-maverickMeta1Mโœ“โœ—
command-aCohere256Kโœ“โœ—
deepseek-r1DeepSeek128Kโœ“โœ“
deepseek-v3DeepSeek128Kโœ“โœ—
qwen3-235b-a22bAlibaba128Kโœ“โœ“
llama-3.3-70b-instructMeta128Kโœ“โœ—
gemma-3-27b-itGoogle128Kโœ“โœ—
mistral-large-2411Mistral128Kโœ“โœ—
+

+ โ†’ See all models with context window comparison +

+ +

🤔 How to Choose an Open-Source AI Model

+
+

Decision Framework

+
    +
  • + Need free API access? โ†’ Start with gemma-3-27b-it (Google, + free) or qwen3-32b (Alibaba, free) +
  • +
  • + Building AI agents? โ†’ llama-4-maverick (1M context + tool + calling) or deepseek-r1 (reasoning + tools) +
  • +
  • + Processing long documents? โ†’ llama-4-scout (10M context) + or llama-4-maverick (1M context) +
  • +
  • + Complex reasoning tasks? โ†’ deepseek-r1 (best open-weight + reasoning) or qwen3-235b-a22b +
  • +
  • + Vision/image understanding? โ†’ llama-4-maverick or + gemma-3-27b-it +
  • +
  • + Edge/mobile deployment? โ†’ qwen3-0.6b or + gemma-3-1b-it (smallest open-weight) +
  • +
  • + Enterprise tool use? โ†’ command-a (256K context, optimized + for RAG + tools) +
  • +
+
+
+

Open Weights vs. Proprietary Models

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
AspectOpen WeightsProprietary
Self-hostingโœ“ Run on your own hardwareโœ— Cloud API only
Data privacyโœ“ Full control over dataโœ— Data sent to provider
Customizationโœ“ Fine-tune on your dataโœ— Limited (prompt-based)
Cost at scaleโœ“ Fixed infra costโœ— Per-token pricing
Latest capabilities~3โ€“6 months behindโœ“ Cutting-edge
ConvenienceRequires infra setupโœ“ Instant API access
+
+ +

🔗 Related Comparisons

+ +
+

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/openai-alternatives.html b/site/openai-alternatives.html new file mode 100644 index 00000000..77f5a716 --- /dev/null +++ b/site/openai-alternatives.html @@ -0,0 +1,2851 @@ + + + + + + OpenAI Alternatives โ€” 87 AI Providers Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

🔄 OpenAI Alternatives — 87 AI Providers Compared

+

+ Looking for alternatives to OpenAI? Compare 87 AI providers with 4,587 models. + Real pricing, real capabilities, first-party data. +

+ +
+
87Providers
+
4,587Models
+
81Free Models
+
2,350Tool Calling
+
527Open Weights
+
+ + ๐Ÿ” Interactive Catalog + โญ Star on GitHub + +
+ ๐Ÿ’ก Why consider alternatives? OpenAI is great, but many providers offer + cheaper pricing, larger context windows, open weights, or specialized capabilities. This page + helps you find the right model for your needs. +
+ + + +

💰 Price Comparison: OpenAI vs Alternatives

+

How do alternative providers compare on price? All prices per million tokens.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ProviderModelInput $/1MOutput $/1MContextTool Call
OpenAIgpt-4.1$2$81Mโœ…
OpenAIgpt-4o$2.5$10128Kโœ…
OpenAIgpt-4o-mini$0.15$0.6128Kโœ…
Googlegemini-2.5-pro$1.25$101M
Googlegemini-2.5-flash$0.3$2.51M
DeepSeekdeepseek-r1$1.35$5.465K
DeepSeekdeepseek-v3$0.32$0.89163K
Metallama-4-maverick$0.25$0.871Mโœ…
+ +

🟣 Anthropic (Claude)

+

+ Anthropic's Claude models are known for superior reasoning, safety, and long context windows. + Claude is a strong alternative for complex tasks, coding, and analysis. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
claude-haiku-4-5$1$5200Kโœ…โœ…
databricks-claude-haiku-4-5$1$5200K
claude-haiku-4-5$1$5200Kโœ…
claude-haiku-4-5$1$5200Kโœ…
claude-sonnet-4-0$3$151Mโœ…โœ…
claude-sonnet-4-5$3$151Mโœ…โœ…
claude-sonnet-4-6$3$151Mโœ…โœ…
databricks-claude-sonnet-4-5$3$15200K
databricks-claude-sonnet-4$3$15200K
claude-sonnet-4-6$3$151Mโœ…
claude-sonnet-4-5$3$15200Kโœ…
claude-sonnet-4-6$3$15200Kโœ…
claude-sonnet-4$3$15200Kโœ…
claude-opus-4-5$5$25200Kโœ…โœ…
claude-opus-4-6$5$251Mโœ…โœ…
claude-opus-4-7$5$251Mโœ…โœ…
databricks-claude-opus-4-5$5$25200K
claude-opus-4-7$5$251Mโœ…
claude-opus-4-5$5$25200Kโœ…
claude-opus-4-6$5$25200Kโœ…
claude-opus-4-7$5$25200Kโœ…
claude-opus-4-5$6.25$31.25200Kโœ…
claude-opus-4-0$15$75200Kโœ…โœ…
claude-opus-4-1$15$75200Kโœ…โœ…
databricks-claude-opus-4-1$15$75200K
claude-opus-4-1$15$75200Kโœ…
claude-opus-4$15$75200Kโœ…
claude-opus-4-6-fast$30$1501Mโœ…โœ…
claude-opus-4-7-fast$30$1501Mโœ…โœ…
+ +

🔵 Google (Gemini)

+

+ Google's Gemini models offer multimodal capabilities (text, image, audio, video) with + competitive pricing and massive context windows. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
gemini-1.5-flash-8b$0.0375$0.151M
gemini-1.5-flash$0.075$0.31M
gemini-1.5-flash-8b$0.075$0.31Mโœ…
gemini-1.5-flash$0.075$0.31Mโœ…
gemini-2.0-flash-lite$0.075$0.31Mโœ…
gemini-2-0-flash-lite$0.075$0.31Mโœ…
gemini-2.0-flash$0.1$0.41Mโœ…
gemini-2.5-flash-lite$0.1$0.41Mโœ…
gemini-2-5-flash-lite$0.1$0.41Mโœ…
gemini-2.5-flash$0.15$3.51Mโœ…โœ…
gemini-2-0-flash$0.15$0.61Mโœ…
databricks-gemini-3-1-flash-lite$0.25$1.5128K
gemini-3.1-flash-lite$0.25$1.51Mโœ…
gemini-3-1-flash-lite$0.25$1.5200Kโœ…
databricks-gemini-2-5-flash$0.3$2.5128K
gemini-2.5-flash$0.3$2.51Mโœ…
gemini-2-5-flash$0.3$2.51Mโœ…
gemini-3-flash$0.5$3200Kโœ…
databricks-gemini-3-flash$0.63$3.75128K
databricks-gemini-2-5-pro$1.25$10128K
gemini-2.5-pro$1.25$101Mโœ…
gemini-1.5-pro$1.25$52Mโœ…
gemini-2.5-pro$1.25$101Mโœ…โœ…
gemini-2-5-pro$1.25$101Mโœ…
gemini-3.1-pro$2$121Mโœ…
gemini-3-pro$2$12200Kโœ…
databricks-gemini-3-1-pro$2.5$15128K
chirp-3.0-HD$?$??
gemma-3-12b-itFree131K
gemma-3-1b-itFree131K
gemma-3-27b-itFree131K
gemma-3-4b-itFree131K
gemma-3n-E2B-itFree131K
gemma-3n-E4B-itFree131K
imagen-3.0-fast-generate$?$??
imagen-3.0-generate$?$??
imagen-4.0-fast-generate$?$??
imagen-4.0-generate$?$??
lyria-2.0$?$??
veo-2.0-generate$?$??
+ +

🦙 Meta (Llama)

+

+ Meta's Llama models are open-weight, meaning you can download and run them locally. Great for + privacy-sensitive applications and cost optimization. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoningOpen Weights
meta-llama-4-scoutmeta10Mโœ…
meta-llama-4-maverick-17bamazon-bedrock1Mโœ…โœ…
meta-llama-4-scout-17bamazon-bedrock1Mโœ…โœ…
llama-4-maverick-17b-128e-instruct-fp8deepinfra1M
llama-4-maverickdigitalocean1Mโœ…โœ…
meta-llama--Llama-4-Maverick-17B-128E-Instruct-FP8gmicloud1Mโœ…โœ…
llama-4-maverickgoogle-vertex1Mโœ…โœ…
llama-4-scoutgoogle-vertex1Mโœ…โœ…
meta-llama--Llama-4-Maverick-17B-128E-Instruct-FP8klusterai1Mโœ…
meta-llama--llama-4-maverick-17b-128e-instruct-fp8novitaai1M
meta-llama-4-maverickmeta1Mโœ…
llama-4-scout-17b-16e-instructcloudflare327Kโœ…โœ…
llama-4-scout-17b-16e-instructdeepinfra327K
meta-llama--Llama-4-Scout-17B-16E-Instructgmicloud327Kโœ…โœ…
llama-4-scout-17b-16e-instructvultr327Kโœ…โœ…
+ +

🔮 DeepSeek

+

+ DeepSeek offers high-performance reasoning and chat models at significantly lower prices than + OpenAI. DeepSeek-R1 rivals o1 on reasoning benchmarks. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallReasoning
deepseek--deepseek-ocr-2$0.03$0.038K
deepseek--deepseek-ocr$0.03$0.038K
deepseek--deepseek-r1-0528-qwen3-8b$0.06$0.09128K
deepseek-ai--DeepSeek-R1-Distill-Qwen-7B$0.1$0.2131Kโœ…
deepseek-v4-flash$0.126$0.2521Mโœ…โœ…
deepseek-v4-flash$0.14$0.281Mโœ…
deepseek-chat$0.14$0.281Mโœ…
deepseek-reasoner$0.14$0.281Mโœ…โœ…
deepseek-v4-flash$0.14$0.281Mโœ…โœ…
deepseek-ai--DeepSeek-R1-Distill-Llama-8B$0.14$0.39131Kโœ…
deepseek--deepseek-v4-flash$0.14$0.281Mโœ…โœ…
deepseek--deepseek-v4-flash$0.14$0.281Mโœ…โœ…
deepseek-v4-flash$0.14$0.281Mโœ…โœ…
deepseek--deepseek-r1-distill-qwen-14b$0.15$0.1532K
deepseek--deepseek-4-flash$0.182$0.364?
deepseek-v3-0324$0.2$0.77163K
deepseek-ai--DeepSeek-R1-Distill-Qwen-14B$0.2$0.2131Kโœ…
deepseek--DeepSeek-R1$0.2$0.8163Kโœ…
deepseek--DeepSeek-V3.1$0.2$0.8163K
deepseek-v3.1$0.21$0.79163Kโœ…
deepseek--deepseek-ocr-2$0.216$0.2168Kโœ…
deepseek-ai--DeepSeek-R1-Distill-Llama-70B$0.25$0.75131Kโœ…
deepseek-v3.2$0.252$0.378131Kโœ…โœ…
deepseek-v3.2$0.26$0.38163K
deepseek--deepseek-v3.2$0.269$0.4163Kโœ…โœ…
deepseek-v3.1-terminus$0.27$0.95163Kโœ…
deepseek-ai--DeepSeek-V3.1-Terminus$0.27$1163K
deepseek-ai--DeepSeek-V3.1$0.27$1163K
deepseek-ai--DeepSeek-V3.2-Exp$0.27$0.41163K
deepseek--deepseek-v3-0324$0.27$1.12163Kโœ…
deepseek--deepseek-v3.1-terminus$0.27$1131Kโœ…โœ…
deepseek--deepseek-v3.1$0.27$1131Kโœ…โœ…
deepseek--deepseek-v3.2-exp$0.27$0.41163Kโœ…โœ…
deepseek-v3.1-nex-n1$0.27$1131Kโœ…
deepseek-v3.1-terminus$0.27$1163Kโœ…
deepseek-v3.2-exp$0.27$0.41163Kโœ…
deepseek-v3.2$0.27$0.42163Kโœ…
deepseek-ai--DeepSeek-V3.2-TEE$0.28$0.42131Kโœ…โœ…
deepseek-ai--DeepSeek-V3-0324$0.28$0.88163K
deepseek-ai--DeepSeek-V3-0324$0.28$1.14163Kโœ…
deepseek--deepseek-v3.1-release$0.294$0.441?
deepseek--deepseek-v3.1$0.294$0.441?
DeepSeek-V3.2$0.3$0.45160Kโœ…โœ…
deepseek--deepseek-r1-distill-qwen-32b$0.3$0.364K
deepseek-v3$0.32$0.89163K
deepseek--deepseek-v3.1-terminus$0.364$0.546?
deepseek--deepseek-v3.2-exp-non-thinking$0.364$0.546128Kโœ…
deepseek--deepseekโ€‘v3.2โ€‘exp-thinking$0.364$0.546?
deepseek--deepseek-v3.2-speciale$0.36855$0.56186?
deepseek-v3--fp-8$0.4$1.2131Kโœ…
deepseek--deepseek-v3-turbo$0.4$1.364Kโœ…
deepseek-v4-pro$0.435$0.871Mโœ…โœ…
deepseek-r1-distill-qwen-32b$0.497$4.881131Kโœ…
deepseek-v3-1$0.5$1.5131Kโœ…
deepseek-r1-0528$0.5$2.15163Kโœ…
deepseek-3.2$0.5$1.6131Kโœ…
deepseek-ai--DeepSeek-V3.2$0.5$1.5163Kโœ…
deepseek-ai--DeepSeek-Prover-V2-671B$0.5$2.18163Kโœ…
deepseek-ai--DeepSeek-R1-Distill-Qwen-32B$0.5$0.9131Kโœ…
deepseek-ai--DeepSeek-R1$0.5$2.18163Kโœ…
deepseek-r1-0528--fp-8$0.5$2.15131Kโœ…
deepseek-r1-0528$0.55$2.75131Kโœ…
deepseek-r1-distill-llama-70b$0.55$2.75131Kโœ…
deepseek-r1-distill-llama-8b$0.55$2.75131Kโœ…
deepseek-r1-distill-qwen-1.5b$0.55$2.7532Kโœ…
deepseek-r1-distill-qwen-14b$0.55$2.75131Kโœ…
deepseek-r1-distill-qwen-32b$0.55$2.75131Kโœ…
deepseek-r1-distill-qwen-7b$0.55$2.7532Kโœ…
deepseek-v32-exp$0.55$2.75131K
deepseek-v32-speciale$0.55$2.75131K
deepseek-v32$0.55$2.75131K
deepseek-v4-flash$0.55$2.75131K
deepseek-v4-pro$0.55$2.75131Kโœ…
deepseek-v3-2$0.56$1.6865Kโœ…
deepseek-v3-1$0.6$1.765K
deepseek-ai--DeepSeek-V3.1$0.6$1.7131Kโœ…
deepseek-v3-2$0.62$1.8565Kโœ…
deepseek-r1-distill-llama-70b$0.7$0.8131Kโœ…
deepseek-ai--DeepSeek-R1-0528$0.7$2.3163Kโœ…
deepseek--deepseek-prover-v2-671b$0.7$2.5160K
deepseek--deepseek-r1-0528$0.7$2.5163Kโœ…โœ…
deepseek--deepseek-r1-turbo$0.7$2.564Kโœ…โœ…
deepseek--deepseek-r1-distill-llama-70b$0.8$0.88Kโœ…
deepseek-r1-distill-llama-70b$0.99$0.99131Kโœ…
deepseek-r1-0528-turbo$1$332Kโœ…
deepseek--deepseek-v4-flash$1$21Mโœ…
deepseek-v4-flash$1$2131Kโœ…
deepseek-v4-flash$1$21Mโœ…
deepseek-r1$1.35$5.465K
deepseek-r1$1.35$5.465K
deepseek-v4-pro$1.521$3.042716Kโœ…โœ…
deepseek--deepseek-v4-pro$1.67$3.381Mโœ…โœ…
deepseek-v4$1.74$3.48131Kโœ…โœ…
deepseek-v4-pro$1.74$3.4865K
deepseek-v4-pro$1.74$3.48163Kโœ…โœ…
deepseek-v4-pro$1.74$3.481Mโœ…โœ…
deepseek--deepseek-v4-pro$1.74$3.481Mโœ…โœ…
deepseek-v4-pro$1.74$3.481Mโœ…โœ…
DeepSeek-V4-Pro$1.75$3.51Mโœ…โœ…
deepseek-ai--DeepSeek-V2.5$2$2163K
deepseek--deepseek-v3--community$2$864Kโœ…
deepseek--deepseek-v3-0324$2$8163Kโœ…
deepseek--deepseek-v3-turbo$2$864Kโœ…
deepseek--deepseek-v3.2-exp$2$3163Kโœ…
deepseek--deepseek-v3.2$2$3163Kโœ…
deepseek-v3.2$2$3163Kโœ…
deepseek-v3$2$8163Kโœ…
deepseek-v3-0324$2$8128Kโœ…
deepseek-v3.2$2$3128Kโœ…
deepseek-ai--DeepSeek-V4-Pro$2.1$4.4131Kโœ…โœ…
deepseek--deepseek-v4-pro$2.262$4.524?
deepseek-r1-distill-llama-70b$2.44$2.44131Kโœ…
deepseek-ai--DeepSeek-R1-0528$2.5$5163Kโœ…
DeepSeek-V3.1$3$4.5131K
DeepSeek-V3.2$3$4.532K
deepseek--deepseek-prover-v2-671b$4$16160Kโœ…โœ…
deepseek--deepseek-r1--community$4$1664Kโœ…โœ…
deepseek--deepseek-r1-0528$4$16163Kโœ…โœ…
deepseek--deepseek-r1-turbo$4$1664Kโœ…โœ…
deepseek--deepseek-v3.1-terminus$4$12131Kโœ…
deepseek--deepseek-v3.1$4$12131Kโœ…
deepseek-r1$4$16163Kโœ…
deepseek-v3.1-terminus$4$12163Kโœ…
deepseek-r1-0528$4$16128Kโœ…โœ…
deepseek-v3.1$4$12128Kโœ…
deepseek--deepseek-r1-distill-llama-70b$5.8$5.832Kโœ…โœ…
deepseek--deepseek-v4-pro$12$241Mโœ…
deepseek-v4-pro$12$24128Kโœ…โœ…
deepseek-r1-distill-llama-70bFree131Kโœ…
deepseek-r1-distill-llama-8bFree131Kโœ…
+ +

🇫🇷 Mistral

+

+ Mistral offers both open-weight and commercial models. Known for efficiency and European data + sovereignty. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelInput $/1MOutput $/1MContextTool CallOpen Weights
mistralai--Mistral-Nemo-Instruct-2407$0.008$0.001131Kโœ…
mistral-nemo-instruct-2407$0.02$0.04131K
mistral-nemo-12b-instruct--fp-8$0.0375$0.1131Kโœ…โœ…
ministral-3b$0.04$0.04128Kโœ…
voxtral-mini$0.04$0.04128K
mistralai--mistral-nemo$0.04$0.1760K
mistral-small-24b-instruct-2501$0.05$0.0832K
mistralai--Mistral-Small-24B-Instruct-2501$0.05$0.0832Kโœ…
mistral-small-3.2-24b-instruct-2506$0.075$0.2128K
mistralai--Devstral-Small-2-24B-Instruct$0.1$0.4131Kโœ…โœ…
mistral-small-3-1$0.1$0.3128Kโœ…
ministral-8b$0.1$0.1128Kโœ…
voxtral-small$0.1$0.3128K
Mistral-Small-3.2-24B-Instruct-2506$0.1$0.31131K
mistral-7b-instruct-v0.1$0.11$0.1932Kโœ…
Mistral-7B-Instruct-v0.3$0.11$0.1165K
Mistral-Nemo-Instruct-2407$0.14$0.1465K
mistral-mistral-7b$0.15$0.232Kโœ…
mistral-7b$0.15$0.232K
mistral-nemo$0.15$0.15128Kโœ…
mistral-small-3.2-24b-instruct-2506$0.15$0.35131Kโœ…โœ…
mistral-small$0.2$0.6128Kโœ…
mistral-nemo-instruct-2407$0.2$0.2131Kโœ…
mistralai--Mistral-7B$0.2$28Kโœ…
mistralai--Mistral-Small-3.2-24B-Instruct-2506$0.3$0.3?โœ…
mistral-small-3.1-24b-instruct$0.351$0.555131Kโœ…โœ…
mistral-medium-3$0.4$2128Kโœ…
mistral-medium$0.4$2128Kโœ…
mixtral-8x7b$0.45$0.732Kโœ…
mistral-mistral-large-3$0.5$1.5128Kโœ…
mistralai--Magistral-Small$0.5$2131Kโœ…
magistral-small$0.5$1.5128Kโœ…
mistral-large-3-675b-instruct-2512$0.55$2.75262Kโœ…โœ…
mistral-small-4-119b-2603$0.55$2.75131Kโœ…โœ…
mixtral-8x22b$0.8$1.264Kโœ…
mistral-mistral-small$1$3128Kโœ…
mistral-ai--mixtral-8x22b$1.26$1.26?
mistral-small-24b-instruct-2501$1.26$1.2632Kโœ…
mistral-large$2$6128Kโœ…
pixtral-large$2$6128Kโœ…
mistral-mistral-large$4$12128Kโœ…
mistral-large-2407$4$12128Kโœ…
codestralFree256K
devstralFree128Kโœ…
+ +

🆓 Free Alternatives to OpenAI

+

+ 81 models are available at zero cost โ€” perfect for testing, prototyping, and learning. Many + support tool calling and have large context windows. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
openrouter--owl-alphaopenrouter1Mโœ…
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…โœ…
google--lyria-3-clip-previewopenrouter1M
google--lyria-3-pro-previewopenrouter1M
qwen--qwen3-coder--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…โœ…
gemma-4-26b-a4b-itauriko262Kโœ…โœ…
gemma-4-31b-itauriko262Kโœ…โœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…โœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…โœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…โœ…
codestralmistral256K
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…โœ…
hunyuan-litetencent250K
minimax--minimax-m2.5--freeopenrouter204Kโœ…โœ…
+ +

🔓 Open-Weight Alternatives

+

+ 527 models with downloadable weights you can run locally or on your own infrastructure. No API + dependency, full privacy control. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
google--gemma-4-31b-itorcarouter1Mโœ…
qwen--qwen3.5-flash-2026-02-23orcarouter1Mโœ…
qwen--qwen3.5-flashorcarouter1Mโœ…
qwen--qwen3.6-flash-2026-04-16orcarouter1Mโœ…
qwen--qwen3.6-flashorcarouter1Mโœ…
MiniMax-Text-01302ai1M
llama-4-maverick302ai1M
llama-4-scout302ai1M
meta-llama-4-maverick-17bamazon-bedrock1Mโœ…
meta-llama-4-scout-17bamazon-bedrock1Mโœ…
minimax-m2-1amazon-bedrock1Mโœ…
minimax-m2-5amazon-bedrock1Mโœ…
minimax-m2amazon-bedrock1Mโœ…
minimax-m2-5baseten1Mโœ…
llama-4-maverickdigitalocean1Mโœ…
+ +

📊 Methodology

+

+ All data is sourced from first-party APIs — not third-party aggregators. Pricing, + context windows, and capabilities are verified against official provider documentation. + Aggregator providers are excluded from ranking tables to avoid duplicate models. +

+ +

🔗 More Resources

+ + + Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/promotion-templates.md b/site/promotion-templates.md new file mode 100644 index 00000000..f23859cb --- /dev/null +++ b/site/promotion-templates.md @@ -0,0 +1,105 @@ +# Reddit / HN Post Templates + +## r/LocalLLaMA + +**Title:** I built a catalog of 4,587 AI models across 95 providers โ€” all with structured pricing, context windows, and capabilities + +**Body:** + +Hey r/LocalLLaMA, + +I got tired of checking 95 different websites to compare AI model pricing and capabilities, so I built [AI Models Catalog](https://github.com/i-need-token/ai-models) โ€” a structured YAML catalog of every major AI model. + +**The numbers:** + +- 4,587 models across 95 providers +- 81 free models, 527 open weights +- 2,350 tool-calling, 1,306 reasoning, 1,487 vision +- All data from first-party APIs (no third-party aggregators) + +**What makes it different:** + +- Machine-readable YAML (not just a web UI) +- TypeScript types + Zod validation +- Multiple formats: JSON, CSV, npm, GitHub Action +- 68 documentation pages (34 EN + 34 ZH) + +**Free models:** 81 models you can use at zero cost, including models on Groq, Cerebras, Cloudflare Workers AI, and more. + +**Open weights:** 527 models with downloadable weights (Llama, Mistral, Qwen, DeepSeek, etc.) + +**Interactive catalog:** [i-need-token.github.io/ai-models](https://i-need-token.github.io/ai-models/) โ€” search, filter, price calculator, model picker + +**Quick start:** + +```bash +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' +# โ†’ 4587 +``` + +Would love feedback on what providers or features to add next! + +--- + +## r/MachineLearning + +**Title:** [P] AI Models Catalog โ€” 4,587 models, 95 providers, structured YAML with pricing and capabilities + +**Body:** + +We created a structured catalog of AI model metadata to make model comparison and selection easier for researchers and developers. 
+ +**Repository:** https://github.com/i-need-token/ai-models + +**Key features:** + +- Structured YAML for every model (pricing, context windows, modalities, capabilities) +- First-party data only โ€” scraped from provider APIs +- Zod-validated TypeScript types +- JSON, CSV, npm package, GitHub Action outputs +- 68 documentation pages covering specific use cases + +**Research applications:** + +- Model selection for experiments +- Pricing analysis across providers +- Capability tracking (tool calling, reasoning, structured output) +- Context window comparison +- Open weights tracking + +**Data access:** + +```python +import json +with open("models.json") as f: + catalog = json.load(f) + models = catalog["models"] + free = [m for m in models if m.get("pricing", {}).get("unit") == "free"] + print(f"Free models: {len(free)}") +``` + +Feedback and contributions welcome! + +--- + +## Hacker News (Show HN) + +**Title:** Show HN: AI Models Catalog โ€“ 4,587 models, 95 providers, structured pricing and capabilities + +**Body:** + +I built a structured catalog of AI model metadata because I was tired of visiting 95 different websites to compare models. + +Every model has structured YAML with pricing (per-token), context windows, modalities, and capabilities. All data comes from first-party APIs โ€” no third-party aggregators. 
+ +Key features: + +- 4,587 models across 95 providers +- 81 free models, 527 open weights +- Machine-readable YAML with Zod validation +- JSON, CSV, npm, GitHub Action +- Interactive catalog with price calculator and model picker +- 68 documentation pages + +Try it: https://i-need-token.github.io/ai-models/ +Repo: https://github.com/i-need-token/ai-models diff --git a/site/reasoning-models-comparison.html b/site/reasoning-models-comparison.html new file mode 100644 index 00000000..bff4ba7e --- /dev/null +++ b/site/reasoning-models-comparison.html @@ -0,0 +1,970 @@ + + + + + + AI Reasoning Models Compared โ€” o1, R1, Claude, Gemini (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + +

🧠 AI Reasoning Models Compared (2025)

+

+ Compare 1,306 reasoning models across 95 providers. Find the best chain-of-thought + model for math, science, coding, and complex analysis. +

+ +
+
1,306Reasoning Models
+
95Providers
+
81Free
+
527Open Weights
+
+ + 🔍 Interactive Catalog + ⭐ Star on GitHub + +
+ 💡 What is a reasoning model? Reasoning models (like OpenAI o1/o3, DeepSeek + R1, Claude with extended thinking) use chain-of-thought to break complex problems into steps. + They excel at math, science, coding, and multi-step logic — but often cost more and run slower + than standard models. +
+ +

🏆 Flagship Reasoning Models — Head to Head

+

The top reasoning models compared side by side.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool Call
o3openai$10$40200Kโœ…
o3-miniopenai$1.1$4.4200Kโœ…
o4-miniopenai$1.1$4.4200Kโœ…
o1openai$15$60200Kโœ…
o1-miniopenai$1.5$6128Kโœ…
o1-proopenai$150$600200Kโœ…
deepseek-r1-distill-llama-70bcerebrasFree131K
gemini-2.5-prodeepinfra$1.25$101M
gemini-2.5-flashdeepinfra$0.3$2.51M
qwen3-235b-a22balibaba$2$8?โœ…
+ +

💰 Cheapest Reasoning Models

+

Reasoning on a budget — most affordable models with reasoning capability.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool Call
qwen3.5-0.8bdeepinfra$0.01$0.05262K
qwen3.5-2bdeepinfra$0.02$0.1262K
gpt-oss-20bdeepinfra$0.03$0.14131K
qwen3.5-4bdeepinfra$0.03$0.15262K
openai--gpt-oss-20bneuralwatt$0.03$0.16?โœ…
qwen--qwen3-4b-fp8novitaai$0.03$0.03128Kโœ…
gpt-oss-120bdeepinfra$0.039$0.19131K
nvidia-nemotron-nano-9b-v2deepinfra$0.04$0.16131K
openai--gpt-oss-20bnovitaai$0.04$0.15131K
nemotron-3-nano-30b-a3bdeepinfra$0.05$0.2262K
gpt-oss-120binferencenet$0.05$0.45131Kโœ…
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?โœ…
openai--gpt-oss-120bnovitaai$0.05$0.25131Kโœ…
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540Kโœ…
glm-4.7-flashcloudflare$0.06$0.4131Kโœ…
+ +

🆓 Free Reasoning Models

+

33 reasoning models at zero cost — perfect for learning and prototyping.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool Call
deepseek--deepseek-v4-flash--freeopenrouter1Mโœ…
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1Mโœ…
gemma-4-26b-a4b-itauriko262Kโœ…
gemma-4-31b-itauriko262Kโœ…
arcee-ai--trinity-large-thinking--freeopenrouter262Kโœ…
google--gemma-4-26b-a4b-it--freeopenrouter262Kโœ…
google--gemma-4-31b-it--freeopenrouter262Kโœ…
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256Kโœ…
minimax--minimax-m2.5--freeopenrouter204Kโœ…
z-ai--glm-5.1openrouter202Kโœ…
+ +

🔓 Open-Weight Reasoning Models

+

120 reasoning models you can run locally for full privacy and zero API costs.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool Call
xiaomi--mimo-v2.5-prohpc-ai1Mโœ…
xiaomi--mimo-v2.5hpc-ai1Mโœ…
deepseek--deepseek-v4-flashhpc-ai1Mโœ…
deepseek--deepseek-v4-prohpc-ai1Mโœ…
DeepSeek-V4-Pronebius1Mโœ…
trinity-large-thinkingarcee262Kโœ…
qwen3-next-80b-a3b-thinkingclarifai262Kโœ…
gemma-4-26b-a4b-itcloudflare262Kโœ…
kimi-k2.5cloudflare262Kโœ…
kimi-k2.6cloudflare262Kโœ…
+ +

🔧 Reasoning + Tool Calling

+

+ Models with both reasoning and tool calling — the most capable for agentic workflows that need + complex planning. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120binferencenet$0.05$0.45131K
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K
glm-4.7-flashcloudflare$0.06$0.4131K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K
seed-1.6-flashbytedance$0.07$0.3262K
ring-2.6-1tinclusionai$0.07$0.62262K
zai-org--glm-4.7-flashnovitaai$0.07$0.4200K
microsoft-phi-4-mini-reasoningmicrosoft$0.075$0.3128K
Qwen--Qwen3-32B-TEEchutes$0.08$0.2440K
gpt-oss-120bclarifai$0.09$0.36131K
+ +

📏 Large Context Reasoning Models

+

+ Reasoning models with 128K+ context — for analyzing long documents, large codebases, and + complex multi-step problems. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MTool Call
qwen3.5-0.8bdeepinfra262K$0.01
qwen3.5-2bdeepinfra262K$0.02
gpt-oss-20bdeepinfra131K$0.03
qwen3.5-4bdeepinfra262K$0.03
qwen--qwen3-4b-fp8novitaai128K$0.03โœ…
gpt-oss-120bdeepinfra131K$0.039
nvidia-nemotron-nano-9b-v2deepinfra131K$0.04
openai--gpt-oss-20bnovitaai131K$0.04
nemotron-3-nano-30b-a3bdeepinfra262K$0.05
gpt-oss-120binferencenet131K$0.05โœ…
openai--gpt-oss-120bnovitaai131K$0.05โœ…
glm-4.7-flashcloudflare131K$0.06โœ…
glm-4.7-flashdeepinfra202K$0.06
Nemotron-3-Nano-Omninebius128K$0.06โœ…
hermes-4-llama-3.1-8bnousresearch131K$0.06โœ…
+ +

📊 Methodology

+

+ All data is sourced from first-party APIs. Reasoning capability is defined by the + provider's own classification — models that use chain-of-thought, extended thinking, or + similar techniques. Aggregator providers are excluded from ranking tables to avoid duplicate + models. +

+ +

🔗 More Resources

+ + +

Small Language Models

+

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/robots.txt b/site/robots.txt new file mode 100644 index 00000000..42b43f0d --- /dev/null +++ b/site/robots.txt @@ -0,0 +1,4 @@ +User-agent: * +Allow: / + +Sitemap: https://i-need-token.github.io/ai-models/sitemap.xml diff --git a/site/sitemap.xml b/site/sitemap.xml new file mode 100644 index 00000000..1aaa1cf7 --- /dev/null +++ b/site/sitemap.xml @@ -0,0 +1,276 @@ + + + + https://i-need-token.github.io/ai-models/ + daily + 1.0 + + + https://i-need-token.github.io/ai-models/docs/agentic-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/api + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/audio-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/cached-pricing + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/chat-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/code-examples + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/code-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/context-windows + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/data-acquisition + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/data-schema + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/embedding-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/faq + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/free-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/glossary + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/image-generation + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/large-context-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/lessons-learned + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/migration-guide + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/modality-matrix + weekly + 0.7 + + + 
https://i-need-token.github.io/ai-models/docs/model-comparison + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/model-selection + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/multimodal-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/open-weights + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/pricing-comparison + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/provider-comparison + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/providers + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/quick-start + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/reasoning-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/small-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/structured-output + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/tool-calling + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/video-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/vision-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/models.json + daily + 0.9 + + + https://i-need-token.github.io/ai-models/docs/openai-alternatives + weekly + 0.8 + + + https://i-need-token.github.io/ai-models/docs/agentic-models + weekly + 0.8 + + + https://i-need-token.github.io/ai-models/docs/code-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/docs/audio-models + weekly + 0.7 + + + https://i-need-token.github.io/ai-models/best-ai-models.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/free-ai-models.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/llm-pricing.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/openai-alternatives.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/ai-models-by-provider.html + weekly + 0.9 + + + 
https://i-need-token.github.io/ai-models/context-window-comparison.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/best-ai-models-for-coding.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/best-ai-models-for-agents.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/reasoning-models-comparison.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/cheapest-ai-models.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/tool-calling-models-comparison.html + weekly + 0.9 + + + https://i-need-token.github.io/ai-models/ai-model-pricing-calculator.html + weekly + 0.9 + + + + https://i-need-token.github.io/ai-models/best-ai-models-for-image-generation.html + weekly + 0.9 + + + + https://i-need-token.github.io/ai-models/best-ai-models-for-vision.html + weekly + 0.9 + + + + https://i-need-token.github.io/ai-models/structured-output-models-comparison.html + weekly + 0.9 + +https://i-need-token.github.io/ai-models/open-source-ai-models.html0.9weeklyhttps://i-need-token.github.io/ai-models/multimodal-ai-models.html0.9weekly \ No newline at end of file diff --git a/site/small-language-models.html b/site/small-language-models.html new file mode 100644 index 00000000..7d80cca0 --- /dev/null +++ b/site/small-language-models.html @@ -0,0 +1,611 @@ + + + + + + + Small Language Models (SLM) โ€” 2,000+ Models Under 10B Parameters (2025) | AI Models Catalog + + + + + + + + + + + + + + + + +
+

🤏 Small Language Models (SLM) — 2,000+ Models Under 10B Parameters

+

+ Complete guide to small language models for edge deployment, mobile apps, and cost-efficient + production. All data from + AI Models Catalog — first-party data + only. +

+ +
+
+
2,002
+
Small Models
+
+
+
928
+
With Tool Calling
+
+
+
557
+
With Reasoning
+
+
+
48
+
Free SLMs
+
+
+
689
+
First-Party
+
+
+ + 🔍 Search All 4,587 Models → + +

What Are Small Language Models?

+

+ Small Language Models (SLMs) are AI models with fewer than ~10 billion parameters, designed + for efficiency, low latency, and deployment on resource-constrained hardware — from + smartphones to edge servers. They offer a practical alternative to large frontier models + when cost, speed, or privacy matters. +

+

Key advantages of SLMs:

+
    +
  • Lower cost — often 10-100x cheaper per token than frontier models
  • +
  • Lower latency — faster inference for real-time applications
  • +
  • Edge deployment — run on-device without cloud dependency
  • +
  • Privacy — data never leaves the device
  • +
  • Fine-tuning — easier to customize for specific domains
  • +
+ +

Cheapest Small Models with Tool Calling

+

Best value SLMs for AI agents and tool-use workflows (first-party providers only):

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextReasoning
ling-2.6-flashling$0.01$0.03262K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microibm$0.017$0.112131K
llama-3.1-8b-instruct--fp-16fireworks$0.02$0.03131K
schematron-3bfireworks$0.02$0.05131K
+ +

Free Small Language Models

+

48 small models available at zero cost — perfect for prototyping and development:

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallingReasoning
deepseek-r1-distill-llama-8bcerebras131Kโœ“
llama-4-scout-17b-16e-instructcerebras131Kโœ“
qwen-2.5-32bcerebras131Kโœ“
gemma-4-26b-a4b-itauriko262Kโœ“
glm-4.5-flashauriko200Kโœ“
glm-4.6v-flashauriko128Kโœ“
baidu--ernie-4.5-0.3baimlapi120Kโœ“
+ +

Small Models with Reasoning

+

+ 557 small models with reasoning capabilities — ideal for math, logic, and step-by-step + problem solving: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/MOutput $/MContextTool Calling
qwen3.5-0.8bqwen$0.01$0.05262K
qwen3.5-2bqwen$0.02$0.10262K
qwen--qwen3-4b-fp8fireworks$0.03$0.03128K
qwen3.5-4bqwen$0.03$0.15262K
deepseek-r1-distill-llama-8bcerebrasFreeFree131K
+ +

Best SLMs by Use Case

+

🤖 AI Agents on a Budget

+

+ ling-2.6-flash ($0.01/$0.03/M) — cheapest tool-calling model with 262K + context. Perfect for high-volume agent workflows. +

+

📱 On-Device / Edge Deployment

+

+ Qwen3.5 0.8B — ultra-compact reasoning model. + Gemma 4 26B A4B IT — free with vision + tool calling. +

+

💻 Code Completion

+

+ bdc-coder ($0.01/$0.01/M) — cheapest coding model. + Qwen3 4B ($0.03/$0.15/M) — open-source with reasoning. +

+

🧮 Math & Reasoning

+

+ DeepSeek R1 Distill Llama 8B — free reasoning model. + Qwen3.5 0.8B ($0.01/$0.05/M) — cheapest reasoning. +

+

💬 Chat & RAG

+

+ GPT-4.1-nano ($0.10/$0.40/M) — fast, cheap, reliable. + Qwen3 4B ($0.03/$0.15/M) — open-source alternative. +

+ +

SLM vs LLM: When to Choose Small

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
FactorSmall Model (SLM)Large Model (LLM)
Cost per 1M tokens$0.01 โ€“ $0.20$1 โ€“ $40
Latency (first token)50 โ€“ 200ms200 โ€“ 2000ms
DeploymentOn-device, edge, cloudCloud only
PrivacyData stays on deviceData sent to cloud
CustomizationEasy fine-tuningExpensive fine-tuning
Complex reasoningGood for simple tasksSuperior for complex tasks
Best forHigh-volume, real-time, edgeComplex, nuanced, creative
+ + + +

🎯 AI Model Picker

+

⚡ GitHub Action

+ +
+ + diff --git a/site/social-preview.svg b/site/social-preview.svg new file mode 100644 index 00000000..063f980e --- /dev/null +++ b/site/social-preview.svg @@ -0,0 +1,109 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + AI Models Catalog + + + Structured YAML catalog of AI model metadata โ€” pricing, context windows, capabilities + + + + + + MODELS + 4,587 + + + + PROVIDERS + 95 + + + + FREE MODELS + 81 + + + + OPEN WEIGHTS + 527 + + + + + + ๐Ÿ”ง 2,350 Tool Calling + + + ๐Ÿง  1,306 Reasoning + + + ๐Ÿ‘๏ธ 1,487 Vision + + + ๐Ÿ“‹ 829 Structured Output + + + ๐Ÿค– 1,080 Agentic + + + + + First-party data ยท TypeScript types ยท Zod validation ยท Auto-scraped + + + + + YAML + + + JSON + + + CSV + + + npm + + + GitHub Action + + + + + github.com/i-need-token/ai-models + + + + \ No newline at end of file diff --git a/site/state-of-ai-models.html b/site/state-of-ai-models.html new file mode 100644 index 00000000..9aa53624 --- /dev/null +++ b/site/state-of-ai-models.html @@ -0,0 +1,729 @@ + + + + + + State of AI Models 2025 โ€” Data-Driven Report | AI Models Catalog + + + + + + + + + + + + + + +
+

📊 State of AI Models 2025

+

+ A data-driven analysis of 4,587 AI models across 95 providers — pricing trends, capability + adoption, context window growth, and the rise of open-source AI. +

+
+
+
+
+
4,587
+
Total Models
+
+
+
95
+
Providers
+
+
+
81
+
Free Models
+
+
+
527
+
Open-Weight
+
+
+
2,350
+
Tool Calling
+
+
+
1,306
+
Reasoning
+
+
+
1,487
+
Vision
+
+
+
2,195
+
128K+ Context
+
+
+ +

1. Provider Landscape

+

+ The AI model ecosystem spans 95 providers, from tech giants to specialized startups. The top + 15 providers account for the majority of models: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ProviderModelsNotable Models
OpenRouter415Aggregator โ€” routes to 100+ models
Google261Gemini 2.5 Pro/Flash, Gemma 3
Requesty234Aggregator โ€” unified API
Cohere197Command R+, Embed v3
xAI193Grok 3, Grok 3 Mini
DeepSeek184DeepSeek R1, V3
Meta163Llama 4 Maverick/Scout
Mistral155Mistral Large, Codestral
Alibaba (Qwen)139Qwen3-235B, QwQ
Anthropic121Claude Sonnet 4, Opus 4
OpenAI115GPT-4.1, o3, o4-mini
Microsoft99Phi-4, Florence 2
Amazon96Nova Pro, Titan
NVIDIA87Nemotron, Llama Nemotron
01.ai83Yi-Lightning, Yi-VL
+
+ Key Insight: Aggregators (OpenRouter, Requesty) offer the widest selection + but may duplicate models available from first-party providers. For the best pricing, go + direct to the source. +
+ +

2. Pricing Distribution

+

+ AI model pricing varies dramatically — from completely free to over $15 per million input + tokens. Here is the breakdown of the 4,587 models: +

+
+
+
Free
+
+
81 models
+
+
+
< $0.50/M
+
+
~1,800 models
+
+
+
$0.50–$5/M
+
+
~1,400 models
+
+
+
> $5/M
+
+
~480 models
+
+
+
+ Key Insight: The median input price for tool-calling models is $0.50/M + tokens, while the median for reasoning models is $0.80/M. Vision-capable models average $1.50/M — + still affordable for most production use cases. +
+ +

3. Capability Adoption

+

+ Modern AI models increasingly support advanced capabilities beyond basic text generation: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
CapabilityModels% of TotalAvg Input $/M
Tool Calling2,35051.2%$1.50
Reasoning1,30628.5%$2.10
Structured Output82918.1%$1.80
Vision (Image Input)1,48732.4%$1.50
Open Weights52711.5%Free or low-cost
Image Generation280.6%$3.00+
Audio Input1182.6%$2.50+
Audio Output340.7%$3.00+
Video Input1673.6%$2.00+
+
+ Key Insight: Over half of all models now support tool calling — it has + become table stakes for production AI. Reasoning capabilities are growing fast, with 1,306 + models (28.5%) supporting extended thinking. +
+ +

4. Context Window Revolution

+

+ Context windows have grown exponentially. The average context window across all models is + now approximately 200K tokens: +

+
+
+
< 32K
+
+
~800 models
+
+
+
32K–128K
+
+
~1,000 models
+
+
+
128K–1M
+
+
~2,195 models
+
+
+
1M+
+
+
~30 models
+
+
+

Largest Context Windows

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelContextProvider
Google Gemini 2.5 Pro1,048,576Google
Google Gemini 2.5 Flash1,048,576Google
Meta Llama 4 Scout10,000,000Meta
Meta Llama 4 Maverick1,048,576Meta
Google Gemma 3 27B131,072Google
+
+ Key Insight: 128K+ context is now the norm — 2,195 models (47.8%) support + it. Meta's Llama 4 Scout leads with a 10M token window, making entire codebases and books + processable in a single prompt. +
+ +

5. The Rise of Free & Open-Source AI

+

+ 81 models are completely free to use, and 527 have open weights. Here are the most capable + free models: +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelContextCapabilitiesProvider
Google Gemini 2.5 Flash1MTC, Reasoning, Vision, SOGoogle
DeepSeek R1128KReasoning, TCDeepSeek
Meta Llama 4 Maverick1MTC, VisionMeta
Alibaba Qwen3-235B128KTC, Reasoning, SOAlibaba
Google Gemma 3 27B131KVision, TCGoogle
+
+ Key Insight: Free models now rival paid ones in capability. Google Gemini + 2.5 Flash (free tier) offers 1M context, tool calling, reasoning, and vision — making it + viable for production use at zero cost. +
+ +

6. Best Value Models by Use Case

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseBest FreeBest Paid (Cheapest)Best Overall
General ChatGemini 2.5 FlashDeepSeek V3 ($0.07/$0.28)Claude Sonnet 4
CodingDeepSeek R1DeepSeek V3 ($0.07/$0.28)Claude Sonnet 4
AI AgentsGemini 2.5 FlashGrok 3 Mini ($0.30/$0.50)Claude Sonnet 4
ReasoningDeepSeek R1Grok 3 Mini ($0.30/$0.50)o3
VisionGemini 2.5 FlashGemma 3 4B (free)Gemini 2.5 Pro
Large ContextLlama 4 Scout (10M)Gemini 2.5 Flash ($0.15/$0.60)Gemini 2.5 Pro
+ +

7. Key Trends & Predictions

+
+ Trend 1: Agentic AI is the new default. 51% of models support tool calling, + and 1,080 models are classified as "agentic" (tool_call + chat). Expect this to reach 80%+ + by 2026. +
+
+ Trend 2: Context windows are commoditized. 128K context is now standard. + 1M+ context models are growing, with Google and Meta leading. Expect 10M+ to become common + by 2026. +
+
+ Trend 3: Free tiers are production-ready. 81 free models with capabilities + like tool calling and reasoning mean that cost is no longer a barrier to entry for AI + development. +
+
+ Trend 4: Multimodal is mainstream. 1,548 models support more than text + input. Vision (1,487 models) is nearly universal among flagship models. Audio and video are + the next frontiers. +
+
+ Trend 5: Open weights are accelerating. 527 open-weight models exist, with + Meta's Llama 4 and Alibaba's Qwen3 leading. Expect open-source to match proprietary + capabilities within 6 months. +
+ + +
+ Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+
+

+ Data from + AI Models Catalog + — 4,587 models across 95 providers. Updated continuously. +

+
+ + diff --git a/site/structured-output-models-comparison.html b/site/structured-output-models-comparison.html new file mode 100644 index 00000000..da0b060d --- /dev/null +++ b/site/structured-output-models-comparison.html @@ -0,0 +1,742 @@ + + + + + + + Structured Output AI Models โ€” JSON Mode, Function Calling Compared (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + + +

📋 Structured Output AI Models (2025)

+

+ Compare 829 AI models with structured output / JSON mode support. GPT-4o, Claude, Gemini, and + more — real pricing and capabilities from first-party data. +

+ +
+
829Structured Output Models
+
780SO + Tool Calling
+
672SO + Reasoning
+
4,587Total Models
+
+ + 🔍 Interactive Catalog + ⭐ Star on GitHub + +
+ 💡 What is structured output? Structured output (also called JSON mode) + allows LLMs to generate responses in a specific schema — JSON, XML, or other formats. This is + essential for building reliable AI applications that parse model outputs programmatically. +
+ +

🏆 Flagship Structured Output Models — Head to Head

+

+ The top-tier models from each major provider, all supporting structured output with tool + calling. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool CallReasoning
gpt-4oopenai$2.50$10128Kโœ…
gpt-4o-miniopenai$0.15$0.60128Kโœ…
o3openai$2$8200Kโœ…โœ…
o4-miniopenai$1.10$4.40200Kโœ…โœ…
claude-sonnet-4-20250514anthropic$3$15200Kโœ…โœ…
claude-opus-4-20250514anthropic$15$75200Kโœ…โœ…
gemini-2.5-progoogle$1.25$101Mโœ…โœ…
gemini-2.5-flashgoogle$0.15$0.601Mโœ…โœ…
deepseek-r1deepseek$0.55$2.19128Kโœ…
grok-3xai$3$15131Kโœ…โœ…
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…โœ…
llama4-maverickmeta$0.20$0.801Mโœ…
+ +

💰 Cheapest Structured Output Models

+

+ Most affordable models with structured output — ideal for high-volume production applications. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool Call
gemini-2.0-flash-litegoogle$0.075$0.301Mโœ…
gemini-2.5-flashgoogle$0.15$0.601Mโœ…
gpt-4o-miniopenai$0.15$0.60128Kโœ…
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…
llama4-maverickmeta$0.20$0.801Mโœ…
deepseek-chatdeepseek$0.14$0.28128K
+ +

🆓 Free Structured Output Models

+

+ Structured output models available at zero cost — perfect for prototyping JSON-mode + applications. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextTool CallReasoning
gemini-2.0-flashgoogle1Mโœ…
gemini-2.5-flashgoogle1Mโœ…โœ…
llama4-scout-17b-16emeta10M
qwen3-30b-a3balibaba128Kโœ…
+ +

🤖 Structured Output + Tool Calling

+

+ 780 models that support both structured output and tool calling — the ideal combination for + building AI agents that return structured data from function calls. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextReasoning
gemini-2.0-flash-litegoogle$0.075$0.301M
gemini-2.5-flashgoogle$0.15$0.601Mโœ…
gpt-4o-miniopenai$0.15$0.60128K
qwen3-235b-a22balibaba$0.14$0.42128Kโœ…
claude-sonnet-4-20250514anthropic$3$15200Kโœ…
grok-3-minixai$0.30$0.50131Kโœ…
+ +

🧠 Structured Output + Reasoning

+

+ 672 models with both structured output and reasoning capabilities — for complex tasks that + require both thinking and structured responses. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextTool Call
gemini-2.5-flashgoogle$0.15$0.601M✅
qwen3-235b-a22balibaba$0.14$0.42128K✅
deepseek-chatdeepseek$0.14$0.28128K
deepseek-r1deepseek$0.55$2.19128K
o4-miniopenai$1.10$4.40200K✅
o3openai$2$8200K✅
claude-sonnet-4-20250514anthropic$3$15200K✅
+ +

🔑 Choosing the Right Structured Output Model

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Use CaseRecommended ModelWhy
API response parsinggpt-4o-miniCheapest with SO + tool calling
Data extractiongemini-2.5-flash1M context + SO + reasoning + cheap
AI agentsclaude-sonnet-4Best tool calling + SO + reasoning
High volume / cheapgemini-2.0-flash-liteLowest cost at $0.075/M input
Complex reasoningo3Best reasoning + SO + tool calling
Prototypinggemini-2.5-flashFree tier, 1M context, all capabilities
+ +

📊 Methodology

+

+ All data is sourced from first-party APIs. Models are identified by having + structured_output: true in their metadata. Aggregator providers are excluded from + ranking tables to avoid duplicate models. Pricing is per million tokens. +

+ +

🔗 More Resources

+ + + Small Language Models +

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/tool-calling-models-comparison.html b/site/tool-calling-models-comparison.html new file mode 100644 index 00000000..e254f07d --- /dev/null +++ b/site/tool-calling-models-comparison.html @@ -0,0 +1,1118 @@ + + + + + + + Tool Calling AI Models Compared — Function Calling LLMs (2025) | AI Models Catalog + + + + + + + + + + + + + + + + + + + +

🔧 Tool Calling AI Models Compared (2025)

+

+ Compare 2,350 AI models with tool/function calling across 95 providers. Find the best + model for agents, automation, and API integration. +

+ +
+
2,350Tool Calling Models
+
95Providers
+
81Free
+
527Open Weights
+
+ + 🔍 Interactive Catalog + ⭐ Star on GitHub + +
+ 💡 What is tool calling? Tool calling (also called function calling) lets + LLMs invoke external APIs, databases, and services. This is the foundation of AI agents — + without tool calling, a model can only generate text. With it, models can search the web, run + code, query databases, and take real-world actions. +
+ +

🏆 Flagship Tool Calling Models — Head to Head

+

The top models with tool calling compared side by side.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextReasoning
gpt-4oopenai$2.5$10128K
gpt-4o-miniopenai$0.15$0.6128K
gpt-4.1openai$2$81M
gpt-4.1-miniopenai$0.4$1.61M
gpt-4.1-nanoopenai$0.1$0.41M
o3openai$10$40200K✅
o3-miniopenai$1.1$4.4200K✅
o4-miniopenai$1.1$4.4200K✅
gemini-2.0-flashgoogle$0.1$0.41M
deepseek-chatdeepseek$0.14$0.281M
qwen3-235b-a22balibaba$2$8?✅
llama-4-maverickdigitalocean$0.25$0.871M
llama-4-scoutgoogle-vertex$0.25$0.71M
+ +

💰 Cheapest Tool Calling Models

+

Most affordable models with tool calling — for cost-sensitive agents and automation.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContextReasoning
ling-2.6-flashinclusionai$0.01$0.03262K
bdc-coderinferencenet$0.01$0.01131K
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai$0.015$0.02131K
granite-4.0-h-microcloudflare$0.017$0.112131K
llama-3.1-8b-instruct--fp-16inferencenet$0.02$0.03131K
schematron-3binferencenet$0.02$0.05131K
schematron-v3inferencenet$0.02$0.05131K
gpt-oss-20binferencenet$0.03$0.15131K
schematron-v2-turboinferencenet$0.03$0.15131K
openai--gpt-oss-20bneuralwatt$0.03$0.16?✅
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K✅
liquid-ai--LFM2-24B-A2Btogetherai$0.03$0.12131K
amazon-nova-microamazon$0.035$0.14128K
amazon-nova-microamazon-bedrock$0.035$0.14128K
mistral-nemo-12b-instruct--fp-8inferencenet$0.0375$0.1131K
+ +

🆓 Free Tool Calling Models

+

54 models with tool calling at zero cost — perfect for prototyping agents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextReasoning
openrouter--owl-alphaopenrouter1M
deepseek--deepseek-v4-flash--freeopenrouter1M✅
qwen--qwen3-coder--freeopenrouter1M
nvidia--nemotron-3-super-120b-a12b--freeopenrouter1M✅
gemma-4-26b-a4b-itauriko262K✅
gemma-4-31b-itauriko262K✅
arcee-ai--trinity-large-thinking--freeopenrouter262K✅
google--gemma-4-26b-a4b-it--freeopenrouter262K✅
google--gemma-4-31b-it--freeopenrouter262K✅
nvidia--nemotron-3-nano-omni-30b-a3b-reasoning--freeopenrouter256K✅
+ +

🔓 Open-Weight Tool Calling Models

+

278 models with tool calling you can run locally — for privacy-first agents.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextReasoning
google--gemma-4-31b-itorcarouter1M
qwen--qwen3.5-flash-2026-02-23orcarouter1M
qwen--qwen3.5-flashorcarouter1M
qwen--qwen3.6-flash-2026-04-16orcarouter1M
qwen--qwen3.6-flashorcarouter1M
meta-llama-4-maverick-17bamazon-bedrock1M
meta-llama-4-scout-17bamazon-bedrock1M
minimax-m2-1amazon-bedrock1M
minimax-m2-5amazon-bedrock1M
minimax-m2amazon-bedrock1M
+ +

🧠 Tool Calling + Reasoning

+

+ Models with both tool calling and reasoning — the most capable for complex agentic workflows + that need planning and execution. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
openai--gpt-oss-20bneuralwatt$0.03$0.16?
qwen--qwen3-4b-fp8novitaai$0.03$0.03128K
gpt-oss-120binferencenet$0.05$0.45131K
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
qwen3-30b-a3b-fp8cloudflare$0.051$0.33540K
glm-4.7-flashcloudflare$0.06$0.4131K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
hermes-4-llama-3.1-8bnousresearch$0.06$0.12131K
seed-1.6-flashbytedance$0.07$0.3262K
ring-2.6-1tinclusionai$0.07$0.62262K
zai-org--glm-4.7-flashnovitaai$0.07$0.4200K
microsoft-phi-4-mini-reasoningmicrosoft$0.075$0.3128K
Qwen--Qwen3-32B-TEEchutes$0.08$0.2440K
gpt-oss-120bclarifai$0.09$0.36131K
+ +

👁️ Tool Calling + Vision

+

Models with tool calling and image understanding — for agents that need to see and act.

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderInput $/1MOutput $/1MContext
Qwen--Qwen3.6-35B-A3Bneuralwatt$0.05$0.1?
qwen3.6-35b-fastneuralwatt$0.05$0.1?
openai--gpt-oss-120bnovitaai$0.05$0.25131K
amazon-nova-liteamazon$0.06$0.24300K
amazon-nova-liteamazon-bedrock$0.06$0.24300K
Nemotron-3-Nano-Omninebius$0.06$0.24128K
openai--gpt-5-nanoaimlapi$0.065$0.52400K
seed-1.6-flashbytedance$0.07$0.3262K
gemini-1.5-flash-8bgoogle$0.075$0.31M
gemini-1.5-flashgoogle$0.075$0.31M
gemini-2.0-flash-litegoogle$0.075$0.31M
gemini-2-0-flash-litegoogle-vertex$0.075$0.31M
microsoft-phi-4-mini-multimodalmicrosoft$0.08$0.32128K
qwen--qwen3-vl-8b-instructnovitaai$0.08$0.5131K
seed-2.0-minibytedance$0.1$0.4262K
+ +

📏 Tool Calling + Large Context (128K+)

+

+ Models with tool calling and large context windows — for agents processing long documents or + complex multi-step tasks. +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelProviderContextInput $/1MReasoning
ling-2.6-flashinclusionai262K$0.01
bdc-coderinferencenet131K$0.01
klusterai--Meta-Llama-3.1-8B-Instruct-Turboklusterai131K$0.015
granite-4.0-h-microcloudflare131K$0.017
llama-3.1-8b-instruct--fp-16inferencenet131K$0.02
schematron-3binferencenet131K$0.02
schematron-v3inferencenet131K$0.02
gpt-oss-20binferencenet131K$0.03
schematron-v2-turboinferencenet131K$0.03
qwen--qwen3-4b-fp8novitaai128K$0.03✅
liquid-ai--LFM2-24B-A2Btogetherai131K$0.03
amazon-nova-microamazon128K$0.035
amazon-nova-microamazon-bedrock128K$0.035
mistral-nemo-12b-instruct--fp-8inferencenet131K$0.0375
klusterai--Meta-Llama-3.3-70B-Instruct-Turboklusterai131K$0.038
+ +

📊 Methodology

+

+ All data is sourced from first-party APIs. Tool calling capability is defined by the + provider's own classification — models that support function/tool calling via their API. + Aggregator providers are excluded from ranking tables to avoid duplicate models. +

+ +

🔗 More Resources

+ + +

Small Language Models

+

🎯 AI Model Picker

+

⚡ GitHub Action

+ + + diff --git a/site/twitter-thread.md b/site/twitter-thread.md new file mode 100644 index 00000000..336f66c3 --- /dev/null +++ b/site/twitter-thread.md @@ -0,0 +1,91 @@ +# Twitter/X Thread Template + +## Thread: AI Models Catalog Launch + +1/ 🤯 I just cataloged every major AI model on the market. + +4,587 models. 95 providers. All with pricing, context windows, and capabilities. + +And it's all open source. Let me show you what I built 👇 + +2/ The problem: Every week a new AI model launches. Every month a new provider. + +Keeping track of pricing, context windows, and capabilities across 95 websites is impossible. + +So I automated it. All data scraped from first-party APIs. + +3/ Every model has structured YAML with: + +- 💰 Pricing (input, output, cache) +- 📏 Context window & max output +- 🔧 Tool calling, reasoning, structured output +- 👁️ Vision, audio, video capabilities +- 🆓 Free/open weights status + +4/ The numbers: + +- 4,587 models across 95 providers +- 2,350 with tool calling +- 1,306 reasoning models +- 81 completely free +- 527 with open weights + +5/ But here's the best part — the interactive catalog: + +🔍 Search and filter 4,587 models +💰 Price calculator — enter your tokens/month, see monthly costs +🎯 Model picker — answer 2 questions, get top 5 recommendations +⚖️ Side-by-side comparison of any 2-3 models + +Try it: i-need-token.github.io/ai-models + +6/ Need the cheapest model with 128K+ context and tool calling? + +Or the best free model for coding? + +The Model Picker answers these in 2 clicks. + +7/ All data is machine-readable: + +- YAML source with TypeScript types + Zod validation +- JSON & CSV downloads +- npm package (npm install ai-models) +- GitHub Action for CI/CD +- Hugging Face dataset + +8/ 68 documentation pages covering: + +- Free models guide (81 free models!) 
+- OpenAI alternatives (70+ compatible providers) +- Agentic models (1,080 with tool calling + reasoning) +- Code models, vision models, audio models +- Pricing comparison, context windows, and more + +9/ Quick start: + +curl -sL https://github.com/i-need-token/ai-models/releases/latest/download/models.json | jq '.models | length' + +# → 4587 + +Or as a GitHub Action: + +- uses: i-need-token/ai-models@v0.2.0 + +10/ If you're building with AI models, this saves you hours of research. + +⭐ Star the repo: github.com/i-need-token/ai-models +🔍 Try the catalog: i-need-token.github.io/ai-models +📖 Read the docs: github.com/i-need-token/ai-models/tree/main/docs + +What would you like to see next? 🙏 + +--- + +## Single Tweet Version + +I built a catalog of 4,587 AI models across 95 providers — all with structured pricing, context windows, and capabilities. + +Free, open source, machine-readable. With an interactive catalog that has a price calculator, model picker, and comparison tool. 
+ +⭐ github.com/i-need-token/ai-models +🔍 i-need-token.github.io/ai-models diff --git a/social-preview.svg b/social-preview.svg new file mode 100644 index 00000000..5b7a630a --- /dev/null +++ b/social-preview.svg @@ -0,0 +1,84 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + 🤖 + + + AI Models Catalog + + + The most comprehensive structured catalog of AI models on GitHub + + + + 4,587 + Models + + + 95 + Providers + + + 2,350 + Tool Calling + + + 1,306 + Reasoning + + + 81 + Free + + + + Pricing + + + Context Windows + + + Modalities + + + Open Weights + + + Cached Pricing + + + + ✓ First-Party Data Only · Zod Validation + + + npm · CDN · CSV · GitHub Action · Hugging Face + + + + $ npm install ai-models + + + + \ No newline at end of file diff --git a/tsconfig.build.json b/tsconfig.build.json new file mode 100644 index 00000000..f06717bb --- /dev/null +++ b/tsconfig.build.json @@ -0,0 +1,21 @@ +{ + "compilerOptions": { + "target": "ES2022", + "module": "ES2022", + "moduleResolution": "bundler", + "strict": true, + "noUncheckedIndexedAccess": true, + "noUnusedLocals": true, + "noUnusedParameters": true, + "noFallthroughCasesInSwitch": true, + "noPropertyAccessFromIndexSignature": true, + "exactOptionalPropertyTypes": true, + "esModuleInterop": true, + "skipLibCheck": true, + "declaration": true, + "emitDeclarationOnly": true, + "outDir": "dist", + "rootDir": "types" + }, + "include": ["types"] +}