{
  "generated_at": "2026-04-24T15:01:35.625676+00:00",
  "slug": "inference-surf-cascade-fyi-v1-chat-completions",
  "title": "Surf Inference \u00b7 LLM Chat Completions",
  "url": "https://inference.surf.cascade.fyi/v1/chat/completions",
  "category": "ai",
  "summary": "Generates chat completions via OpenAI-compatible endpoint supporting multiple LLM models with configurable parameters.",
  "seo": {
    "title": "OpenAI-Compatible LLM API | Surf Inference x402",
    "description": "OpenAI-compatible chat completions API with x402 micropayments. Pay 0.001 USDC per call on Base or Solana. Access Kimi, MiniMax, Qwen models."
  },
  "use_cases": [
    "Generate text responses for agent conversations",
    "Create embeddings and completions without API keys",
    "Access Chinese and multilingual LLMs programmatically",
    "Build chatbots with pay-per-use cost structure"
  ],
  "ideal_buyer": "AI agent developers seeking OpenAI-compatible inference with micropayment flexibility and multi-model access.",
  "example_prompt": "Generate a completion for 'Explain quantum computing in 3 sentences' using moonshotai/kimi-k2.5 with max 100 tokens.",
  "example_request_body": {
    "model": "moonshotai/kimi-k2.5",
    "messages": [
      {
        "role": "user",
        "content": "Explain quantum computing in 3 sentences"
      }
    ],
    "max_tokens": 100
  },
  "risk_notes": [],
  "pricing_sanity": {
    "flag": "cheap_outlier",
    "ratio": 0.1,
    "median_category_atomic": 10000
  },
  "pricing_review_required": false,
  "pricing_decimal_suspect": false,
  "trust_tier": "indexed_external",
  "accepts": [
    {
      "scheme": "exact",
      "network": "solana",
      "pay_to": "E7BFB4ucyNsa8K52uQsCyKgw4Dg9vHA5mo73W6aWTNZY",
      "asset": "EPjFWdd5AufqSSqeM2qN1xzybapC8G4wEGGkZwyTDt1v",
      "max_amount_required_atomic": "1000",
      "max_timeout_seconds": 300,
      "verified": false,
      "hints": {
        "input": {
          "body": {
            "required": [
              "model",
              "messages"
            ],
            "properties": {
              "model": {
                "type": "string",
                "description": "Model identifier. Available: moonshotai/kimi-k2.5, minimax/minimax-m2.5, qwen/qwen-2.5-7b-instruct, anthropic/claude-sonnet-4.5, anthropic/claude-sonnet-4.6, anthropic/claude-opus-4.5, anthropic/claude-opus-4.6, minimax/minimax-m2.7, z-ai/glm-5, x-ai/grok-4.1-fast, x-ai/grok-4.20-beta, x-ai/grok-4.20-multi-agent-beta, x-ai/grok-4.1-fast:online, x-ai/grok-4.20-beta:online, x-ai/grok-4.20-multi-agent-beta:online"
              },
              "stream": {
                "type": "boolean",
                "description": "Enable SSE streaming"
              },
              "messages": {
                "type": "array",
                "items": {
                  "type": "object",
                  "properties": {
                    "role": {
                      "enum": [
                        "user",
                        "assistant",
                        "system"
                      ],
                      "type": "string"
                    },
                    "content": {
                      "type": "string"
                    }
                  }
                },
                "description": "Chat messages"
              },
              "max_tokens": {
                "type": "number",
                "description": "Max tokens to generate"
              },
              "temperature": {
                "type": "number",
                "description": "Sampling temperature (0-2)"
              }
            }
          },
          "type": "http",
          "method": "POST",
          "bodyType": "json"
        },
        "output": {
          "type": "json",
          "example": {
            "id": "chatcmpl-abc123",
            "usage": {
              "total_tokens": 30,
              "prompt_tokens": 10,
              "completion_tokens": 20
            },
            "choices": [
              {
                "index": 0,
                "message": {
                  "role": "assistant",
                  "content": "Hello! How can I help?"
                },
                "finish_reason": "stop"
              }
            ]
          }
        }
      }
    },
    {
      "scheme": "exact",
      "network": "base",
      "pay_to": "0xdd6090df24e88caf558839584dd53bcef79c6338",
      "asset": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913",
      "max_amount_required_atomic": "1000",
      "max_timeout_seconds": 300,
      "verified": false,
      "hints": {
        "input": {
          "body": {
            "required": [
              "model",
              "messages"
            ],
            "properties": {
              "model": {
                "type": "string",
                "description": "Model identifier. Available: moonshotai/kimi-k2.5, minimax/minimax-m2.5, qwen/qwen-2.5-7b-instruct, anthropic/claude-sonnet-4.5, anthropic/claude-sonnet-4.6, anthropic/claude-opus-4.5, anthropic/claude-opus-4.6, minimax/minimax-m2.7, z-ai/glm-5, x-ai/grok-4.1-fast, x-ai/grok-4.20-beta, x-ai/grok-4.20-multi-agent-beta, x-ai/grok-4.1-fast:online, x-ai/grok-4.20-beta:online, x-ai/grok-4.20-multi-agent-beta:online"
              },
              "stream": {
                "type": "boolean",
                "description": "Enable SSE streaming"
              },
              "messages": {
                "type": "array",
                "items": {
                  "type": "object",
                  "properties": {
                    "role": {
                      "enum": [
                        "user",
                        "assistant",
                        "system"
                      ],
                      "type": "string"
                    },
                    "content": {
                      "type": "string"
                    }
                  }
                },
                "description": "Chat messages"
              },
              "max_tokens": {
                "type": "number",
                "description": "Max tokens to generate"
              },
              "temperature": {
                "type": "number",
                "description": "Sampling temperature (0-2)"
              }
            }
          },
          "type": "http",
          "method": "POST",
          "bodyType": "json"
        },
        "output": {
          "type": "json",
          "example": {
            "id": "chatcmpl-abc123",
            "usage": {
              "total_tokens": 30,
              "prompt_tokens": 10,
              "completion_tokens": 20
            },
            "choices": [
              {
                "index": 0,
                "message": {
                  "role": "assistant",
                  "content": "Hello! How can I help?"
                },
                "finish_reason": "stop"
              }
            ]
          }
        }
      }
    }
  ],
  "origin": {
    "slug": "inference-surf-cascade-fyi",
    "host": "inference.surf.cascade.fyi",
    "title": "Surf Inference",
    "description": "OpenAI-compatible LLM inference API with x402 or MPP micropayments.",
    "url": "https://inference.surf.cascade.fyi",
    "favicon": "https://inference.surf.cascade.fyi/favicon.svg"
  },
  "json_ld": {
    "@id": "https://x402all.com/resource/inference-surf-cascade-fyi-v1-chat-completions",
    "url": "https://x402all.com/resource/inference-surf-cascade-fyi-v1-chat-completions",
    "name": "Surf Inference \u00b7 LLM Chat Completions",
    "@type": "WebAPI",
    "offers": [
      {
        "url": "https://x402all.com/resource/inference-surf-cascade-fyi-v1-chat-completions",
        "@type": "Offer",
        "price": "0.001",
        "availability": "https://schema.org/InStock",
        "priceCurrency": "USDC",
        "priceSpecification": {
          "@type": "UnitPriceSpecification",
          "price": "0.001000",
          "unitText": "call",
          "priceCurrency": "USDC"
        },
        "eligibleCustomerType": "Agent",
        "additionalProperty": [
          {
            "@type": "PropertyValue",
            "name": "paymentNetwork",
            "value": "solana"
          },
          {
            "@type": "PropertyValue",
            "name": "paymentAsset",
            "value": "EPjFWdd5AufqSSqeM2qN1xzybapC8G4wEGGkZwyTDt1v"
          }
        ]
      },
      {
        "url": "https://x402all.com/resource/inference-surf-cascade-fyi-v1-chat-completions",
        "@type": "Offer",
        "price": "0.001",
        "availability": "https://schema.org/InStock",
        "priceCurrency": "USDC",
        "priceSpecification": {
          "@type": "UnitPriceSpecification",
          "price": "0.001000",
          "unitText": "call",
          "priceCurrency": "USDC"
        },
        "eligibleCustomerType": "Agent",
        "additionalProperty": [
          {
            "@type": "PropertyValue",
            "name": "paymentNetwork",
            "value": "base"
          },
          {
            "@type": "PropertyValue",
            "name": "paymentAsset",
            "value": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913"
          }
        ]
      }
    ],
    "sameAs": "https://inference.surf.cascade.fyi/v1/chat/completions",
    "@context": "https://schema.org",
    "provider": {
      "@id": "https://x402all.com/server/inference-surf-cascade-fyi",
      "url": "https://inference.surf.cascade.fyi",
      "name": "Surf Inference",
      "@type": "Organization"
    },
    "identifier": "inference-surf-cascade-fyi-v1-chat-completions",
    "description": "OpenAI-compatible chat completions API with x402 micropayments. Pay 0.001 USDC per call on Base or Solana. Access Kimi, MiniMax, Qwen models.",
    "potentialAction": {
      "@type": "BuyAction",
      "target": "https://axon402.com/test-buy?resource=inference-surf-cascade-fyi-v1-chat-completions",
      "description": "Test-buy this endpoint on AXON"
    },
    "applicationCategory": "ai"
  },
  "axon_deep_link": "https://axon402.com/test-buy?resource=inference-surf-cascade-fyi-v1-chat-completions"
}
