{
  "generated_at": "2026-04-24T15:01:35.625676+00:00",
  "slug": "api-zeroreader-com-v1-ai-llama-8b",
  "title": "ZeroReader \u00b7 Llama 3.1 8B Fast Inference",
  "url": "https://api.zeroreader.com/v1/ai/llama-8b",
  "category": "ai",
  "summary": "Generate fast, cost-efficient text completions using Llama 3.1 8B with OpenAI-compatible chat format.",
  "seo": {
    "title": "Llama 3.1 8B API | Fast LLM Inference via x402",
    "description": "Fast Llama 3.1 8B inference with OpenAI-compatible API. Low-latency LLM completions via x402 micropayments."
  },
  "use_cases": [
    "Power high-volume agent conversations with low latency",
    "Route cost-sensitive tasks to efficient 8B model",
    "Build responsive chat interfaces with streaming",
    "Fallback from larger models for speed-critical paths"
  ],
  "ideal_buyer": "AI agent developers and applications that need fast, affordable LLM inference for high-volume or latency-sensitive workloads.",
  "example_prompt": "Summarize this paragraph in 10 words: 'The quick brown fox jumps over the lazy dog while the sun sets behind the mountains.'",
  "example_request_body": {
    "messages": [
      {
        "role": "user",
        "content": "Hello, how are you?"
      }
    ],
    "max_tokens": 256,
    "temperature": 0.7
  },
  "risk_notes": [],
  "pricing_sanity": {
    "flag": "cheap_outlier",
    "ratio": 0.1,
    "median_category_atomic": 20000
  },
  "pricing_review_required": false,
  "pricing_decimal_suspect": false,
  "trust_tier": "indexed_external",
  "accepts": [
    {
      "scheme": "exact",
      "network": "base",
      "pay_to": "0xca99149c1a5959f7e5968259178f974aacc70f55",
      "asset": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913",
      "max_amount_required_atomic": "2000",
      "max_timeout_seconds": 300,
      "mime_type": "application/json",
      "description": "Llama 3.1 8B (Fast) \u2014 Best value. Fast inference, solid quality.",
      "verified": false,
      "hints": {
        "input": {
          "method": "POST",
          "messages": [
            {
              "role": "user",
              "content": "Hello, how are you?"
            }
          ],
          "max_tokens": 256,
          "temperature": 0.7
        },
        "output": {
          "id": "chatcmpl-example",
          "object": "chat.completion",
          "choices": [
            {
              "index": 0,
              "message": {
                "role": "assistant",
                "content": "I'm doing well!"
              },
              "finish_reason": "stop"
            }
          ]
        }
      }
    }
  ],
  "duplicate_cluster_id": "data-cl-461b269291ba",
  "origin": {
    "slug": "api-zeroreader-com",
    "host": "api.zeroreader.com",
    "url": "https://api.zeroreader.com",
    "favicon": "https://zeroreader.com/icon.svg"
  },
  "json_ld": {
    "@id": "https://x402all.com/resource/api-zeroreader-com-v1-ai-llama-8b",
    "url": "https://x402all.com/resource/api-zeroreader-com-v1-ai-llama-8b",
    "name": "ZeroReader \u00b7 Llama 3.1 8B Fast Inference",
    "@type": "WebAPI",
    "offers": {
      "url": "https://x402all.com/resource/api-zeroreader-com-v1-ai-llama-8b",
      "@type": "Offer",
      "price": "0.002",
      "availability": "https://schema.org/InStock",
      "priceCurrency": "USDC",
      "priceSpecification": {
        "@type": "UnitPriceSpecification",
        "price": "0.002000",
        "unitText": "call",
        "priceCurrency": "USDC"
      },
      "eligibleCustomerType": "Agent",
      "additionalProperty": [
        {
          "@type": "PropertyValue",
          "name": "paymentNetwork",
          "value": "base"
        },
        {
          "@type": "PropertyValue",
          "name": "paymentAsset",
          "value": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913"
        }
      ]
    },
    "sameAs": "https://api.zeroreader.com/v1/ai/llama-8b",
    "@context": "https://schema.org",
    "provider": {
      "@id": "https://x402all.com/server/api-zeroreader-com",
      "url": "https://api.zeroreader.com",
      "name": "api.zeroreader.com",
      "@type": "Organization"
    },
    "identifier": "api-zeroreader-com-v1-ai-llama-8b",
    "description": "Fast Llama 3.1 8B inference with OpenAI-compatible API. Low-latency LLM completions via x402 micropayments.",
    "potentialAction": {
      "@type": "BuyAction",
      "target": "https://axon402.com/test-buy?resource=api-zeroreader-com-v1-ai-llama-8b",
      "description": "Test-buy this endpoint on AXON"
    },
    "applicationCategory": "ai"
  },
  "axon_deep_link": "https://axon402.com/test-buy?resource=api-zeroreader-com-v1-ai-llama-8b"
}