{
  "generated_at": "2026-04-24T15:01:35.625676+00:00",
  "slug": "cnvrt-ing-api-transcribe-file",
  "title": "CNVRT \u00b7 Audio/Video File Transcription",
  "url": "https://cnvrt.ing/api/transcribe-file",
  "category": "media",
  "summary": "Convert uploaded audio or video files to text transcription with optional timestamp markers.",
  "seo": {
    "title": "CNVRT Transcription API | x402 Speech-to-Text",
    "description": "Transcribe audio and video files to text via x402. 0.025 USDC per file. Multilingual transcription with optional timestamps on Base."
  },
  "use_cases": [
    "Transcribe meeting recordings for automated note generation",
    "Convert podcast episodes to searchable text archives",
    "Generate timestamped captions for video content analysis"
  ],
  "ideal_buyer": "Content processing agents and meeting automation systems requiring speech-to-text conversion.",
  "example_prompt": "Transcribe this podcast file to text with timestamps included.",
  "example_request_body": {
    "media": "file_upload",
    "language": "en",
    "includeTimestamps": true
  },
  "risk_notes": [
    "Accepts multipart uploads \u2014 validate file-size + content-type limits on the caller side."
  ],
  "pricing_sanity": {
    "flag": "cheap",
    "ratio": 0.312,
    "median_category_atomic": 80000
  },
  "pricing_review_required": false,
  "pricing_decimal_suspect": false,
  "trust_tier": "indexed_external",
  "accepts": [
    {
      "scheme": "exact",
      "network": "base",
      "pay_to": "0xfad67ce5a834e68d5533ba7ac08619ff82a42084",
      "asset": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913",
      "max_amount_required_atomic": "25000",
      "max_timeout_seconds": 60,
      "mime_type": "multipart/form-data",
      "description": "Transcribe uploaded audio/video files to text. Payment via USDC on base.",
      "verified": false,
      "hints": {
        "input": {
          "type": "http",
          "method": "POST"
        },
        "output": {
          "input": {
            "type": "http",
            "method": "POST",
            "bodyType": "multipart-form-data",
            "bodyFields": {
              "media": {
                "type": "binary",
                "required": true,
                "description": "Audio or video file to transcribe (multipart upload)"
              },
              "language": {
                "type": "string",
                "required": false,
                "description": "Language code (ISO 639-1) for better accuracy"
              },
              "includeTimestamps": {
                "type": "boolean",
                "required": false,
                "description": "Include timestamp markers in the transcription"
              }
            }
          },
          "output": {
            "type": "object",
            "required": [
              "success",
              "transcription"
            ],
            "properties": {
              "jobId": {
                "type": "string",
                "description": "Unique job identifier"
              },
              "success": {
                "type": "boolean",
                "description": "Whether the transcription was successful"
              },
              "duration": {
                "type": "number",
                "description": "Duration of the media in seconds"
              },
              "language": {
                "type": "string",
                "description": "Detected or specified language"
              },
              "wordCount": {
                "type": "number",
                "description": "Number of words in transcription"
              },
              "timestamps": {
                "type": "array",
                "items": {
                  "type": "object",
                  "properties": {
                    "end": {
                      "type": "number",
                      "description": "End time in seconds"
                    },
                    "text": {
                      "type": "string",
                      "description": "Text for this segment"
                    },
                    "start": {
                      "type": "number",
                      "description": "Start time in seconds"
                    }
                  }
                },
                "description": "Array of timestamped segments (if requested)"
              },
              "transcription": {
                "type": "string",
                "description": "Full text transcription of the media"
              }
            }
          }
        }
      }
    }
  ],
  "origin": {
    "slug": "cnvrt-ing",
    "host": "cnvrt.ing",
    "title": "CNVRT - Perception Layer for Autonomous Systems",
    "description": "We're not building agents.... we're waking them up.",
    "url": "https://cnvrt.ing",
    "og_image": "https://cnvrt.ing/assets/cnvrt.png",
    "favicon": "https://cnvrt.ing/assets/favicon.ico"
  },
  "json_ld": {
    "@id": "https://x402all.com/resource/cnvrt-ing-api-transcribe-file",
    "url": "https://x402all.com/resource/cnvrt-ing-api-transcribe-file",
    "name": "CNVRT \u00b7 Audio/Video File Transcription",
    "@type": "WebAPI",
    "offers": {
      "url": "https://x402all.com/resource/cnvrt-ing-api-transcribe-file",
      "@type": "Offer",
      "price": "0.025",
      "availability": "https://schema.org/InStock",
      "priceCurrency": "USDC",
      "priceSpecification": {
        "@type": "UnitPriceSpecification",
        "price": "0.025000",
        "unitText": "call",
        "priceCurrency": "USDC"
      },
      "eligibleCustomerType": "Agent",
      "additionalProperty": [
        {
          "@type": "PropertyValue",
          "name": "paymentNetwork",
          "value": "base"
        },
        {
          "@type": "PropertyValue",
          "name": "paymentAsset",
          "value": "0x833589fCD6eDb6E08f4c7C32D4f71b54bdA02913"
        }
      ]
    },
    "sameAs": "https://cnvrt.ing/api/transcribe-file",
    "@context": "https://schema.org",
    "provider": {
      "@id": "https://x402all.com/server/cnvrt-ing",
      "url": "https://cnvrt.ing",
      "name": "CNVRT - Perception Layer for Autonomous Systems",
      "@type": "Organization"
    },
    "identifier": "cnvrt-ing-api-transcribe-file",
    "description": "Transcribe audio and video files to text via x402. 0.025 USDC per file. Multilingual transcription with optional timestamps on Base.",
    "potentialAction": {
      "@type": "BuyAction",
      "target": "https://axon402.com/test-buy?resource=cnvrt-ing-api-transcribe-file",
      "description": "Test-buy this endpoint on AXON"
    },
    "applicationCategory": "media"
  },
  "axon_deep_link": "https://axon402.com/test-buy?resource=cnvrt-ing-api-transcribe-file"
}
