{"version":1,"name":"GEDX402 Media","serviceName":"GEDX402 Media","tags":["vision","audio","tts","asr","usdc","multi-chain"],"iconUrl":"https://media.gedx402.com/favicon.svg","url":"https://media.gedx402.com","origin":"https://media.gedx402.com","role":"shard","shard":"GEDX402 Media","hub":"https://gedx402.com","openapi":"https://media.gedx402.com/openapi.json","llms_txt":"https://media.gedx402.com/llms.txt","agents_manifest":"https://media.gedx402.com/.well-known/agents.json","network":"base","payments":{"asset":"USDC","facilitator":"coinbase-cdp","networks":[{"id":"base","label":"Base","caip":"eip155:8453","asset":"USDC","family":"evm"},{"id":"polygon","label":"Polygon","caip":"eip155:137","asset":"USDC","family":"evm"},{"id":"arbitrum","label":"Arbitrum","caip":"eip155:42161","asset":"USDC","family":"evm"},{"id":"world","label":"World","caip":"eip155:480","asset":"USDC","family":"evm"},{"id":"solana","label":"Solana","caip":"solana:5eykt4UsFv8P8NJdTREpY1vzqKqZKvdp","asset":"USDC","family":"solana"}],"primary_network":"base"},"facilitator":"https://api.cdp.coinbase.com/platform/v2/x402","resources":["https://media.gedx402.com/v1/asr/flux","https://media.gedx402.com/v1/asr/nova-3","https://media.gedx402.com/v1/asr/smart-turn-v2","https://media.gedx402.com/v1/asr/whisper-large-v3-turbo","https://media.gedx402.com/v1/asr/whisper-tiny-en","https://media.gedx402.com/v1/speech/transcribe","https://media.gedx402.com/v1/tts/aura-1","https://media.gedx402.com/v1/tts/aura-2-en","https://media.gedx402.com/v1/tts/aura-2-es","https://media.gedx402.com/v1/tts/melotts","https://media.gedx402.com/v1/vision/describe","https://media.gedx402.com/v1/vision/llama-3.2-11b","https://media.gedx402.com/v1/caption/llava-1.5-7b-hf","https://media.gedx402.com/v1/caption/uform-gen2-qwen-500m","https://media.gedx402.com/v1/guard/llama-guard-3-8b","https://media.gedx402.com/v1/detect/detr-resnet-50"],"catalog_url":"https://media.gedx402.com/v1/models","demo_url":"https://media.gedx402.com/v1/de
mo","instructions":"Shard API with 16 paid routes. Full catalog at hub GET /v1/models. Pay per request with USDC on Base, Polygon, Arbitrum, World, Solana via x402 v2 (Coinbase CDP facilitator). Choose any listed network in the 402 accepts[] response.","ownershipProofs":["0xb3C2776cE3F99cb3366520c27b4aC5D436942Ab6","6X7E1kWxiDb9KMVBWpj1vhGLngaH9nBJS31YUyrG2mwq"],"pricing":{"formula":"max(floor, (neurons/1000)*NEURON_USD_RATE*MARKUP_MULTIPLIER+FACILITATOR_BUFFER_USD)","neuron_usd_rate":0.011,"markup_multiplier":2.5,"facilitator_buffer_usd":0.002},"routes":[{"path":"/v1/vision/describe","method":"POST","model":"@cf/meta/llama-3.2-11b-vision-instruct","kind":"vision","shard":"media","origin":"https://media.gedx402.com","summary":"Image Description","description":"Describe or answer questions about an image with Llama 3.2 11B Vision Instruct (@cf/meta/llama-3.2-11b-vision-instruct). POST image (base64) plus optional prompt; multimodal pricing includes image and text neurons.","discovery":true,"price_usd":0.33288,"price_display":"$0.333","estimated_neurons":12032,"worst_case_price_usd":0.8837324999999999,"worst_case_price_display":"$0.884"},{"path":"/v1/speech/transcribe","method":"POST","model":"@cf/openai/whisper","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Speech-to-Text","description":"Transcribe speech to text with Whisper (@cf/openai/whisper). POST audio (base64) or audio URL; returns transcript text billed by audio duration.","discovery":true,"price_usd":0.006,"price_display":"$0.0060","estimated_neurons":21,"worst_case_price_usd":0.007665,"worst_case_price_display":"$0.0077"},{"path":"/v1/guard/llama-guard-3-8b","method":"POST","model":"@cf/meta/llama-guard-3-8b","kind":"guard","shard":"media","origin":"https://media.gedx402.com","summary":"Llama Guard 3 8B Safety Guard","description":"Run safety moderation with Llama Guard 3 8B (@cf/meta/llama-guard-3-8b). 
POST messages or content to classify policy violations before downstream LLM calls.","discovery":true,"price_usd":0.01,"price_display":"$0.010","estimated_neurons":23,"worst_case_price_usd":0.01,"worst_case_price_display":"$0.010"},{"path":"/v1/vision/llama-3.2-11b","method":"POST","model":"@cf/meta/llama-3.2-11b-vision-instruct","kind":"vision","shard":"media","origin":"https://media.gedx402.com","summary":"Llama 3.2 11B Vision Instruct Image Description","description":"Describe or answer questions about an image with Llama 3.2 11B Vision Instruct (@cf/meta/llama-3.2-11b-vision-instruct). POST image (base64) plus optional prompt; multimodal pricing includes image and text neurons.","discovery":true,"price_usd":0.33288,"price_display":"$0.333","estimated_neurons":12032,"worst_case_price_usd":0.8837324999999999,"worst_case_price_display":"$0.884"},{"path":"/v1/tts/melotts","method":"POST","model":"@cf/myshell-ai/melotts","kind":"tts","shard":"media","origin":"https://media.gedx402.com","summary":"MeloTTS Text-to-Speech","description":"Synthesize speech from text with MeloTTS (@cf/myshell-ai/melotts). POST text; returns audio bytes billed by character count.","discovery":true,"price_usd":0.005,"price_display":"$0.0050","estimated_neurons":10,"worst_case_price_usd":0.005,"worst_case_price_display":"$0.0050"},{"path":"/v1/tts/aura-1","method":"POST","model":"@cf/deepgram/aura-1","kind":"tts","shard":"media","origin":"https://media.gedx402.com","summary":"Aura 1 Text-to-Speech","description":"Synthesize speech from text with Aura 1 (@cf/deepgram/aura-1). 
POST text; returns audio bytes billed by character count.","discovery":true,"price_usd":0.020755000000000003,"price_display":"$0.021","estimated_neurons":682,"worst_case_price_usd":0.1520125,"worst_case_price_display":"$0.152"},{"path":"/v1/tts/aura-2-en","method":"POST","model":"@cf/deepgram/aura-2-en","kind":"tts","shard":"media","origin":"https://media.gedx402.com","summary":"Aura 2 EN Text-to-Speech","description":"Synthesize speech from text with Aura 2 EN (@cf/deepgram/aura-2-en). POST text; returns audio bytes billed by character count.","discovery":true,"price_usd":0.03951,"price_display":"$0.040","estimated_neurons":1364,"worst_case_price_usd":0.302025,"worst_case_price_display":"$0.302"},{"path":"/v1/tts/aura-2-es","method":"POST","model":"@cf/deepgram/aura-2-es","kind":"tts","shard":"media","origin":"https://media.gedx402.com","summary":"Aura 2 ES Text-to-Speech","description":"Synthesize speech from text with Aura 2 ES (@cf/deepgram/aura-2-es). POST text; returns audio bytes billed by character count.","discovery":true,"price_usd":0.03951,"price_display":"$0.040","estimated_neurons":1364,"worst_case_price_usd":0.302025,"worst_case_price_display":"$0.302"},{"path":"/v1/asr/whisper-large-v3-turbo","method":"POST","model":"@cf/openai/whisper-large-v3-turbo","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Whisper Large V3 Turbo Speech-to-Text","description":"Transcribe speech to text with Whisper Large V3 Turbo (@cf/openai/whisper-large-v3-turbo). POST audio (base64) or audio URL; returns transcript text billed by audio duration.","discovery":true,"price_usd":0.006,"price_display":"$0.0060","estimated_neurons":24,"worst_case_price_usd":0.008435,"worst_case_price_display":"$0.0084"},{"path":"/v1/asr/nova-3","method":"POST","model":"@cf/deepgram/nova-3","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Nova 3 Speech-to-Text","description":"Transcribe speech to text with Nova 3 (@cf/deepgram/nova-3). 
POST audio (base64) or audio URL; returns transcript text billed by audio duration.","discovery":true,"price_usd":0.008517499999999999,"price_display":"$0.0085","estimated_neurons":237,"worst_case_price_usd":0.06700999999999999,"worst_case_price_display":"$0.067"},{"path":"/v1/asr/flux","method":"POST","model":"@cf/deepgram/flux","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Flux Speech-to-Text","description":"Conversational speech recognition with Flux (@cf/deepgram/flux) for voice agents. WebSocket-only: GET with Upgrade and query params encoding (linear16) and sample_rate (Hz); stream PCM audio and receive turn events. Billed by audio duration.","discovery":true,"price_usd":0.011625,"price_display":"$0.012","estimated_neurons":350,"worst_case_price_usd":0.09825,"worst_case_price_display":"$0.098"},{"path":"/v1/asr/smart-turn-v2","method":"POST","model":"@cf/pipecat-ai/smart-turn-v2","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Smart Turn V2 Turn Detection","description":"Detect whether a speaker has finished their turn with Smart Turn V2 (@cf/pipecat-ai/smart-turn-v2), an audio turn-detection model rather than a transcriber. POST audio (base64) or audio URL; returns an end-of-turn prediction billed by audio duration.","discovery":true,"price_usd":0.0020275000000000002,"price_display":"$0.0020","estimated_neurons":1,"worst_case_price_usd":0.0020825,"worst_case_price_display":"$0.0021"},{"path":"/v1/detect/detr-resnet-50","method":"POST","model":"@cf/facebook/detr-resnet-50","kind":"detect","shard":"media","origin":"https://media.gedx402.com","summary":"DETR ResNet-50 Object Detection","description":"Detect objects in an image with DETR ResNet-50 (@cf/facebook/detr-resnet-50). 
POST base64 image; returns bounding boxes and labels.","discovery":true,"price_usd":0.0042,"price_display":"$0.0042","estimated_neurons":80,"worst_case_price_usd":0.0042,"worst_case_price_display":"$0.0042"},{"path":"/v1/caption/llava-1.5-7b-hf","method":"POST","model":"@cf/llava-hf/llava-1.5-7b-hf","kind":"caption","shard":"media","origin":"https://media.gedx402.com","summary":"LLaVA 1.5 7B HF Image Captioning","description":"Generate a natural-language caption for an image with LLaVA 1.5 7B HF (@cf/llava-hf/llava-1.5-7b-hf). POST image data; returns descriptive text.","discovery":true,"price_usd":0.22307249999999998,"price_display":"$0.223","estimated_neurons":8039,"worst_case_price_usd":0.5541175,"worst_case_price_display":"$0.554"},{"path":"/v1/caption/uform-gen2-qwen-500m","method":"POST","model":"@cf/unum/uform-gen2-qwen-500m","kind":"caption","shard":"media","origin":"https://media.gedx402.com","summary":"UForm Gen2 Qwen 500M Image Captioning","description":"Generate a natural-language caption for an image with UForm Gen2 Qwen 500M (@cf/unum/uform-gen2-qwen-500m). POST image data; returns descriptive text.","discovery":true,"price_usd":0.13993999999999998,"price_display":"$0.140","estimated_neurons":5016,"worst_case_price_usd":0.41537999999999997,"worst_case_price_display":"$0.415"},{"path":"/v1/asr/whisper-tiny-en","method":"POST","model":"@cf/openai/whisper-tiny-en","kind":"audio","shard":"media","origin":"https://media.gedx402.com","summary":"Whisper Tiny EN Speech-to-Text","description":"Transcribe speech to text with Whisper Tiny EN (@cf/openai/whisper-tiny-en). POST audio (base64) or audio URL; returns transcript text billed by audio duration.","discovery":true,"price_usd":0.003,"price_display":"$0.0030","estimated_neurons":21,"worst_case_price_usd":0.007665,"worst_case_price_display":"$0.0077"}],"paid_route_count":16,"discovery_route_count":16,"discovery_omitted_slug_count":75}