{
  "$schema": "https://ishard.us/schemas/pricing.v1.json",
  "currency": "USD",
  "as_of": "2026-05-07",
  "tiers": {
    "open_shard": {
      "name": "Open Shard",
      "billing_unit": "per_million_tokens",
      "models": {
        "llama_3_3_70b": {"input": 0.55, "output": 0.55, "class": "70B", "max_context_tokens": 131072, "hf_id": "meta-llama/Llama-3.3-70B-Instruct"},
        "deepseek_v3":   {"input": 1.10, "output": 1.10, "class": "MoE", "max_context_tokens": 131072, "hf_id": "deepseek-ai/DeepSeek-V3"},
        "llama_3_1_405b":{"input": 2.80, "output": 2.80, "class": "405B", "max_context_tokens": 131072, "hf_id": "meta-llama/Meta-Llama-3.1-405B-Instruct"}
      },
      "modifiers": {
        "custom_checkpoint_surcharge_pct": 15
      },
      "signup_credit_usd": 10,
      "sla": "best_effort",
      "openai_compatible": true
    },
    "dedicated_shard": {
      "name": "Dedicated Shard",
      "billing_unit": "per_hour",
      "node_classes": {
        "rtx_5090":     {"vram_gb": 32,  "price_per_hour": 1.50, "available": true,  "count": 2},
        "spark":        {"vram_gb": 128, "price_per_hour": 2.50, "available": true,  "count": 2,  "uma": true, "fp4_native": true},
        "rtx_pro_6000": {"vram_gb": 96,  "price_per_hour": 3.50, "available": "partial", "count": 1, "anchor_tenant": "npcx"},
        "spark_pair":   {"vram_gb": 256, "price_per_hour": 4.75, "available": true,  "count": 1,  "uma": true, "linked": true}
      },
      "minimum_hours": 1,
      "sla": "best_effort_99_0_during_reserved_window"
    },
    "private_fleet": {
      "name": "Private Fleet",
      "billing_unit": "monthly_contract",
      "discount_vs_hourly_pct": {"min": 30, "max": 40},
      "minimum_term_months": 6,
      "max_nodes": 5,
      "onboarding_usd": 0,
      "sla": "negotiated",
      "data_residency_written_into_contract": "US",
      "intake": "mailto:hello@ijarvis.ai?subject=iShard%20Private%20Fleet"
    }
  },
  "notes": [
    "All prices in USD.",
    "Token prices are quoted per million tokens; each model's input and output rates are identical (flat).",
    "Hourly nodes have a one-hour minimum; usage beyond the first hour is billed per second.",
    "Pricing is reviewed quarterly. Existing reservations honor their booked rate."
  ],
  "contact": "hello@ijarvis.ai"
}
