{
  "$schema": "https://ishard.us/schemas/agents-manifest.v1.json",
  "manifest_version": "1.0",
  "name": "iShard",
  "operator": {
    "legal_name": "iJarvis LLC",
    "country": "US",
    "region": "FL",
    "locality": "Tampa",
    "contact_email": "hello@ijarvis.ai"
  },
  "service": {
    "category": "gpu_inference",
    "description": "Boutique Blackwell-first GPU inference. Serverless per-token, hourly per-node reservations, and monthly private fleet contracts.",
    "regions": ["us-fl-tampa-1"],
    "single_site": true,
    "single_operator": true,
    "data_residency": ["US"]
  },
  "endpoints": {
    "homepage": "https://ishard.us/",
    "pricing_machine": "https://ishard.us/pricing.json",
    "fleet_machine": "https://ishard.us/fleet.json",
    "llms_digest": "https://ishard.us/llms.txt",
    "ai_policy": "https://ishard.us/ai.txt",
    "mcp_descriptor": "https://ishard.us/.well-known/mcp.json",
    "status_page": "https://status.ishard.us/",
    "docs": "https://docs.ishard.us/",
    "api_base": "https://api.ishard.us/v1/",
    "openai_compatible_base": "https://api.ishard.us/v1/",
    "support": "mailto:hello@ijarvis.ai"
  },
  "api": {
    "openai_compatible": true,
    "auth": {
      "scheme": "bearer",
      "header": "Authorization",
      "token_prefix": "Bearer ",
      "obtain_via": "mailto:hello@ijarvis.ai?subject=iShard%20API%20key"
    },
    "rate_limit": {
      "open_shard_default_rpm": 600,
      "dedicated_shard": "node_capped"
    },
    "available_endpoints": [
      {"method": "POST", "path": "/v1/chat/completions", "openai_compatible": true},
      {"method": "POST", "path": "/v1/completions", "openai_compatible": true},
      {"method": "POST", "path": "/v1/embeddings", "openai_compatible": true},
      {"method": "GET",  "path": "/v1/models"},
      {"method": "GET",  "path": "/v1/usage"},
      {"method": "POST", "path": "/v1/reservations", "description": "Create a Dedicated Shard reservation. Returns a single-use Stripe payment link."},
      {"method": "GET",  "path": "/v1/reservations/{id}"},
      {"method": "DELETE", "path": "/v1/reservations/{id}"}
    ],
    "ga_target": "2026-Q3"
  },
  "payment": {
    "supported_methods": ["stripe_payment_link"],
    "agent_friendly": true,
    "single_use_payment_link": true,
    "card_data_required_from_agent": false,
    "settlement_trigger": "On payment success, iShard issues a per-tenant Tailscale ACL and a scoped base_url. The agent's caller (or a delegated human) approves the payment link.",
    "experimental": {
      "x402_status": "tracking",
      "acp_status": "tracking",
      "stripe_pay_by_agent": "tracking"
    }
  },
  "tiers": [
    {
      "id": "open_shard",
      "billing": "per_token",
      "currency": "USD",
      "tokens_unit": 1000000,
      "models": [
        {"alias": "llama-3.3-70b", "class": "70B", "price_in": 0.55, "price_out": 0.55, "max_context_tokens": 131072, "hf_id": "meta-llama/Llama-3.3-70B-Instruct"},
        {"alias": "deepseek-v3", "class": "MoE", "price_in": 1.10, "price_out": 1.10, "max_context_tokens": 131072, "hf_id": "deepseek-ai/DeepSeek-V3"},
        {"alias": "llama-3.1-405b", "class": "405B", "price_in": 2.80, "price_out": 2.80, "max_context_tokens": 131072, "hf_id": "meta-llama/Meta-Llama-3.1-405B-Instruct"}
      ],
      "custom_checkpoint_surcharge_pct": 15,
      "sla": "best_effort"
    },
    {
      "id": "dedicated_shard",
      "billing": "per_hour",
      "currency": "USD",
      "node_classes": [
        {"class": "rtx_5090", "vram_gb": 32, "price_per_hour": 1.50},
        {"class": "spark", "vram_gb": 128, "uma": true, "price_per_hour": 2.50},
        {"class": "rtx_pro_6000", "vram_gb": 96, "price_per_hour": 3.50},
        {"class": "spark_pair", "vram_gb": 256, "uma": true, "price_per_hour": 4.75}
      ],
      "minimum_hours": 1,
      "sla": "best_effort_99_0_during_window"
    },
    {
      "id": "private_fleet",
      "billing": "monthly",
      "currency": "USD",
      "discount_vs_hourly_pct": [30, 40],
      "minimum_term_months": 6,
      "max_nodes": 5,
      "sla": "negotiated",
      "intake": "mailto:hello@ijarvis.ai?subject=iShard%20Private%20Fleet"
    }
  ],
  "compliance": {
    "soc2": null,
    "hipaa_baa": null,
    "encryption_in_transit": "TLS 1.3",
    "encryption_at_rest": "LUKS / dm-crypt on production volumes",
    "data_residency_default": "US",
    "data_residency_written_into_contract_tier": "private_fleet",
    "customer_payload_used_for_training": false
  },
  "honest_disclosures": [
    "Single physical site until Q4 2026 multi-site rollout.",
    "Single human operator. Disclosed in SLA.",
    "No 99.x uptime commitment on Open Shard tier.",
    "Not price-leader on per-token; positioned on dedication, hardware tier, and operator access."
  ],
  "last_updated": "2026-05-07"
}
