diff --git a/.changeset/llm-metadata-run-tags.md b/.changeset/llm-metadata-run-tags.md new file mode 100644 index 00000000000..85f04c363b8 --- /dev/null +++ b/.changeset/llm-metadata-run-tags.md @@ -0,0 +1,5 @@ +--- +"@trigger.dev/core": patch +--- + +Propagate run tags to span attributes so they can be extracted server-side for LLM cost attribution metadata. diff --git a/.server-changes/llm-cost-tracking.md b/.server-changes/llm-cost-tracking.md new file mode 100644 index 00000000000..7567aae7d1b --- /dev/null +++ b/.server-changes/llm-cost-tracking.md @@ -0,0 +1,6 @@ +--- +area: webapp +type: feature +--- + +Add automatic LLM cost calculation for spans with GenAI semantic conventions. When a span arrives with `gen_ai.response.model` and token usage data, costs are calculated from an in-memory pricing registry backed by Postgres and dual-written to both span attributes (`trigger.llm.*`) and a new `llm_metrics_v1` ClickHouse table that captures usage, cost, performance (TTFC, tokens/sec), and behavioral (finish reason, operation type) metrics. 
diff --git a/apps/webapp/app/assets/icons/AiProviderIcons.tsx b/apps/webapp/app/assets/icons/AiProviderIcons.tsx new file mode 100644 index 00000000000..85a01b98d63 --- /dev/null +++ b/apps/webapp/app/assets/icons/AiProviderIcons.tsx @@ -0,0 +1,177 @@ +type IconProps = { className?: string }; + +export function OpenAIIcon({ className }: IconProps) { + return ( + + + + ); +} + +export function AnthropicIcon({ className }: IconProps) { + return ( + + + + ); +} + +export function GeminiIcon({ className }: IconProps) { + return ( + + + + ); +} + +export function LlamaIcon({ className }: IconProps) { + return ( + + + + ); +} + +export function DeepseekIcon({ className }: IconProps) { + return ( + + + + + + + + + + + ); +} + +export function XAIIcon({ className }: IconProps) { + return ( + + + + + + + ); +} + +export function PerplexityIcon({ className }: IconProps) { + return ( + + + + ); +} + +export function CerebrasIcon({ className }: IconProps) { + return ( + + + + + + + + ); +} + +export function MistralIcon({ className }: IconProps) { + return ( + + + + + + + + + + + + + ); +} + +export function AzureIcon({ className }: IconProps) { + return ( + + + + ); +} + diff --git a/apps/webapp/app/assets/icons/AnthropicLogoIcon.tsx b/apps/webapp/app/assets/icons/AnthropicLogoIcon.tsx new file mode 100644 index 00000000000..3e647284cce --- /dev/null +++ b/apps/webapp/app/assets/icons/AnthropicLogoIcon.tsx @@ -0,0 +1,12 @@ +export function AnthropicLogoIcon({ className }: { className?: string }) { + return ( + + + + ); +} diff --git a/apps/webapp/app/components/code/QueryResultsChart.tsx b/apps/webapp/app/components/code/QueryResultsChart.tsx index 190304a1e9c..2c3f1c9f2bf 100644 --- a/apps/webapp/app/components/code/QueryResultsChart.tsx +++ b/apps/webapp/app/components/code/QueryResultsChart.tsx @@ -1209,9 +1209,19 @@ function createYAxisFormatter( formatDurationMilliseconds(value * 1000, { style: "short" }); } + if (format === "durationNs") { + return (value: number): 
string => + formatDurationMilliseconds(value / 1_000_000, { style: "short" }); + } + if (format === "costInDollars" || format === "cost") { return (value: number): string => { const dollars = format === "cost" ? value / 100 : value; + if (dollars === 0) return "$0"; + if (Math.abs(dollars) >= 1000) return `$${(dollars / 1000).toFixed(1)}K`; + if (Math.abs(dollars) >= 1) return `$${dollars.toFixed(2)}`; + if (Math.abs(dollars) >= 0.01) return `$${dollars.toFixed(4)}`; + if (Math.abs(dollars) >= 0.0001) return `$${dollars.toFixed(6)}`; return formatCurrencyAccurate(dollars); }; } diff --git a/apps/webapp/app/components/code/TSQLResultsTable.tsx b/apps/webapp/app/components/code/TSQLResultsTable.tsx index 3eb033c1d09..b2caf74dac6 100644 --- a/apps/webapp/app/components/code/TSQLResultsTable.tsx +++ b/apps/webapp/app/components/code/TSQLResultsTable.tsx @@ -81,6 +81,11 @@ function getFormattedValue(value: unknown, column: OutputColumnMetadata): string return formatDurationMilliseconds(value * 1000, { style: "short" }); } break; + case "durationNs": + if (typeof value === "number") { + return formatDurationMilliseconds(value / 1_000_000, { style: "short" }); + } + break; case "cost": if (typeof value === "number") { return formatCurrencyAccurate(value / 100); @@ -282,6 +287,12 @@ function getDisplayLength(value: unknown, column: OutputColumnMetadata): number return formatted.length; } return 10; + case "durationNs": + if (typeof value === "number") { + const formatted = formatDurationMilliseconds(value / 1_000_000, { style: "short" }); + return formatted.length; + } + return 10; case "cost": case "costInDollars": // Currency format: "$1,234.56" @@ -598,6 +609,15 @@ function CellValue({ ); } return {String(value)}; + case "durationNs": + if (typeof value === "number") { + return ( + + {formatDurationMilliseconds(value / 1_000_000, { style: "short" })} + + ); + } + return {String(value)}; case "cost": if (typeof value === "number") { return {formatCurrencyAccurate(value / 
100)}; diff --git a/apps/webapp/app/components/metrics/ModelsFilter.tsx b/apps/webapp/app/components/metrics/ModelsFilter.tsx new file mode 100644 index 00000000000..6250cd20c99 --- /dev/null +++ b/apps/webapp/app/components/metrics/ModelsFilter.tsx @@ -0,0 +1,159 @@ +import { CubeIcon } from "@heroicons/react/20/solid"; +import * as Ariakit from "@ariakit/react"; +import { type ReactNode, useMemo } from "react"; +import { AppliedFilter } from "~/components/primitives/AppliedFilter"; +import { + ComboBox, + SelectItem, + SelectList, + SelectPopover, + SelectProvider, + SelectTrigger, +} from "~/components/primitives/Select"; +import { useSearchParams } from "~/hooks/useSearchParam"; +import { appliedSummary, FilterMenuProvider } from "~/components/runs/v3/SharedFilters"; +import { tablerIcons } from "~/utils/tablerIcons"; +import tablerSpritePath from "~/components/primitives/tabler-sprite.svg"; +import { AnthropicLogoIcon } from "~/assets/icons/AnthropicLogoIcon"; + +const shortcut = { key: "m" }; + +export type ModelOption = { + model: string; + system: string; +}; + +interface ModelsFilterProps { + possibleModels: ModelOption[]; +} + +function modelIcon(system: string, model: string): ReactNode { + // For gateway/openrouter, derive provider from model prefix + let provider = system.split(".")[0]; + if (provider === "gateway" || provider === "openrouter") { + if (model.includes("/")) { + provider = model.split("/")[0].replace(/-/g, ""); + } + } + + // Special case: Anthropic uses a custom SVG icon + if (provider === "anthropic") { + return ; + } + + const iconName = `tabler-brand-${provider}`; + if (tablerIcons.has(iconName)) { + return ( + + + + ); + } + + return ; +} + +export function ModelsFilter({ possibleModels }: ModelsFilterProps) { + const { values, replace, del } = useSearchParams(); + const selectedModels = values("models"); + + if (selectedModels.length === 0 || selectedModels.every((v) => v === "")) { + return ( + + {(search, setSearch) => ( + } + 
variant="secondary/small" + shortcut={shortcut} + tooltipTitle="Filter by model" + > + Models + + } + searchValue={search} + clearSearchValue={() => setSearch("")} + possibleModels={possibleModels} + /> + )} + + ); + } + + return ( + + {(search, setSearch) => ( + }> + } + value={appliedSummary(selectedModels)} + onRemove={() => del(["models"])} + variant="secondary/small" + /> + + } + searchValue={search} + clearSearchValue={() => setSearch("")} + possibleModels={possibleModels} + /> + )} + + ); +} + +function ModelsDropdown({ + trigger, + clearSearchValue, + searchValue, + onClose, + possibleModels, +}: { + trigger: ReactNode; + clearSearchValue: () => void; + searchValue: string; + onClose?: () => void; + possibleModels: ModelOption[]; +}) { + const { values, replace } = useSearchParams(); + + const handleChange = (values: string[]) => { + clearSearchValue(); + replace({ models: values }); + }; + + const filtered = useMemo(() => { + return possibleModels.filter((m) => { + return m.model?.toLowerCase().includes(searchValue.toLowerCase()); + }); + }, [searchValue, possibleModels]); + + return ( + + {trigger} + { + if (onClose) { + onClose(); + return false; + } + return true; + }} + > + + + {filtered.map((m) => ( + + {m.model} + + ))} + {filtered.length === 0 && No models found} + + + + ); +} diff --git a/apps/webapp/app/components/runs/v3/RunIcon.tsx b/apps/webapp/app/components/runs/v3/RunIcon.tsx index 846d7cae0a4..572435f75c9 100644 --- a/apps/webapp/app/components/runs/v3/RunIcon.tsx +++ b/apps/webapp/app/components/runs/v3/RunIcon.tsx @@ -3,10 +3,25 @@ import { HandRaisedIcon, InformationCircleIcon, RectangleStackIcon, + SparklesIcon, Squares2X2Icon, TableCellsIcon, TagIcon, + WrenchIcon, } from "@heroicons/react/20/solid"; +import { AnthropicLogoIcon } from "~/assets/icons/AnthropicLogoIcon"; +import { + AnthropicIcon, + AzureIcon, + CerebrasIcon, + DeepseekIcon, + GeminiIcon, + LlamaIcon, + MistralIcon, + OpenAIIcon, + PerplexityIcon, + XAIIcon, +} from 
"~/assets/icons/AiProviderIcons"; import { AttemptIcon } from "~/assets/icons/AttemptIcon"; import { TaskIcon } from "~/assets/icons/TaskIcon"; import { cn } from "~/utils/cn"; @@ -112,6 +127,31 @@ export function RunIcon({ name, className, spanName }: TaskIconProps) { return ; case "streams": return ; + case "hero-sparkles": + return ; + case "hero-wrench": + return ; + case "tabler-brand-anthropic": + case "ai-provider-anthropic": + return ; + case "ai-provider-openai": + return ; + case "ai-provider-gemini": + return ; + case "ai-provider-llama": + return ; + case "ai-provider-deepseek": + return ; + case "ai-provider-xai": + return ; + case "ai-provider-perplexity": + return ; + case "ai-provider-cerebras": + return ; + case "ai-provider-mistral": + return ; + case "ai-provider-azure": + return ; } return ; diff --git a/apps/webapp/app/components/runs/v3/SpanTitle.tsx b/apps/webapp/app/components/runs/v3/SpanTitle.tsx index fb0105c45db..fe85fd70c9e 100644 --- a/apps/webapp/app/components/runs/v3/SpanTitle.tsx +++ b/apps/webapp/app/components/runs/v3/SpanTitle.tsx @@ -3,6 +3,8 @@ import { TaskEventStyle } from "@trigger.dev/core/v3"; import type { TaskEventLevel } from "@trigger.dev/database"; import { Fragment } from "react"; import { cn } from "~/utils/cn"; +import { tablerIcons } from "~/utils/tablerIcons"; +import tablerSpritePath from "~/components/primitives/tabler-sprite.svg"; type SpanTitleProps = { message: string; @@ -45,6 +47,15 @@ function SpanAccessory({ /> ); } + case "pills": { + return ( +
+ {accessory.items.map((item, index) => ( + + ))} +
+ ); + } default: { return (
@@ -59,6 +70,21 @@ function SpanAccessory({ } } +function SpanPill({ text, icon }: { text: string; icon?: string }) { + const hasIcon = icon && tablerIcons.has(icon); + + return ( + + {hasIcon && ( + + + + )} + {text} + + ); +} + export function SpanCodePathAccessory({ accessory, className, diff --git a/apps/webapp/app/components/runs/v3/ai/AIChatMessages.tsx b/apps/webapp/app/components/runs/v3/ai/AIChatMessages.tsx new file mode 100644 index 00000000000..9e5a799e1bc --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/AIChatMessages.tsx @@ -0,0 +1,317 @@ +import { CheckIcon, ClipboardDocumentIcon, CodeBracketSquareIcon } from "@heroicons/react/20/solid"; +import { lazy, Suspense, useState } from "react"; +import { CodeBlock } from "~/components/code/CodeBlock"; +import { Button } from "~/components/primitives/Buttons"; +import { Header3 } from "~/components/primitives/Headers"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import type { DisplayItem, ToolUse } from "./types"; + +// Lazy load streamdown to avoid SSR issues +const StreamdownRenderer = lazy(() => + import("streamdown").then((mod) => ({ + default: ({ children }: { children: string }) => ( + + {children} + + ), + })) +); + +export function AIChatMessages({ items }: { items: DisplayItem[] }) { + return ( +
+ {items.map((item, i) => { + switch (item.type) { + case "system": + return ; + case "user": + return ; + case "tool-use": + return ; + case "assistant": + return ; + } + })} +
+ ); +} + +// --------------------------------------------------------------------------- +// Section header (shared across all sections) +// --------------------------------------------------------------------------- + +function SectionHeader({ label, right }: { label: string; right?: React.ReactNode }) { + return ( +
+ {label} + {right &&
{right}
} +
+ ); +} + +export function ChatBubble({ children }: { children: React.ReactNode }) { + return ( +
+ {children} +
+ ); +} + +// --------------------------------------------------------------------------- +// System +// --------------------------------------------------------------------------- + +function SystemSection({ text }: { text: string }) { + const [expanded, setExpanded] = useState(false); + const isLong = text.length > 150; + const preview = isLong ? text.slice(0, 150) + "..." : text; + const displayText = expanded || !isLong ? text : preview; + + return ( +
+ setExpanded(!expanded)} + className="text-[10px] text-text-link hover:underline" + > + {expanded ? "Collapse" : "Expand"} + + ) : undefined + } + /> + + + {displayText}}> + {displayText} + + + +
+ ); +} + +// --------------------------------------------------------------------------- +// User +// --------------------------------------------------------------------------- + +function UserSection({ text }: { text: string }) { + return ( +
+ + + + {text}}> + {text} + + + +
+ ); +} + +// --------------------------------------------------------------------------- +// Assistant response (with markdown/raw toggle) +// --------------------------------------------------------------------------- + +function isJsonString(value: string): boolean { + const trimmed = value.trimStart(); + if (!trimmed.startsWith("{") && !trimmed.startsWith("[")) return false; + try { + JSON.parse(value); + return true; + } catch { + return false; + } +} + +export function AssistantResponse({ + text, + headerLabel = "Assistant", +}: { + text: string; + headerLabel?: string; +}) { + const isJson = isJsonString(text); + const [mode, setMode] = useState<"rendered" | "raw">("rendered"); + const [copied, setCopied] = useState(false); + + function handleCopy() { + navigator.clipboard.writeText(text); + setCopied(true); + setTimeout(() => setCopied(false), 2000); + } + + if (isJson) { + return ( +
+ + +
+ ); + } + + return ( +
+ + + +
+ } + /> + {mode === "rendered" ? ( + + + {text}}> + {text} + + + + ) : ( + + )} +
+ ); +} + +// --------------------------------------------------------------------------- +// Tool use (merged calls + results) +// --------------------------------------------------------------------------- + +function ToolUseSection({ tools }: { tools: ToolUse[] }) { + return ( +
+ +
+ {tools.map((tool) => ( + + ))} +
+
+ ); +} + +type ToolTab = "input" | "output" | "details"; + +function ToolUseRow({ tool }: { tool: ToolUse }) { + const hasInput = tool.inputJson !== "{}"; + const hasResult = !!tool.resultOutput; + const hasDetails = !!tool.description || !!tool.parametersJson; + + const availableTabs: ToolTab[] = [ + ...(hasInput ? (["input"] as const) : []), + ...(hasResult ? (["output"] as const) : []), + ...(hasDetails ? (["details"] as const) : []), + ]; + + const defaultTab: ToolTab | null = hasInput ? "input" : null; + const [activeTab, setActiveTab] = useState(defaultTab); + + function handleTabClick(tab: ToolTab) { + setActiveTab(activeTab === tab ? null : tab); + } + + return ( +
+
+ {tool.toolName} + {tool.resultSummary && ( + {tool.resultSummary} + )} +
+ + {availableTabs.length > 0 && ( + <> +
+ {availableTabs.map((tab) => ( + + ))} +
+ + {activeTab === "input" && hasInput && ( +
+ +
+ )} + + {activeTab === "output" && hasResult && ( +
+ +
+ )} + + {activeTab === "details" && hasDetails && ( +
+ {tool.description && ( +

{tool.description}

+ )} + {tool.parametersJson && ( +
+ + Parameters schema + + +
+ )} +
+ )} + + )} +
+ ); +} diff --git a/apps/webapp/app/components/runs/v3/ai/AIModelSummary.tsx b/apps/webapp/app/components/runs/v3/ai/AIModelSummary.tsx new file mode 100644 index 00000000000..62341fc9041 --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/AIModelSummary.tsx @@ -0,0 +1,113 @@ +import { formatCurrencyAccurate } from "~/utils/numberFormatter"; +import { Header3 } from "~/components/primitives/Headers"; +import type { AISpanData } from "./types"; + +export function AITagsRow({ aiData }: { aiData: AISpanData }) { + return ( +
+
+ + {aiData.provider !== "unknown" && } + {aiData.resolvedProvider && ( + + )} + {aiData.finishReason && } + {aiData.serviceTier && } + {aiData.toolChoice && } + {aiData.toolCount != null && aiData.toolCount > 0 && ( + + )} + {aiData.messageCount != null && ( + + )} + {aiData.telemetryMetadata && + Object.entries(aiData.telemetryMetadata).map(([key, value]) => ( + + ))} +
+
+ ); +} + +export function AIStatsSummary({ aiData }: { aiData: AISpanData }) { + return ( +
+ Stats +
+ + + {aiData.cachedTokens != null && aiData.cachedTokens > 0 && ( + + )} + {aiData.cacheCreationTokens != null && aiData.cacheCreationTokens > 0 && ( + + )} + {aiData.reasoningTokens != null && aiData.reasoningTokens > 0 && ( + + )} + + + {aiData.totalCost != null && ( + + )} + {aiData.msToFirstChunk != null && ( + + )} + {aiData.tokensPerSecond != null && ( + + )} +
+
+ ); +} + +function MetricRow({ + label, + value, + unit, + bold, +}: { + label: string; + value: string; + unit?: string; + bold?: boolean; +}) { + return ( +
+ {label} + + {value} + {unit && {unit}} + +
+ ); +} + +function formatTtfc(ms: number): string { + if (ms >= 10_000) { + return `${(ms / 1000).toFixed(1)}s`; + } + return `${Math.round(ms)}ms`; +} diff --git a/apps/webapp/app/components/runs/v3/ai/AISpanDetails.tsx b/apps/webapp/app/components/runs/v3/ai/AISpanDetails.tsx new file mode 100644 index 00000000000..0070c7ffe3c --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/AISpanDetails.tsx @@ -0,0 +1,225 @@ +import { CheckIcon, ClipboardDocumentIcon } from "@heroicons/react/20/solid"; +import { useState } from "react"; +import { Button } from "~/components/primitives/Buttons"; +import { Header3 } from "~/components/primitives/Headers"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import { TabButton, TabContainer } from "~/components/primitives/Tabs"; +import { useHasAdminAccess } from "~/hooks/useUser"; +import { CodeBlock } from "~/components/code/CodeBlock"; +import { AIChatMessages, AssistantResponse, ChatBubble } from "./AIChatMessages"; +import { AIStatsSummary, AITagsRow } from "./AIModelSummary"; +import { AIToolsInventory } from "./AIToolsInventory"; +import type { AISpanData, DisplayItem } from "./types"; + +type AITab = "overview" | "messages" | "tools"; + +export function AISpanDetails({ + aiData, + rawProperties, +}: { + aiData: AISpanData; + rawProperties?: string; +}) { + const [tab, setTab] = useState("overview"); + const isAdmin = useHasAdminAccess(); + const toolCount = aiData.toolCount ?? aiData.toolDefinitions?.length ?? 0; + + return ( +
+ {/* Tab bar */} +
+ + setTab("overview")} + shortcut={{ key: "o" }} + > + Overview + + setTab("messages")} + shortcut={{ key: "m" }} + > + Messages + + setTab("tools")} + shortcut={{ key: "t" }} + > + + Tools + {toolCount > 0 && ( + + {toolCount} + + )} + + + +
+ + {/* Tab content */} +
+ {tab === "overview" && } + {tab === "messages" && } + {tab === "tools" && } +
+ + {/* Footer: Copy raw (admin only) */} + {isAdmin && rawProperties && } +
+ ); +} + +function OverviewTab({ aiData }: { aiData: AISpanData }) { + const { userText, outputText, outputObject, outputToolNames } = extractInputOutput(aiData); + + return ( +
+ + + + {userText && ( +
+ Input + + {userText} + +
+ )} + + {outputText && } + {!outputText && outputObject && ( +
+ Output + +
+ )} + {outputToolNames.length > 0 && !outputText && !outputObject && ( +
+ Output + + + Called {outputToolNames.length === 1 ? "tool" : "tools"}:{" "} + {outputToolNames.join(", ")} + + +
+ )} +
+ ); +} + +function MessagesTab({ aiData }: { aiData: AISpanData }) { + const showFallbackText = aiData.responseText && !hasAssistantItem(aiData.items); + const showFallbackObject = + !showFallbackText && aiData.responseObject && !hasAssistantItem(aiData.items); + + return ( +
+
+ {aiData.items && aiData.items.length > 0 && } + {showFallbackText && } + {showFallbackObject && ( +
+ Assistant + +
+ )} +
+
+ ); +} + +function ToolsTab({ aiData }: { aiData: AISpanData }) { + return ; +} + +function CopyRawFooter({ rawProperties }: { rawProperties: string }) { + const [copied, setCopied] = useState(false); + + function handleCopy() { + navigator.clipboard.writeText(rawProperties); + setCopied(true); + setTimeout(() => setCopied(false), 2000); + } + + return ( +
+ +
+ ); +} + +// --------------------------------------------------------------------------- +// Helpers +// --------------------------------------------------------------------------- + +function extractInputOutput(aiData: AISpanData): { + userText: string | undefined; + outputText: string | undefined; + outputObject: string | undefined; + outputToolNames: string[]; +} { + let userText: string | undefined; + let outputText: string | undefined; + const outputToolNames: string[] = []; + + if (aiData.items) { + for (let i = aiData.items.length - 1; i >= 0; i--) { + if (aiData.items[i].type === "user") { + userText = (aiData.items[i] as { type: "user"; text: string }).text; + break; + } + } + + for (let i = aiData.items.length - 1; i >= 0; i--) { + const item = aiData.items[i]; + if (item.type === "assistant") { + outputText = item.text; + break; + } + if (item.type === "tool-use") { + for (const tool of item.tools) { + outputToolNames.push(tool.toolName); + } + break; + } + } + } + + if (!outputText && aiData.responseText) { + outputText = aiData.responseText; + } + + return { userText, outputText, outputObject: aiData.responseObject, outputToolNames }; +} + +function hasAssistantItem(items: DisplayItem[] | undefined): boolean { + if (!items) return false; + return items.some((item) => item.type === "assistant"); +} diff --git a/apps/webapp/app/components/runs/v3/ai/AIToolsInventory.tsx b/apps/webapp/app/components/runs/v3/ai/AIToolsInventory.tsx new file mode 100644 index 00000000000..a329698dd5e --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/AIToolsInventory.tsx @@ -0,0 +1,84 @@ +import { useState } from "react"; +import { CodeBlock } from "~/components/code/CodeBlock"; +import type { AISpanData, ToolDefinition } from "./types"; +import { Paragraph } from "~/components/primitives/Paragraph"; + +export function AIToolsInventory({ aiData }: { aiData: AISpanData }) { + const defs = aiData.toolDefinitions ?? 
[]; + const calledNames = getCalledToolNames(aiData); + + if (defs.length === 0) { + return ( +
+ No tool definitions available for this span. +
+ ); + } + + return ( +
+ {defs.map((def) => { + const wasCalled = calledNames.has(def.name); + return ; + })} +
+ ); +} + +function ToolDefRow({ def, wasCalled }: { def: ToolDefinition; wasCalled: boolean }) { + const [showSchema, setShowSchema] = useState(false); + + return ( +
+
+
+ {def.name} + {wasCalled ? "called" : "not called"} +
+ + {def.description && ( +

{def.description}

+ )} + + {def.parametersJson && ( +
+ + {showSchema && ( +
+ +
+ )} +
+ )} +
+ ); +} + +function getCalledToolNames(aiData: AISpanData): Set { + const names = new Set(); + if (!aiData.items) return names; + + for (const item of aiData.items) { + if (item.type === "tool-use") { + for (const tool of item.tools) { + names.add(tool.toolName); + } + } + } + + return names; +} diff --git a/apps/webapp/app/components/runs/v3/ai/extractAISpanData.ts b/apps/webapp/app/components/runs/v3/ai/extractAISpanData.ts new file mode 100644 index 00000000000..dbe9b61d952 --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/extractAISpanData.ts @@ -0,0 +1,513 @@ +import type { AISpanData, DisplayItem, ToolDefinition, ToolUse } from "./types"; + +/** + * Extracts structured AI span data from unflattened OTEL span properties. + * + * Works with the nested object produced by `unflattenAttributes()` — expects + * keys like `gen_ai.response.model`, `ai.prompt.messages`, `trigger.llm.total_cost`, etc. + * + * @param properties Unflattened span properties object + * @param durationMs Span duration in milliseconds + * @returns Structured AI data, or undefined if this isn't an AI generation span + */ +export function extractAISpanData( + properties: Record, + durationMs: number +): AISpanData | undefined { + const genAi = properties.gen_ai; + if (!genAi || typeof genAi !== "object") return undefined; + + const g = genAi as Record; + const ai = rec(properties.ai); + const trigger = rec(properties.trigger); + + const gResponse = rec(g.response); + const gRequest = rec(g.request); + const gUsage = rec(g.usage); + const gOperation = rec(g.operation); + const aiModel = rec(ai.model); + const aiResponse = rec(ai.response); + const aiPrompt = rec(ai.prompt); + const aiUsage = rec(ai.usage); + const triggerLlm = rec(trigger.llm); + + const model = str(gResponse.model) ?? str(gRequest.model) ?? str(aiModel.id); + if (!model) return undefined; + + // Prefer ai.usage (richer) over gen_ai.usage. 
+ // Gateway/some providers emit promptTokens/completionTokens instead of inputTokens/outputTokens. + const inputTokens = + num(aiUsage.inputTokens) ?? num(aiUsage.promptTokens) ?? num(gUsage.input_tokens) ?? 0; + const outputTokens = + num(aiUsage.outputTokens) ?? num(aiUsage.completionTokens) ?? num(gUsage.output_tokens) ?? 0; + const totalTokens = num(aiUsage.totalTokens) ?? inputTokens + outputTokens; + + const tokensPerSecond = + num(aiResponse.avgOutputTokensPerSecond) ?? + (outputTokens > 0 && durationMs > 0 + ? Math.round((outputTokens / (durationMs / 1000)) * 10) / 10 + : undefined); + + const toolDefs = parseToolDefinitions(aiPrompt.tools); + const providerMeta = parseProviderMetadata(aiResponse.providerMetadata); + const aiTelemetry = rec(ai.telemetry); + const telemetryMeta = extractTelemetryMetadata(aiTelemetry.metadata); + + return { + model, + provider: str(g.system) ?? "unknown", + operationName: str(gOperation.name) ?? str(ai.operationId) ?? "", + finishReason: str(aiResponse.finishReason), + serviceTier: providerMeta?.serviceTier, + resolvedProvider: providerMeta?.resolvedProvider, + toolChoice: parseToolChoice(aiPrompt.toolChoice), + toolCount: toolDefs?.length, + messageCount: countMessages(aiPrompt.messages), + telemetryMetadata: telemetryMeta, + inputTokens, + outputTokens, + totalTokens, + cachedTokens: num(aiUsage.cachedInputTokens) ?? num(gUsage.cache_read_input_tokens), + cacheCreationTokens: + num(aiUsage.cacheCreationInputTokens) ?? num(gUsage.cache_creation_input_tokens), + reasoningTokens: num(aiUsage.reasoningTokens) ?? 
num(gUsage.reasoning_tokens), + tokensPerSecond, + msToFirstChunk: num(aiResponse.msToFirstChunk), + durationMs, + inputCost: num(triggerLlm.input_cost), + outputCost: num(triggerLlm.output_cost), + totalCost: num(triggerLlm.total_cost), + responseText: str(aiResponse.text) || undefined, + responseObject: str(aiResponse.object) || undefined, + toolDefinitions: toolDefs, + items: buildDisplayItems(aiPrompt.messages, aiResponse.toolCalls, toolDefs), + }; +} + +// --------------------------------------------------------------------------- +// Primitive helpers +// --------------------------------------------------------------------------- + +function rec(v: unknown): Record { + return v && typeof v === "object" ? (v as Record) : {}; +} + +function str(v: unknown): string | undefined { + return typeof v === "string" ? v : undefined; +} + +function num(v: unknown): number | undefined { + return typeof v === "number" ? v : undefined; +} + +// --------------------------------------------------------------------------- +// Message → DisplayItem transformation +// --------------------------------------------------------------------------- + +type RawMessage = { + role: string; + content: unknown; + toolCallId?: string; + name?: string; +}; + +/** + * Build display items from prompt messages and optionally response tool calls. + * - Parses ai.prompt.messages and merges consecutive tool-call + tool-result pairs + * - If ai.response.toolCalls is present (finishReason=tool-calls), appends those too + */ +function buildDisplayItems( + messagesRaw: unknown, + responseToolCallsRaw: unknown, + toolDefs?: ToolDefinition[] +): DisplayItem[] | undefined { + const items = parseMessagesToDisplayItems(messagesRaw); + const responseToolCalls = parseResponseToolCalls(responseToolCallsRaw); + + if (!items && !responseToolCalls) return undefined; + + const result = items ?? 
[]; + + if (responseToolCalls && responseToolCalls.length > 0) { + result.push({ type: "tool-use", tools: responseToolCalls }); + } + + if (toolDefs && toolDefs.length > 0) { + const defsByName = new Map(toolDefs.map((d) => [d.name, d])); + for (const item of result) { + if (item.type === "tool-use") { + for (const tool of item.tools) { + const def = defsByName.get(tool.toolName); + if (def) { + tool.description = def.description; + tool.parametersJson = def.parametersJson; + } + } + } + } + } + + return result.length > 0 ? result : undefined; +} + +function parseMessagesToDisplayItems(raw: unknown): DisplayItem[] | undefined { + if (typeof raw !== "string") return undefined; + + let messages: RawMessage[]; + try { + const parsed = JSON.parse(raw); + if (!Array.isArray(parsed)) return undefined; + messages = parsed.map((item: unknown) => { + const m = rec(item); + return { + role: str(m.role) ?? "user", + content: m.content, + toolCallId: str(m.toolCallId), + name: str(m.name), + }; + }); + } catch { + return undefined; + } + + const items: DisplayItem[] = []; + let i = 0; + + while (i < messages.length) { + const msg = messages[i]; + + if (msg.role === "system") { + items.push({ type: "system", text: extractTextContent(msg.content) }); + i++; + continue; + } + + if (msg.role === "user") { + items.push({ type: "user", text: extractTextContent(msg.content) }); + i++; + continue; + } + + // Assistant message — check if it contains tool calls + if (msg.role === "assistant") { + const toolCalls = extractToolCalls(msg.content); + + if (toolCalls.length > 0) { + // Collect subsequent tool result messages that match these tool calls + const toolCallIds = new Set(toolCalls.map((tc) => tc.toolCallId)); + let j = i + 1; + while (j < messages.length && messages[j].role === "tool") { + j++; + } + // Gather tool result messages between i+1 and j + const toolResultMsgs = messages.slice(i + 1, j); + + // Build ToolUse entries by pairing calls with results + const tools: ToolUse[] 
= toolCalls.map((tc) => { + const resultMsg = toolResultMsgs.find((m) => { + // Match by toolCallId in the message's content parts + const results = extractToolResults(m.content); + return results.some((r) => r.toolCallId === tc.toolCallId); + }); + + const result = resultMsg + ? extractToolResults(resultMsg.content).find( + (r) => r.toolCallId === tc.toolCallId + ) + : undefined; + + return { + toolCallId: tc.toolCallId, + toolName: tc.toolName, + inputJson: JSON.stringify(tc.input, null, 2), + resultSummary: result?.summary, + resultOutput: result?.formattedOutput, + }; + }); + + items.push({ type: "tool-use", tools }); + i = j; // skip past the tool result messages + continue; + } + + // Assistant message with just text + const text = extractTextContent(msg.content); + if (text) { + items.push({ type: "assistant", text }); + } + i++; + continue; + } + + // Skip any other message types (tool messages that weren't consumed above) + i++; + } + + return items.length > 0 ? items : undefined; +} + +// --------------------------------------------------------------------------- +// Response tool calls (from ai.response.toolCalls, used when finishReason=tool-calls) +// --------------------------------------------------------------------------- + +/** + * Parse ai.response.toolCalls JSON string into ToolUse entries. + * These are tool calls the model requested but haven't been executed yet in this span. + */ +function parseResponseToolCalls(raw: unknown): ToolUse[] | undefined { + if (typeof raw !== "string") return undefined; + try { + const parsed = JSON.parse(raw); + if (!Array.isArray(parsed)) return undefined; + const tools: ToolUse[] = []; + for (const item of parsed) { + const tc = rec(item); + if (tc.type === "tool-call" || tc.toolName || tc.toolCallId) { + tools.push({ + toolCallId: str(tc.toolCallId) ?? "", + toolName: str(tc.toolName) ?? "", + inputJson: JSON.stringify( + tc.input && typeof tc.input === "object" ? 
tc.input : {}, + null, + 2 + ), + }); + } + } + return tools.length > 0 ? tools : undefined; + } catch { + return undefined; + } +} + +// --------------------------------------------------------------------------- +// Content part extraction +// --------------------------------------------------------------------------- + +function extractTextContent(content: unknown): string { + if (typeof content === "string") return content; + if (!Array.isArray(content)) return ""; + + const texts: string[] = []; + for (const raw of content) { + const p = rec(raw); + if (p.type === "text" && typeof p.text === "string") { + texts.push(p.text); + } else if (typeof p.text === "string") { + texts.push(p.text); + } + } + return texts.join("\n"); +} + +type ParsedToolCall = { + toolCallId: string; + toolName: string; + input: Record; +}; + +function extractToolCalls(content: unknown): ParsedToolCall[] { + if (!Array.isArray(content)) return []; + const calls: ParsedToolCall[] = []; + for (const raw of content) { + const p = rec(raw); + if (p.type === "tool-call") { + calls.push({ + toolCallId: str(p.toolCallId) ?? "", + toolName: str(p.toolName) ?? "", + input: p.input && typeof p.input === "object" ? (p.input as Record) : {}, + }); + } + } + return calls; +} + +type ParsedToolResult = { + toolCallId: string; + toolName: string; + summary: string; + formattedOutput: string; +}; + +function extractToolResults(content: unknown): ParsedToolResult[] { + if (!Array.isArray(content)) return []; + const results: ParsedToolResult[] = []; + for (const raw of content) { + const p = rec(raw); + if (p.type === "tool-result") { + const { summary, formattedOutput } = summarizeToolOutput(p.output); + results.push({ + toolCallId: str(p.toolCallId) ?? "", + toolName: str(p.toolName) ?? "", + summary, + formattedOutput, + }); + } + } + return results; +} + +/** + * Summarize a tool output into a short label and a formatted string for display. 
+ * Handles the AI SDK's `{ type: "json", value: { status, contentType, body, truncated } }` shape. + */ +function summarizeToolOutput(output: unknown): { summary: string; formattedOutput: string } { + if (typeof output === "string") { + return { + summary: output.length > 80 ? output.slice(0, 80) + "..." : output, + formattedOutput: output, + }; + } + + if (!output || typeof output !== "object") { + return { summary: "result", formattedOutput: JSON.stringify(output, null, 2) }; + } + + const o = output as Record<string, unknown>; + + // AI SDK wraps tool results as { type: "json", value: { status, contentType, body, ... } } + if (o.type === "json" && o.value && typeof o.value === "object") { + const v = o.value as Record<string, unknown>; + const parts: string[] = []; + if (typeof v.status === "number") parts.push(`${v.status}`); + if (typeof v.contentType === "string") parts.push(v.contentType); + if (v.truncated === true) parts.push("truncated"); + return { + summary: parts.length > 0 ? parts.join(" · ") : "json result", + formattedOutput: JSON.stringify(v, null, 2), + }; + } + + return { summary: "result", formattedOutput: JSON.stringify(output, null, 2) }; +} + +// --------------------------------------------------------------------------- +// Tool definitions (from ai.prompt.tools) +// --------------------------------------------------------------------------- + +/** + * Parse ai.prompt.tools — after the array fix, this arrives as a JSON array string + * where each element is itself a JSON string of a tool definition. + */ +function parseToolDefinitions(raw: unknown): ToolDefinition[] | undefined { + if (typeof raw !== "string") return undefined; + try { + const parsed = JSON.parse(raw); + if (!Array.isArray(parsed)) return undefined; + const defs: ToolDefinition[] = []; + for (const item of parsed) { + // Each item is either a JSON string or already an object + const obj = typeof item === "string" ?
JSON.parse(item) : item; + if (!obj || typeof obj !== "object") continue; + const o = obj as Record; + const name = str(o.name); + if (!name) continue; + const schema = o.parameters ?? o.inputSchema; + defs.push({ + name, + description: str(o.description), + parametersJson: + schema && typeof schema === "object" + ? JSON.stringify(schema, null, 2) + : undefined, + }); + } + return defs.length > 0 ? defs : undefined; + } catch { + return undefined; + } +} + +// --------------------------------------------------------------------------- +// Provider metadata (service tier, inference geo, etc.) +// --------------------------------------------------------------------------- + +function parseProviderMetadata( + raw: unknown +): { serviceTier?: string; resolvedProvider?: string; gatewayCost?: string } | undefined { + if (typeof raw !== "string") return undefined; + try { + const parsed = JSON.parse(raw) as Record; + if (!parsed || typeof parsed !== "object") return undefined; + + let serviceTier: string | undefined; + let resolvedProvider: string | undefined; + let gatewayCost: string | undefined; + + // Anthropic: { anthropic: { usage: { service_tier: "standard" } } } + const anthropic = rec(parsed.anthropic); + serviceTier = str(rec(anthropic.usage).service_tier); + + // Azure/OpenAI: { azure: { serviceTier: "default" } } or { openai: { serviceTier: "..." } } + if (!serviceTier) { + serviceTier = str(rec(parsed.azure).serviceTier) ?? str(rec(parsed.openai).serviceTier); + } + + // Gateway: { gateway: { routing: { finalProvider, resolvedProvider }, cost } } + const gateway = rec(parsed.gateway); + const routing = rec(gateway.routing); + resolvedProvider = str(routing.finalProvider) ?? 
str(routing.resolvedProvider); + gatewayCost = str(gateway.cost); + + // OpenRouter: { openrouter: { provider: "xAI" } } + if (!resolvedProvider) { + resolvedProvider = str(rec(parsed.openrouter).provider); + } + + if (!serviceTier && !resolvedProvider && !gatewayCost) return undefined; + return { serviceTier, resolvedProvider, gatewayCost }; + } catch { + return undefined; + } +} + +// --------------------------------------------------------------------------- +// Tool choice parsing +// --------------------------------------------------------------------------- + +function parseToolChoice(raw: unknown): string | undefined { + if (typeof raw !== "string") return undefined; + try { + const parsed = JSON.parse(raw); + if (typeof parsed === "string") return parsed; + if (parsed && typeof parsed === "object") { + const obj = parsed as Record; + if (typeof obj.type === "string") return obj.type; + } + return undefined; + } catch { + return undefined; + } +} + +// --------------------------------------------------------------------------- +// Message count +// --------------------------------------------------------------------------- + +function countMessages(raw: unknown): number | undefined { + if (typeof raw !== "string") return undefined; + try { + const parsed = JSON.parse(raw); + if (!Array.isArray(parsed)) return undefined; + return parsed.length > 0 ? 
parsed.length : undefined; + } catch { + return undefined; + } +} + +// --------------------------------------------------------------------------- +// Telemetry metadata +// --------------------------------------------------------------------------- + +function extractTelemetryMetadata(raw: unknown): Record<string, string> | undefined { + if (!raw || typeof raw !== "object") return undefined; + + const result: Record<string, string> = {}; + for (const [key, value] of Object.entries(raw as Record<string, unknown>)) { + if (typeof value === "string" || typeof value === "number" || typeof value === "boolean") { + result[key] = String(value); + } + } + + return Object.keys(result).length > 0 ? result : undefined; +} diff --git a/apps/webapp/app/components/runs/v3/ai/index.ts b/apps/webapp/app/components/runs/v3/ai/index.ts new file mode 100644 index 00000000000..7e33a46fb2c --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/index.ts @@ -0,0 +1,3 @@ +export { AISpanDetails } from "./AISpanDetails"; +export { extractAISpanData } from "./extractAISpanData"; +export type { AISpanData, DisplayItem, ToolUse } from "./types"; diff --git a/apps/webapp/app/components/runs/v3/ai/types.ts b/apps/webapp/app/components/runs/v3/ai/types.ts new file mode 100644 index 00000000000..be10ee9bcd1 --- /dev/null +++ b/apps/webapp/app/components/runs/v3/ai/types.ts @@ -0,0 +1,105 @@ +// --------------------------------------------------------------------------- +// Tool use (merged assistant tool-call + tool result) +// --------------------------------------------------------------------------- + +export type ToolDefinition = { + name: string; + description?: string; + /** JSON schema as formatted string */ + parametersJson?: string; +}; + +export type ToolUse = { + toolCallId: string; + toolName: string; + /** Tool description from the definition, if available */ + description?: string; + /** JSON schema of the tool's parameters, pretty-printed */ + parametersJson?: string; + /** Formatted input args as JSON string */ + inputJson:
string; + /** Short summary of the result (e.g. "200 · text/html · truncated") */ + resultSummary?: string; + /** Full formatted result for display in a code block */ + resultOutput?: string; +}; + +// --------------------------------------------------------------------------- +// Display items — what the UI actually renders +// --------------------------------------------------------------------------- + +/** System prompt text (collapsible) */ +export type SystemItem = { + type: "system"; + text: string; +}; + +/** User message text */ +export type UserItem = { + type: "user"; + text: string; +}; + +/** One or more tool calls with their results, grouped */ +export type ToolUseItem = { + type: "tool-use"; + tools: ToolUse[]; +}; + +/** Final assistant text response */ +export type AssistantItem = { + type: "assistant"; + text: string; +}; + +export type DisplayItem = SystemItem | UserItem | ToolUseItem | AssistantItem; + +// --------------------------------------------------------------------------- +// Span-level AI data +// --------------------------------------------------------------------------- + +export type AISpanData = { + model: string; + provider: string; + operationName: string; + + // Categorical tags + finishReason?: string; + serviceTier?: string; + /** Resolved downstream provider for gateway/openrouter spans (e.g. 
"xAI", "mistral") */ + resolvedProvider?: string; + toolChoice?: string; + toolCount?: number; + messageCount?: number; + /** User-defined telemetry metadata (from ai.telemetry.metadata) */ + telemetryMetadata?: Record; + + // Token counts + inputTokens: number; + outputTokens: number; + totalTokens: number; + cachedTokens?: number; + cacheCreationTokens?: number; + reasoningTokens?: number; + + // Performance + tokensPerSecond?: number; + msToFirstChunk?: number; + durationMs: number; + + // Cost + inputCost?: number; + outputCost?: number; + totalCost?: number; + + // Response text (final assistant output) + responseText?: string; + // Structured object response (JSON) — mutually exclusive with responseText + responseObject?: string; + + // Tool definitions (from ai.prompt.tools) + toolDefinitions?: ToolDefinition[]; + + // Display-ready message items (system, user, tool-use groups, assistant text) + items?: DisplayItem[]; +}; diff --git a/apps/webapp/app/env.server.ts b/apps/webapp/app/env.server.ts index bdfdbea6b3e..2e6da79fdf1 100644 --- a/apps/webapp/app/env.server.ts +++ b/apps/webapp/app/env.server.ts @@ -1247,6 +1247,12 @@ const EnvironmentSchema = z // Metric widget concurrency limits METRIC_WIDGET_DEFAULT_ORG_CONCURRENCY_LIMIT: z.coerce.number().int().default(30), + // Admin ClickHouse URL (for admin dashboard queries like missing models) + ADMIN_CLICKHOUSE_URL: z + .string() + .optional() + .transform((v) => v ?? 
process.env.CLICKHOUSE_URL), + EVENTS_CLICKHOUSE_URL: z .string() .optional() @@ -1277,6 +1283,16 @@ const EnvironmentSchema = z EVENTS_CLICKHOUSE_MAX_TRACE_DETAILED_SUMMARY_VIEW_COUNT: z.coerce.number().int().default(5_000), EVENTS_CLICKHOUSE_MAX_LIVE_RELOADING_SETTING: z.coerce.number().int().default(2000), + // LLM cost tracking + LLM_COST_TRACKING_ENABLED: BoolEnv.default(true), + LLM_PRICING_RELOAD_INTERVAL_MS: z.coerce.number().int().default(5 * 60 * 1000), // 5 minutes + LLM_PRICING_SEED_ON_STARTUP: BoolEnv.default(false), + LLM_PRICING_READY_TIMEOUT_MS: z.coerce.number().int().default(500), + LLM_METRICS_BATCH_SIZE: z.coerce.number().int().default(5000), + LLM_METRICS_FLUSH_INTERVAL_MS: z.coerce.number().int().default(2000), + LLM_METRICS_MAX_BATCH_SIZE: z.coerce.number().int().default(10000), + LLM_METRICS_MAX_CONCURRENCY: z.coerce.number().int().default(2), + // Bootstrap TRIGGER_BOOTSTRAP_ENABLED: z.string().default("0"), TRIGGER_BOOTSTRAP_WORKER_GROUP_NAME: z.string().optional(), diff --git a/apps/webapp/app/presenters/v3/BuiltInDashboards.server.ts b/apps/webapp/app/presenters/v3/BuiltInDashboards.server.ts index da95eeacc00..144176c88fb 100644 --- a/apps/webapp/app/presenters/v3/BuiltInDashboards.server.ts +++ b/apps/webapp/app/presenters/v3/BuiltInDashboards.server.ts @@ -4,6 +4,7 @@ import { z } from "zod"; const overviewDashboard: BuiltInDashboard = { key: "overview", title: "Metrics", + filters: ["tasks", "queues"], layout: { version: "1", layout: [ @@ -213,7 +214,297 @@ const overviewDashboard: BuiltInDashboard = { }, }; -const builtInDashboards: BuiltInDashboard[] = [overviewDashboard]; +const llmDashboard: BuiltInDashboard = { + key: "llm", + title: "AI Metrics", + filters: ["tasks", "models"], + layout: { + version: "1", + layout: [ + // Big numbers row + { i: "llm-cost", x: 0, y: 0, w: 3, h: 4 }, + { i: "llm-calls", x: 3, y: 0, w: 3, h: 4 }, + { i: "llm-ttfc", x: 6, y: 0, w: 3, h: 4 }, + { i: "llm-tps", x: 9, y: 0, w: 3, h: 4 }, + // Cost 
section + { i: "llm-title-cost", x: 0, y: 4, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-cost-time", x: 0, y: 6, w: 6, h: 13 }, + { i: "llm-cost-model", x: 6, y: 6, w: 6, h: 13 }, + // Usage section + { i: "llm-title-usage", x: 0, y: 19, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-tokens-time", x: 0, y: 21, w: 6, h: 13 }, + { i: "llm-calls-model", x: 6, y: 21, w: 6, h: 13 }, + // Performance section + { i: "llm-title-perf", x: 0, y: 34, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-ttfc-time", x: 0, y: 36, w: 6, h: 13 }, + { i: "llm-tps-model", x: 6, y: 36, w: 6, h: 13 }, + { i: "llm-latency-pct", x: 0, y: 49, w: 6, h: 13 }, + { i: "llm-latency-time", x: 6, y: 49, w: 6, h: 13 }, + // Behavior section + { i: "llm-title-behavior", x: 0, y: 62, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-finish-reasons", x: 0, y: 64, w: 6, h: 13 }, + { i: "llm-top-runs", x: 6, y: 64, w: 6, h: 13 }, + // Attribution section + { i: "llm-title-attribution", x: 0, y: 77, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-cost-task", x: 0, y: 79, w: 6, h: 13 }, + { i: "llm-cost-provider", x: 6, y: 79, w: 6, h: 13 }, + { i: "llm-cost-user", x: 0, y: 92, w: 12, h: 13 }, + // Efficiency section + { i: "llm-title-efficiency", x: 0, y: 105, w: 12, h: 2, minH: 2, maxH: 2 }, + { i: "llm-cost-operation", x: 0, y: 107, w: 6, h: 13 }, + { i: "llm-cache-util", x: 6, y: 107, w: 6, h: 13 }, + ], + widgets: { + "llm-cost": { + title: "Total LLM cost", + query: "SELECT\r\n SUM(total_cost) AS total_cost\r\nFROM\r\n llm_metrics", + display: { + type: "bignumber", + column: "total_cost", + aggregation: "sum", + abbreviate: true, + }, + }, + "llm-calls": { + title: "Total calls", + query: "SELECT\r\n count() AS total_calls\r\nFROM\r\n llm_metrics", + display: { + type: "bignumber", + column: "total_calls", + aggregation: "sum", + abbreviate: false, + }, + }, + "llm-ttfc": { + title: "Avg TTFC", + query: + "SELECT\r\n round(avg(ms_to_first_chunk), 1) AS avg_ttfc\r\nFROM\r\n llm_metrics\r\nWHERE ms_to_first_chunk 
> 0", + display: { + type: "bignumber", + column: "avg_ttfc", + aggregation: "avg", + abbreviate: false, + suffix: "ms", + }, + }, + "llm-tps": { + title: "Avg tokens/sec", + query: + "SELECT\r\n round(avg(tokens_per_second), 1) AS avg_tps\r\nFROM\r\n llm_metrics\r\nWHERE tokens_per_second > 0", + display: { + type: "bignumber", + column: "avg_tps", + aggregation: "avg", + abbreviate: false, + suffix: "/s", + }, + }, + "llm-title-cost": { title: "Cost", query: "", display: { type: "title" } }, + "llm-cost-time": { + title: "Cost over time", + query: + "SELECT\r\n timeBucket(),\r\n SUM(total_cost) AS total_cost\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n timeBucket\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "line", + xAxisColumn: "timebucket", + yAxisColumns: ["total_cost"], + groupByColumn: null, + stacked: false, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + "llm-cost-model": { + title: "Cost by model", + query: + "SELECT\r\n timeBucket(),\r\n response_model,\r\n SUM(total_cost) AS total_cost\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n timeBucket,\r\n response_model\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "bar", + xAxisColumn: "timebucket", + yAxisColumns: ["total_cost"], + groupByColumn: "response_model", + stacked: true, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + "llm-title-usage": { title: "Usage", query: "", display: { type: "title" } }, + "llm-tokens-time": { + title: "Tokens over time", + query: + "SELECT\r\n timeBucket(),\r\n SUM(input_tokens) AS input_tokens,\r\n SUM(output_tokens) AS output_tokens\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n timeBucket\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "bar", + xAxisColumn: "timebucket", + yAxisColumns: ["input_tokens", "output_tokens"], + groupByColumn: null, + stacked: true, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + 
"llm-calls-model": { + title: "Calls by model", + query: + "SELECT\r\n response_model,\r\n count() AS calls,\r\n SUM(total_tokens) AS tokens,\r\n SUM(total_cost) AS cost\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n response_model\r\nORDER BY\r\n cost DESC", + display: { type: "table", prettyFormatting: true, sorting: [] }, + }, + "llm-title-perf": { title: "Performance", query: "", display: { type: "title" } }, + "llm-ttfc-time": { + title: "TTFC over time", + query: + "SELECT\r\n timeBucket(),\r\n round(avg(ms_to_first_chunk), 1) AS avg_ttfc\r\nFROM\r\n llm_metrics\r\nWHERE ms_to_first_chunk > 0\r\nGROUP BY\r\n timeBucket\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "line", + xAxisColumn: "timebucket", + yAxisColumns: ["avg_ttfc"], + groupByColumn: null, + stacked: false, + sortByColumn: null, + sortDirection: "asc", + aggregation: "avg", + }, + }, + "llm-tps-model": { + title: "Tokens/sec by model", + query: + "SELECT\r\n timeBucket(),\r\n response_model,\r\n round(avg(tokens_per_second), 1) AS avg_tps\r\nFROM\r\n llm_metrics\r\nWHERE tokens_per_second > 0\r\nGROUP BY\r\n timeBucket,\r\n response_model\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "line", + xAxisColumn: "timebucket", + yAxisColumns: ["avg_tps"], + groupByColumn: "response_model", + stacked: false, + sortByColumn: null, + sortDirection: "asc", + aggregation: "avg", + }, + }, + "llm-latency-pct": { + title: "Latency percentiles by model", + query: + "SELECT\r\n response_model,\r\n round(quantile(0.5)(ms_to_first_chunk), 1) AS p50,\r\n round(quantile(0.9)(ms_to_first_chunk), 1) AS p90,\r\n round(quantile(0.95)(ms_to_first_chunk), 1) AS p95,\r\n round(quantile(0.99)(ms_to_first_chunk), 1) AS p99,\r\n count() AS calls\r\nFROM\r\n llm_metrics\r\nWHERE ms_to_first_chunk > 0\r\nGROUP BY\r\n response_model\r\nORDER BY\r\n p50 DESC", + display: { type: "table", prettyFormatting: true, sorting: [] }, + }, + "llm-latency-time": { + title: "Latency percentiles 
over time", + query: + "SELECT\r\n timeBucket(),\r\n round(quantile(0.5)(ms_to_first_chunk), 1) AS p50,\r\n round(quantile(0.95)(ms_to_first_chunk), 1) AS p95\r\nFROM\r\n llm_metrics\r\nWHERE ms_to_first_chunk > 0\r\nGROUP BY\r\n timeBucket\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "line", + xAxisColumn: "timebucket", + yAxisColumns: ["p50", "p95"], + groupByColumn: null, + stacked: false, + sortByColumn: null, + sortDirection: "asc", + aggregation: "avg", + seriesColors: { p95: "#f43f5e" }, + }, + }, + "llm-title-behavior": { title: "Behavior", query: "", display: { type: "title" } }, + "llm-finish-reasons": { + title: "Finish reasons over time", + query: + "SELECT\r\n timeBucket(),\r\n finish_reason,\r\n count() AS calls\r\nFROM\r\n llm_metrics\r\nWHERE finish_reason != ''\r\nGROUP BY\r\n timeBucket,\r\n finish_reason\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "bar", + xAxisColumn: "timebucket", + yAxisColumns: ["calls"], + groupByColumn: "finish_reason", + stacked: true, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + "llm-top-runs": { + title: "Most expensive runs", + query: + "SELECT\r\n run_id,\r\n task_identifier,\r\n SUM(total_cost) AS llm_cost,\r\n SUM(total_tokens) AS tokens\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n run_id,\r\n task_identifier\r\nORDER BY\r\n llm_cost DESC\r\nLIMIT 50", + display: { type: "table", prettyFormatting: true, sorting: [] }, + }, + "llm-title-attribution": { title: "Attribution", query: "", display: { type: "title" } }, + "llm-cost-task": { + title: "Cost by task", + query: + "SELECT\r\n task_identifier,\r\n SUM(total_cost) AS cost,\r\n SUM(total_tokens) AS tokens,\r\n count() AS calls\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n task_identifier\r\nORDER BY\r\n cost DESC", + display: { type: "table", prettyFormatting: true, sorting: [] }, + }, + "llm-cost-provider": { + title: "Cost by provider", + query: + "SELECT\r\n timeBucket(),\r\n 
gen_ai_system,\r\n SUM(total_cost) AS total_cost\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n timeBucket,\r\n gen_ai_system\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "bar", + xAxisColumn: "timebucket", + yAxisColumns: ["total_cost"], + groupByColumn: "gen_ai_system", + stacked: true, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + "llm-cost-user": { + title: "Cost by user", + query: + "SELECT\r\n metadata['userId'] AS user_id,\r\n SUM(total_cost) AS cost,\r\n SUM(total_tokens) AS tokens,\r\n count() AS calls\r\nFROM\r\n llm_metrics\r\nWHERE metadata['userId'] != ''\r\nGROUP BY\r\n user_id\r\nORDER BY\r\n cost DESC\r\nLIMIT 20", + display: { type: "table", prettyFormatting: true, sorting: [] }, + }, + "llm-title-efficiency": { title: "Efficiency", query: "", display: { type: "title" } }, + "llm-cost-operation": { + title: "Cost by operation type", + query: + "SELECT\r\n timeBucket(),\r\n operation_id,\r\n SUM(total_cost) AS total_cost\r\nFROM\r\n llm_metrics\r\nWHERE operation_id != ''\r\nGROUP BY\r\n timeBucket,\r\n operation_id\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "bar", + xAxisColumn: "timebucket", + yAxisColumns: ["total_cost"], + groupByColumn: "operation_id", + stacked: true, + sortByColumn: null, + sortDirection: "asc", + aggregation: "sum", + }, + }, + "llm-cache-util": { + title: "Cache utilization", + query: + "SELECT\r\n timeBucket(),\r\n round(countIf(cached_read_tokens > 0) * 100.0 / count(), 1) AS cache_hit_pct,\r\n round(avg(cached_read_tokens), 0) AS avg_cached_tokens\r\nFROM\r\n llm_metrics\r\nGROUP BY\r\n timeBucket\r\nORDER BY\r\n timeBucket", + display: { + type: "chart", + chartType: "line", + xAxisColumn: "timebucket", + yAxisColumns: ["cache_hit_pct"], + groupByColumn: null, + stacked: false, + sortByColumn: null, + sortDirection: "asc", + aggregation: "avg", + }, + }, + }, + }, +}; + +const builtInDashboards: BuiltInDashboard[] = [overviewDashboard, 
llmDashboard]; + +export function builtInDashboardList(): BuiltInDashboard[] { + return builtInDashboards; +} export function builtInDashboard(key: string): BuiltInDashboard { const dashboard = builtInDashboards.find((d) => d.key === key); diff --git a/apps/webapp/app/presenters/v3/MetricDashboardPresenter.server.ts b/apps/webapp/app/presenters/v3/MetricDashboardPresenter.server.ts index d5363ddb9af..90b60891c58 100644 --- a/apps/webapp/app/presenters/v3/MetricDashboardPresenter.server.ts +++ b/apps/webapp/app/presenters/v3/MetricDashboardPresenter.server.ts @@ -58,10 +58,14 @@ export type CustomDashboard = { defaultPeriod: string; }; +export type BuiltInDashboardFilter = "tasks" | "queues" | "models"; + export type BuiltInDashboard = { key: string; title: string; layout: DashboardLayout; + /** Which filters to show in the toolbar. Defaults to ["tasks", "queues"] if not specified. */ + filters?: BuiltInDashboardFilter[]; }; /** Returns the dashboard layout */ diff --git a/apps/webapp/app/presenters/v3/SpanPresenter.server.ts b/apps/webapp/app/presenters/v3/SpanPresenter.server.ts index ce83c2e242b..9ad94745616 100644 --- a/apps/webapp/app/presenters/v3/SpanPresenter.server.ts +++ b/apps/webapp/app/presenters/v3/SpanPresenter.server.ts @@ -24,6 +24,7 @@ import { engine } from "~/v3/runEngine.server"; import { resolveEventRepositoryForStore } from "~/v3/eventRepository/index.server"; import { IEventRepository, SpanDetail } from "~/v3/eventRepository/eventRepository.types"; import { safeJsonParse } from "~/utils/json"; +import { extractAISpanData } from "~/components/runs/v3/ai"; type Result = Awaited>; export type Span = NonNullable["span"]>; @@ -543,6 +544,13 @@ export class SpanPresenter extends BasePresenter { entity: span.entity, metadata: span.metadata, triggeredRuns, + aiData: + span.properties && typeof span.properties === "object" + ? 
extractAISpanData( + span.properties as Record, + span.duration / 1_000_000 + ) + : undefined, }; switch (span.entity.type) { @@ -665,6 +673,12 @@ export class SpanPresenter extends BasePresenter { }; } default: + if (data.aiData) { + return { + ...data, + entity: { type: "ai-generation" as const, object: data.aiData }, + }; + } return { ...data, entity: null }; } } diff --git a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.dashboards.$dashboardKey/route.tsx b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.dashboards.$dashboardKey/route.tsx index 1606158598a..1374fd0f3de 100644 --- a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.dashboards.$dashboardKey/route.tsx +++ b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.dashboards.$dashboardKey/route.tsx @@ -6,6 +6,7 @@ import { typedjson, useTypedLoaderData } from "remix-typedjson"; import { z } from "zod"; import { PageBody, PageContainer } from "~/components/layout/AppLayout"; import { LogsTaskFilter } from "~/components/logs/LogsTaskFilter"; +import { ModelsFilter, type ModelOption } from "~/components/metrics/ModelsFilter"; import { type WidgetData } from "~/components/metrics/QueryWidget"; import { QueuesFilter } from "~/components/metrics/QueuesFilter"; import { ScopeFilter } from "~/components/metrics/ScopeFilter"; @@ -22,10 +23,12 @@ import { findProjectBySlug } from "~/models/project.server"; import { findEnvironmentBySlug } from "~/models/runtimeEnvironment.server"; import { getAllTaskIdentifiers } from "~/models/task.server"; import { + type BuiltInDashboardFilter, type LayoutItem, type Widget, MetricDashboardPresenter, } from "~/presenters/v3/MetricDashboardPresenter.server"; +import { clickhouseClient } from "~/services/clickhouseInstance.server"; import { requireUser } from "~/services/session.server"; import { cn } from "~/utils/cn"; import 
{ EnvironmentParamSchema } from "~/utils/pathBuilder"; @@ -66,11 +69,38 @@ export const loader = async ({ request, params }: LoaderFunctionArgs) => { getAllTaskIdentifiers($replica, environment.id), ]); + const filters = dashboard.filters ?? ["tasks", "queues"]; + + // Load distinct models from ClickHouse if the dashboard has a models filter + let possibleModels: { model: string; system: string }[] = []; + if (filters.includes("models")) { + const queryFn = clickhouseClient.reader.query({ + name: "getDistinctModels", + query: `SELECT response_model, any(gen_ai_system) AS gen_ai_system FROM trigger_dev.llm_metrics_v1 WHERE organization_id = {organizationId: String} AND project_id = {projectId: String} AND environment_id = {environmentId: String} AND response_model != '' GROUP BY response_model ORDER BY response_model`, + params: z.object({ + organizationId: z.string(), + projectId: z.string(), + environmentId: z.string(), + }), + schema: z.object({ response_model: z.string(), gen_ai_system: z.string() }), + }); + const [error, rows] = await queryFn({ + organizationId: project.organizationId, + projectId: project.id, + environmentId: environment.id, + }); + if (!error) { + possibleModels = rows.map((r) => ({ model: r.response_model, system: r.gen_ai_system })); + } + } + return typedjson({ ...dashboard, + filters, possibleTasks: possibleTasks .map((task) => ({ slug: task.slug, triggerSource: task.triggerSource })) .sort((a, b) => a.slug.localeCompare(b.slug)), + possibleModels, }); }; @@ -80,7 +110,9 @@ export default function Page() { title, layout: dashboardLayout, defaultPeriod, + filters, possibleTasks, + possibleModels, } = useTypedLoaderData(); const organization = useOrganization(); @@ -107,7 +139,9 @@ export default function Page() { widgets={dashboardLayout.widgets} defaultPeriod={defaultPeriod} editable={false} + filters={filters} possibleTasks={possibleTasks} + possibleModels={possibleModels} />
@@ -120,7 +154,9 @@ export function MetricDashboard({ widgets, defaultPeriod, editable, + filters: filterConfig, possibleTasks, + possibleModels, onLayoutChange, onEditWidget, onRenameWidget, @@ -133,8 +169,12 @@ export function MetricDashboard({ widgets: Record; defaultPeriod: string; editable: boolean; + /** Which filters to show. Defaults to ["tasks", "queues"]. */ + filters?: BuiltInDashboardFilter[]; /** Possible tasks for filtering */ possibleTasks?: { slug: string; triggerSource: TaskTriggerSource }[]; + /** Possible models for filtering */ + possibleModels?: ModelOption[]; onLayoutChange?: (layout: LayoutItem[]) => void; onEditWidget?: (widgetId: string, widget: WidgetData) => void; onRenameWidget?: (widgetId: string, newTitle: string) => void; @@ -161,6 +201,9 @@ export function MetricDashboard({ const scope = parsedScope.success ? parsedScope.data : "environment"; const tasks = values("tasks").filter((v) => v !== ""); const queues = values("queues").filter((v) => v !== ""); + const models = values("models").filter((v) => v !== ""); + + const activeFilters = filterConfig ?? ["tasks", "queues"]; const handleLayoutChange = useCallback( (newLayout: readonly LayoutItem[]) => { @@ -187,8 +230,13 @@ export function MetricDashboard({
- - + {activeFilters.includes("tasks") && ( + + )} + {activeFilters.includes("queues") && } + {activeFilters.includes("models") && ( + + )} 0 ? tasks : undefined} queues={queues.length > 0 ? queues : undefined} + responseModels={models.length > 0 ? models : undefined} config={widget.display} organizationId={organization.id} projectId={project.id} diff --git a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.query/ExamplesContent.tsx b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.query/ExamplesContent.tsx index 4d027223f14..f0c3c1d616f 100644 --- a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.query/ExamplesContent.tsx +++ b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.query/ExamplesContent.tsx @@ -118,6 +118,96 @@ LIMIT 100`, scope: "environment", table: "metrics", }, + { + title: "LLM cost by model (past 7d)", + description: "Total cost, input tokens, and output tokens grouped by model over the last 7 days.", + query: `SELECT + response_model, + SUM(total_cost) AS total_cost, + SUM(input_tokens) AS input_tokens, + SUM(output_tokens) AS output_tokens +FROM llm_metrics +WHERE start_time > now() - INTERVAL 7 DAY +GROUP BY response_model +ORDER BY total_cost DESC`, + scope: "environment", + table: "llm_metrics", + }, + { + title: "LLM cost over time", + description: "Total LLM cost bucketed over time. 
The bucket size adjusts automatically.", + query: `SELECT + timeBucket(), + SUM(total_cost) AS total_cost +FROM llm_metrics +GROUP BY timeBucket +ORDER BY timeBucket +LIMIT 1000`, + scope: "environment", + table: "llm_metrics", + }, + { + title: "Most expensive runs by LLM cost (top 50)", + description: "Top 50 runs by total LLM cost with token breakdown.", + query: `SELECT + run_id, + task_identifier, + SUM(total_cost) AS llm_cost, + SUM(input_tokens) AS input_tokens, + SUM(output_tokens) AS output_tokens +FROM llm_metrics +GROUP BY run_id, task_identifier +ORDER BY llm_cost DESC +LIMIT 50`, + scope: "environment", + table: "llm_metrics", + }, + { + title: "LLM calls by provider", + description: "Count and cost of LLM calls grouped by AI provider.", + query: `SELECT + gen_ai_system, + count() AS call_count, + SUM(total_cost) AS total_cost +FROM llm_metrics +GROUP BY gen_ai_system +ORDER BY total_cost DESC`, + scope: "environment", + table: "llm_metrics", + }, + { + title: "LLM cost by user", + description: + "Total LLM cost per user from run tags or AI SDK telemetry metadata. Uses metadata.userId which comes from experimental_telemetry metadata or run tags like user:123.", + query: `SELECT + metadata.userId AS user_id, + SUM(total_cost) AS total_cost, + SUM(total_tokens) AS total_tokens, + count() AS call_count +FROM llm_metrics +WHERE metadata.userId != '' +GROUP BY metadata.userId +ORDER BY total_cost DESC +LIMIT 50`, + scope: "environment", + table: "llm_metrics", + }, + { + title: "LLM cost by metadata key", + description: + "Browse all metadata keys and their LLM cost. 
Metadata comes from run tags (key:value) and AI SDK telemetry metadata.", + query: `SELECT + metadata, + response_model, + total_cost, + total_tokens, + run_id +FROM llm_metrics +ORDER BY start_time DESC +LIMIT 20`, + scope: "environment", + table: "llm_metrics", + }, ]; const tableOptions = querySchemas.map((s) => ({ label: s.name, value: s.name })); diff --git a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam/route.tsx b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam/route.tsx index e02d29b95b5..118226906e1 100644 --- a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam/route.tsx +++ b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam/route.tsx @@ -119,7 +119,7 @@ const resizableSettings = { }, inspector: { id: "inspector", - default: "430px" as const, + default: "500px" as const, min: "50px" as const, }, }, diff --git a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.test.tasks.$taskParam/route.tsx b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.test.tasks.$taskParam/route.tsx index 29d9e246e2d..ee69419e1b7 100644 --- a/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.test.tasks.$taskParam/route.tsx +++ b/apps/webapp/app/routes/_app.orgs.$organizationSlug.projects.$projectParam.env.$envParam.test.tasks.$taskParam/route.tsx @@ -120,6 +120,12 @@ export const loader = async ({ request, params }: LoaderFunctionArgs) => { return typedjson({ ...result, regions: regionsResult.regions }); } catch (error) { + logger.error("Failed to load test page", { + taskParam, + error: error instanceof Error ? error.message : error, + stack: error instanceof Error ? 
error.stack : undefined, + }); + return redirectWithErrorMessage( v3TestPath({ slug: organizationSlug }, { slug: projectParam }, environment), request, diff --git a/apps/webapp/app/routes/admin.api.v1.llm-models.$modelId.ts b/apps/webapp/app/routes/admin.api.v1.llm-models.$modelId.ts new file mode 100644 index 00000000000..4e8357c886c --- /dev/null +++ b/apps/webapp/app/routes/admin.api.v1.llm-models.$modelId.ts @@ -0,0 +1,152 @@ +import { type ActionFunctionArgs, type LoaderFunctionArgs, json } from "@remix-run/server-runtime"; +import { z } from "zod"; +import { prisma } from "~/db.server"; +import { authenticateApiRequestWithPersonalAccessToken } from "~/services/personalAccessToken.server"; + +async function requireAdmin(request: Request) { + const authResult = await authenticateApiRequestWithPersonalAccessToken(request); + if (!authResult) { + throw json({ error: "Invalid or Missing API key" }, { status: 401 }); + } + + const user = await prisma.user.findUnique({ where: { id: authResult.userId } }); + if (!user?.admin) { + throw json({ error: "You must be an admin to perform this action" }, { status: 403 }); + } + + return user; +} + +export async function loader({ request, params }: LoaderFunctionArgs) { + await requireAdmin(request); + + const model = await prisma.llmModel.findUnique({ + where: { id: params.modelId }, + include: { + pricingTiers: { + include: { prices: true }, + orderBy: { priority: "asc" }, + }, + }, + }); + + if (!model) { + return json({ error: "Model not found" }, { status: 404 }); + } + + return json({ model }); +} + +const UpdateModelSchema = z.object({ + modelName: z.string().min(1).optional(), + matchPattern: z.string().min(1).optional(), + startDate: z.string().nullable().optional(), + pricingTiers: z + .array( + z.object({ + name: z.string().min(1), + isDefault: z.boolean().default(true), + priority: z.number().int().default(0), + conditions: z + .array( + z.object({ + usageDetailPattern: z.string(), + operator: z.enum(["gt", 
"gte", "lt", "lte", "eq", "neq"]), + value: z.number(), + }) + ) + .default([]), + prices: z.record(z.string(), z.number()), + }) + ) + .optional(), +}); + +export async function action({ request, params }: ActionFunctionArgs) { + await requireAdmin(request); + + const modelId = params.modelId!; + + if (request.method === "DELETE") { + const existing = await prisma.llmModel.findUnique({ where: { id: modelId } }); + if (!existing) { + return json({ error: "Model not found" }, { status: 404 }); + } + + await prisma.llmModel.delete({ where: { id: modelId } }); + return json({ success: true }); + } + + if (request.method !== "PUT") { + return json({ error: "Method not allowed" }, { status: 405 }); + } + + let body: unknown; + try { + body = await request.json(); + } catch { + return json({ error: "Invalid JSON body" }, { status: 400 }); + } + + const parsed = UpdateModelSchema.safeParse(body); + + if (!parsed.success) { + return json({ error: "Invalid request body", details: parsed.error.issues }, { status: 400 }); + } + + const { modelName, matchPattern, startDate, pricingTiers } = parsed.data; + + // Validate regex if provided — strip (?i) POSIX flag since our registry handles it + if (matchPattern) { + try { + const testPattern = matchPattern.startsWith("(?i)") ? matchPattern.slice(4) : matchPattern; + new RegExp(testPattern); + } catch { + return json({ error: "Invalid regex in matchPattern" }, { status: 400 }); + } + } + + // Update model + tiers atomically + const updated = await prisma.$transaction(async (tx) => { + await tx.llmModel.update({ + where: { id: modelId }, + data: { + ...(modelName !== undefined && { modelName }), + ...(matchPattern !== undefined && { matchPattern }), + ...(startDate !== undefined && { startDate: startDate ? 
new Date(startDate) : null }), + }, + }); + + if (pricingTiers) { + await tx.llmPricingTier.deleteMany({ where: { modelId } }); + + for (const tier of pricingTiers) { + await tx.llmPricingTier.create({ + data: { + modelId, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: { + create: Object.entries(tier.prices).map(([usageType, price]) => ({ + modelId, + usageType, + price, + })), + }, + }, + }); + } + } + + return tx.llmModel.findUnique({ + where: { id: modelId }, + include: { + pricingTiers: { include: { prices: true }, orderBy: { priority: "asc" } }, + }, + }); + }); + + return json({ model: updated }); +} diff --git a/apps/webapp/app/routes/admin.api.v1.llm-models.missing.ts b/apps/webapp/app/routes/admin.api.v1.llm-models.missing.ts new file mode 100644 index 00000000000..5ca7077e1cc --- /dev/null +++ b/apps/webapp/app/routes/admin.api.v1.llm-models.missing.ts @@ -0,0 +1,33 @@ +import { type LoaderFunctionArgs, json } from "@remix-run/server-runtime"; +import { prisma } from "~/db.server"; +import { authenticateApiRequestWithPersonalAccessToken } from "~/services/personalAccessToken.server"; +import { getMissingLlmModels } from "~/services/admin/missingLlmModels.server"; + +async function requireAdmin(request: Request) { + const authResult = await authenticateApiRequestWithPersonalAccessToken(request); + if (!authResult) { + throw json({ error: "Invalid or Missing API key" }, { status: 401 }); + } + + const user = await prisma.user.findUnique({ where: { id: authResult.userId } }); + if (!user?.admin) { + throw json({ error: "You must be an admin to perform this action" }, { status: 403 }); + } + + return user; +} + +export async function loader({ request }: LoaderFunctionArgs) { + await requireAdmin(request); + + const url = new URL(request.url); + const lookbackHours = parseInt(url.searchParams.get("lookbackHours") ?? 
"24", 10); + + if (isNaN(lookbackHours) || lookbackHours < 1 || lookbackHours > 720) { + return json({ error: "lookbackHours must be between 1 and 720" }, { status: 400 }); + } + + const models = await getMissingLlmModels({ lookbackHours }); + + return json({ models, lookbackHours }); +} diff --git a/apps/webapp/app/routes/admin.api.v1.llm-models.reload.ts b/apps/webapp/app/routes/admin.api.v1.llm-models.reload.ts new file mode 100644 index 00000000000..747722b352a --- /dev/null +++ b/apps/webapp/app/routes/admin.api.v1.llm-models.reload.ts @@ -0,0 +1,24 @@ +import { type ActionFunctionArgs, json } from "@remix-run/server-runtime"; +import { prisma } from "~/db.server"; +import { authenticateApiRequestWithPersonalAccessToken } from "~/services/personalAccessToken.server"; +import { llmPricingRegistry } from "~/v3/llmPricingRegistry.server"; + +export async function action({ request }: ActionFunctionArgs) { + const authResult = await authenticateApiRequestWithPersonalAccessToken(request); + if (!authResult) { + return json({ error: "Invalid or Missing API key" }, { status: 401 }); + } + + const user = await prisma.user.findUnique({ where: { id: authResult.userId } }); + if (!user?.admin) { + return json({ error: "You must be an admin to perform this action" }, { status: 403 }); + } + + if (!llmPricingRegistry) { + return json({ error: "LLM cost tracking is disabled" }, { status: 400 }); + } + + await llmPricingRegistry.reload(); + + return json({ success: true, message: "LLM pricing registry reloaded" }); +} diff --git a/apps/webapp/app/routes/admin.api.v1.llm-models.seed.ts b/apps/webapp/app/routes/admin.api.v1.llm-models.seed.ts new file mode 100644 index 00000000000..805f97ad233 --- /dev/null +++ b/apps/webapp/app/routes/admin.api.v1.llm-models.seed.ts @@ -0,0 +1,30 @@ +import { type ActionFunctionArgs, json } from "@remix-run/server-runtime"; +import { seedLlmPricing } from "@internal/llm-pricing"; +import { prisma } from "~/db.server"; +import { 
authenticateApiRequestWithPersonalAccessToken } from "~/services/personalAccessToken.server"; +import { llmPricingRegistry } from "~/v3/llmPricingRegistry.server"; + +export async function action({ request }: ActionFunctionArgs) { + const authResult = await authenticateApiRequestWithPersonalAccessToken(request); + if (!authResult) { + return json({ error: "Invalid or Missing API key" }, { status: 401 }); + } + + const user = await prisma.user.findUnique({ where: { id: authResult.userId } }); + if (!user?.admin) { + return json({ error: "You must be an admin to perform this action" }, { status: 403 }); + } + + const result = await seedLlmPricing(prisma); + + // Reload the in-memory registry after seeding (if enabled) + if (llmPricingRegistry) { + await llmPricingRegistry.reload(); + } + + return json({ + success: true, + ...result, + message: `Seeded ${result.modelsCreated} models, skipped ${result.modelsSkipped} existing`, + }); +} diff --git a/apps/webapp/app/routes/admin.api.v1.llm-models.ts b/apps/webapp/app/routes/admin.api.v1.llm-models.ts new file mode 100644 index 00000000000..6305869c605 --- /dev/null +++ b/apps/webapp/app/routes/admin.api.v1.llm-models.ts @@ -0,0 +1,141 @@ +import { type ActionFunctionArgs, type LoaderFunctionArgs, json } from "@remix-run/server-runtime"; +import { z } from "zod"; +import { prisma } from "~/db.server"; +import { authenticateApiRequestWithPersonalAccessToken } from "~/services/personalAccessToken.server"; +import { generateFriendlyId } from "~/v3/friendlyIdentifiers"; + +async function requireAdmin(request: Request) { + const authResult = await authenticateApiRequestWithPersonalAccessToken(request); + if (!authResult) { + throw json({ error: "Invalid or Missing API key" }, { status: 401 }); + } + + const user = await prisma.user.findUnique({ where: { id: authResult.userId } }); + if (!user?.admin) { + throw json({ error: "You must be an admin to perform this action" }, { status: 403 }); + } + + return user; +} + +export 
async function loader({ request }: LoaderFunctionArgs) { + await requireAdmin(request); + + const url = new URL(request.url); + const page = parseInt(url.searchParams.get("page") ?? "1"); + const pageSize = parseInt(url.searchParams.get("pageSize") ?? "50"); + + const [models, total] = await Promise.all([ + prisma.llmModel.findMany({ + where: { projectId: null }, + include: { + pricingTiers: { + include: { prices: true }, + orderBy: { priority: "asc" }, + }, + }, + orderBy: { modelName: "asc" }, + skip: (page - 1) * pageSize, + take: pageSize, + }), + prisma.llmModel.count({ where: { projectId: null } }), + ]); + + return json({ models, total, page, pageSize }); +} + +const CreateModelSchema = z.object({ + modelName: z.string().min(1), + matchPattern: z.string().min(1), + startDate: z.string().optional(), + source: z.enum(["default", "admin"]).optional().default("admin"), + pricingTiers: z.array( + z.object({ + name: z.string().min(1), + isDefault: z.boolean().default(true), + priority: z.number().int().default(0), + conditions: z + .array( + z.object({ + usageDetailPattern: z.string(), + operator: z.enum(["gt", "gte", "lt", "lte", "eq", "neq"]), + value: z.number(), + }) + ) + .default([]), + prices: z.record(z.string(), z.number()), + }) + ), +}); + +export async function action({ request }: ActionFunctionArgs) { + await requireAdmin(request); + + if (request.method !== "POST") { + return json({ error: "Method not allowed" }, { status: 405 }); + } + + let body: unknown; + try { + body = await request.json(); + } catch { + return json({ error: "Invalid JSON body" }, { status: 400 }); + } + + const parsed = CreateModelSchema.safeParse(body); + + if (!parsed.success) { + return json({ error: "Invalid request body", details: parsed.error.issues }, { status: 400 }); + } + + const { modelName, matchPattern, startDate, source, pricingTiers } = parsed.data; + + // Validate regex pattern — strip (?i) POSIX flag since our registry handles it + try { + const testPattern = 
matchPattern.startsWith("(?i)") ? matchPattern.slice(4) : matchPattern; + new RegExp(testPattern); + } catch { + return json({ error: "Invalid regex in matchPattern" }, { status: 400 }); + } + + // Create model + tiers atomically + const created = await prisma.$transaction(async (tx) => { + const model = await tx.llmModel.create({ + data: { + friendlyId: generateFriendlyId("llm_model"), + modelName, + matchPattern, + startDate: startDate ? new Date(startDate) : null, + source, + }, + }); + + for (const tier of pricingTiers) { + await tx.llmPricingTier.create({ + data: { + modelId: model.id, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: { + create: Object.entries(tier.prices).map(([usageType, price]) => ({ + modelId: model.id, + usageType, + price, + })), + }, + }, + }); + } + + return tx.llmModel.findUnique({ + where: { id: model.id }, + include: { + pricingTiers: { include: { prices: true } }, + }, + }); + }); + + return json({ model: created }, { status: 201 }); +} diff --git a/apps/webapp/app/routes/admin.llm-models.$modelId.tsx b/apps/webapp/app/routes/admin.llm-models.$modelId.tsx new file mode 100644 index 00000000000..e37491a1b4f --- /dev/null +++ b/apps/webapp/app/routes/admin.llm-models.$modelId.tsx @@ -0,0 +1,461 @@ +import { Form, useActionData, useNavigate } from "@remix-run/react"; +import type { ActionFunctionArgs, LoaderFunctionArgs } from "@remix-run/server-runtime"; +import { redirect } from "@remix-run/server-runtime"; +import { typedjson, useTypedLoaderData } from "remix-typedjson"; +import { z } from "zod"; +import { useState } from "react"; +import { Button, LinkButton } from "~/components/primitives/Buttons"; +import { Input } from "~/components/primitives/Input"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import { prisma } from "~/db.server"; +import { requireUserId } from "~/services/session.server"; +import { llmPricingRegistry } from 
"~/v3/llmPricingRegistry.server"; + +export const loader = async ({ request, params }: LoaderFunctionArgs) => { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + const model = await prisma.llmModel.findUnique({ + where: { friendlyId: params.modelId }, + include: { + pricingTiers: { include: { prices: true }, orderBy: { priority: "asc" } }, + }, + }); + + if (!model) throw new Response("Model not found", { status: 404 }); + + // Convert Prisma Decimal to plain numbers for serialization + const serialized = { + ...model, + pricingTiers: model.pricingTiers.map((t) => ({ + ...t, + prices: t.prices.map((p) => ({ ...p, price: Number(p.price) })), + })), + }; + + return typedjson({ model: serialized }); +}; + +const SaveSchema = z.object({ + modelName: z.string().min(1), + matchPattern: z.string().min(1), + pricingTiersJson: z.string(), +}); + +export async function action({ request, params }: ActionFunctionArgs) { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + const friendlyId = params.modelId!; + const existing = await prisma.llmModel.findUnique({ where: { friendlyId } }); + if (!existing) throw new Response("Model not found", { status: 404 }); + const modelId = existing.id; + + const formData = await request.formData(); + const _action = formData.get("_action"); + + if (_action === "delete") { + await prisma.llmModel.delete({ where: { id: modelId } }); + await llmPricingRegistry?.reload(); + return redirect("/admin/llm-models"); + } + + if (_action === "save") { + const raw = Object.fromEntries(formData); + const parsed = SaveSchema.safeParse(raw); + + if (!parsed.success) { + return typedjson({ error: "Invalid form data", details: parsed.error.issues }, { status: 400 }); + } + + const { modelName, matchPattern, pricingTiersJson } = 
parsed.data; + + // Validate regex — strip (?i) POSIX flag since our registry handles it + try { + const testPattern = matchPattern.startsWith("(?i)") ? matchPattern.slice(4) : matchPattern; + new RegExp(testPattern); + } catch { + return typedjson({ error: "Invalid regex in matchPattern" }, { status: 400 }); + } + + // Parse tiers + let pricingTiers: Array<{ + name: string; + isDefault: boolean; + priority: number; + conditions: Array<{ usageDetailPattern: string; operator: string; value: number }>; + prices: Record; + }>; + try { + pricingTiers = JSON.parse(pricingTiersJson) as typeof pricingTiers; + } catch { + return typedjson({ error: "Invalid pricing tiers JSON" }, { status: 400 }); + } + + // Update model + await prisma.llmModel.update({ + where: { id: modelId }, + data: { modelName, matchPattern }, + }); + + // Replace tiers + await prisma.llmPricingTier.deleteMany({ where: { modelId } }); + for (const tier of pricingTiers) { + await prisma.llmPricingTier.create({ + data: { + modelId, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: { + create: Object.entries(tier.prices).map(([usageType, price]) => ({ + modelId, + usageType, + price, + })), + }, + }, + }); + } + + await llmPricingRegistry?.reload(); + return typedjson({ success: true }); + } + + return typedjson({ error: "Unknown action" }, { status: 400 }); +} + +export default function AdminLlmModelDetailRoute() { + const { model } = useTypedLoaderData(); + const actionData = useActionData<{ success?: boolean; error?: string; details?: unknown[] }>(); + const navigate = useNavigate(); + + const [modelName, setModelName] = useState(model.modelName); + const [matchPattern, setMatchPattern] = useState(model.matchPattern); + const [testInput, setTestInput] = useState(""); + const [tiers, setTiers] = useState(() => + model.pricingTiers.map((t) => ({ + name: t.name, + isDefault: t.isDefault, + priority: t.priority, + conditions: (t.conditions 
?? []) as Array<{ + usageDetailPattern: string; + operator: string; + value: number; + }>, + prices: Object.fromEntries(t.prices.map((p) => [p.usageType, p.price])), + })) + ); + + // Test regex match + let testResult: boolean | null = null; + if (testInput) { + try { + const pattern = matchPattern.startsWith("(?i)") + ? matchPattern.slice(4) + : matchPattern; + testResult = new RegExp(pattern, "i").test(testInput); + } catch { + testResult = null; + } + } + + return ( +
+
+
+

{model.modelName}

+
+ + {model.source ?? "default"} + + + Back to list + +
+
+ +
+ + + +
+ {/* Model fields */} +
+ + setModelName(e.target.value)} + variant="medium" + fullWidth + /> +
+ +
+ + setMatchPattern(e.target.value)} + variant="medium" + fullWidth + className="font-mono text-xs" + /> +
+ + {/* Test pattern */} +
+ +
+ setTestInput(e.target.value)} + placeholder="Type a model name to test..." + variant="medium" + fullWidth + /> + {testInput && ( + + {testResult ? "Match" : "No match"} + + )} +
+
+ + {/* Pricing tiers */} +
+
+ + +
+ + {tiers.map((tier, tierIdx) => ( + { + const next = [...tiers]; + next[tierIdx] = updated; + setTiers(next); + }} + onRemove={() => setTiers(tiers.filter((_, i) => i !== tierIdx))} + /> + ))} +
+ + {actionData?.error && ( +
+ {actionData.error} + {actionData.details && ( +
+                    {JSON.stringify(actionData.details, null, 2)}
+                  
+ )} +
+ )} + + {/* Actions */} +
+ + + Cancel + +
+
+
+ + {/* Delete section */} +
+
{ + if (!confirm(`Delete model "${model.modelName}"?`)) e.preventDefault(); + }}> + + +
+
+
+
+ ); +} + +// --------------------------------------------------------------------------- +// Tier editor sub-component +// --------------------------------------------------------------------------- + +type TierData = { + name: string; + isDefault: boolean; + priority: number; + conditions: Array<{ usageDetailPattern: string; operator: string; value: number }>; + prices: Record; +}; + +const COMMON_USAGE_TYPES = [ + "input", + "output", + "input_cached_tokens", + "cache_creation_input_tokens", + "reasoning_tokens", +]; + +function TierEditor({ + tier, + onChange, + onRemove, +}: { + tier: TierData; + onChange: (t: TierData) => void; + onRemove: () => void; +}) { + const [newUsageType, setNewUsageType] = useState(""); + + return ( +
+
+
+ onChange({ ...tier, name: e.target.value })} + placeholder="Tier name" + /> + + +
+ +
+ + {/* Prices */} +
+ + Prices (per token) + +
+ {Object.entries(tier.prices).map(([usageType, price]) => ( +
+ {usageType} + { + const val = parseFloat(e.target.value); + if (!isNaN(val)) { + onChange({ + ...tier, + prices: { ...tier.prices, [usageType]: val }, + }); + } + }} + /> + +
+ ))} +
+ + {/* Add price */} +
+ + {newUsageType && ( + + )} +
+
+
+ ); +} diff --git a/apps/webapp/app/routes/admin.llm-models._index.tsx b/apps/webapp/app/routes/admin.llm-models._index.tsx new file mode 100644 index 00000000000..fb2f6fdc491 --- /dev/null +++ b/apps/webapp/app/routes/admin.llm-models._index.tsx @@ -0,0 +1,346 @@ +import { MagnifyingGlassIcon } from "@heroicons/react/20/solid"; +import { Form, useFetcher, Link } from "@remix-run/react"; +import type { ActionFunctionArgs, LoaderFunctionArgs } from "@remix-run/server-runtime"; +import { redirect } from "@remix-run/server-runtime"; +import { typedjson, useTypedLoaderData } from "remix-typedjson"; +import { z } from "zod"; +import { Button, LinkButton } from "~/components/primitives/Buttons"; +import { Input } from "~/components/primitives/Input"; +import { PaginationControls } from "~/components/primitives/Pagination"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import { + Table, + TableBlankRow, + TableBody, + TableCell, + TableHeader, + TableHeaderCell, + TableRow, +} from "~/components/primitives/Table"; +import { prisma } from "~/db.server"; +import { requireUserId } from "~/services/session.server"; +import { createSearchParams } from "~/utils/searchParams"; +import { seedLlmPricing } from "@internal/llm-pricing"; +import { llmPricingRegistry } from "~/v3/llmPricingRegistry.server"; + +const PAGE_SIZE = 50; + +const SearchParams = z.object({ + page: z.coerce.number().optional(), + search: z.string().optional(), +}); + +export const loader = async ({ request }: LoaderFunctionArgs) => { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + const searchParams = createSearchParams(request.url, SearchParams); + if (!searchParams.success) throw new Error(searchParams.error); + const { page: rawPage, search } = searchParams.params.getAll(); + const page = rawPage ?? 1; + + const where = { + projectId: null as string | null, + ...(search ? 
{ modelName: { contains: search, mode: "insensitive" as const } } : {}), + }; + + const [rawModels, total] = await Promise.all([ + prisma.llmModel.findMany({ + where, + include: { + pricingTiers: { include: { prices: true }, orderBy: { priority: "asc" } }, + }, + orderBy: { modelName: "asc" }, + skip: (page - 1) * PAGE_SIZE, + take: PAGE_SIZE, + }), + prisma.llmModel.count({ where }), + ]); + + // Convert Prisma Decimal to plain numbers for serialization + const models = rawModels.map((m) => ({ + ...m, + pricingTiers: m.pricingTiers.map((t) => ({ + ...t, + prices: t.prices.map((p) => ({ ...p, price: Number(p.price) })), + })), + })); + + return typedjson({ + models, + total, + page, + pageCount: Math.ceil(total / PAGE_SIZE), + filters: { search }, + }); +}; + +export async function action({ request }: ActionFunctionArgs) { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + const formData = await request.formData(); + const _action = formData.get("_action"); + + if (_action === "seed") { + console.log("[admin] seed action started"); + const result = await seedLlmPricing(prisma); + console.log(`[admin] seed complete: ${result.modelsCreated} created, ${result.modelsSkipped} skipped`); + await llmPricingRegistry?.reload(); + console.log("[admin] registry reloaded after seed"); + return typedjson({ + success: true, + message: `Seeded: ${result.modelsCreated} created, ${result.modelsSkipped} skipped`, + }); + } + + if (_action === "reload") { + console.log("[admin] reload action started"); + await llmPricingRegistry?.reload(); + console.log("[admin] registry reloaded"); + return typedjson({ success: true, message: "Registry reloaded" }); + } + + if (_action === "test") { + const modelString = formData.get("modelString"); + if (typeof modelString !== "string" || !modelString) { + return typedjson({ testResult: null }); + } + + // Use the registry's match() 
which handles prefix stripping automatically + const matched = llmPricingRegistry?.match(modelString) ?? null; + + return typedjson({ + testResult: { + modelString, + match: matched + ? { friendlyId: matched.friendlyId, modelName: matched.modelName } + : null, + }, + }); + } + + if (_action === "delete") { + const modelId = formData.get("modelId"); + if (typeof modelId === "string") { + await prisma.llmModel.delete({ where: { id: modelId } }); + await llmPricingRegistry?.reload(); + } + return typedjson({ success: true }); + } + + return typedjson({ error: "Unknown action" }, { status: 400 }); +} + +export default function AdminLlmModelsRoute() { + const { models, filters, page, pageCount, total } = + useTypedLoaderData(); + const seedFetcher = useFetcher(); + const reloadFetcher = useFetcher(); + const testFetcher = useFetcher<{ + testResult?: { + modelString: string; + match: { friendlyId: string; modelName: string } | null; + } | null; + }>(); + + const testResult = testFetcher.data?.testResult; + + return ( +
+
+
+
+ + +
+ +
+ + + + + + + + + + + + Missing models + + + + Add model + +
+
+ + {/* Model tester */} +
+ + + + + + + {testResult !== undefined && testResult !== null && ( +
+ + Testing: {testResult.modelString} + + {testResult.match ? ( +
+ Match:{" "} + + {testResult.match.modelName} + +
+ ) : ( +
+ No match found — this model has no pricing data +
+ )} +
+ )} +
+ +
+ + {total} global models (page {page} of {pageCount}) + + +
+ + + + + Model Name + Source + Input $/tok + Output $/tok + Other prices + + + + {models.length === 0 ? ( + + No models found + + ) : ( + models.map((model) => { + // Get default tier prices + const defaultTier = + model.pricingTiers.find((t) => t.isDefault) ?? model.pricingTiers[0]; + const priceMap = defaultTier + ? Object.fromEntries(defaultTier.prices.map((p) => [p.usageType, p.price])) + : {}; + const inputPrice = priceMap["input"]; + const outputPrice = priceMap["output"]; + const otherPrices = defaultTier + ? defaultTier.prices.filter( + (p) => p.usageType !== "input" && p.usageType !== "output" + ) + : []; + + return ( + + + + {model.modelName} + + + + + {model.source ?? "default"} + + + + + {inputPrice != null ? formatPrice(inputPrice) : "-"} + + + + + {outputPrice != null ? formatPrice(outputPrice) : "-"} + + + + {otherPrices.length > 0 ? ( + p.usageType).join(", ")}> + +{otherPrices.length} more + + ) : ( + - + )} + + + ); + }) + )} + +
+ + +
+
+ ); +} + +/** Format a per-token price as $/M tokens for readability */ +function formatPrice(perToken: number): string { + const perMillion = perToken * 1_000_000; + if (perMillion >= 1) return `$${perMillion.toFixed(2)}/M`; + if (perMillion >= 0.01) return `$${perMillion.toFixed(4)}/M`; + return `$${perMillion.toFixed(6)}/M`; +} diff --git a/apps/webapp/app/routes/admin.llm-models.missing.$model.tsx b/apps/webapp/app/routes/admin.llm-models.missing.$model.tsx new file mode 100644 index 00000000000..78cb1c4fc91 --- /dev/null +++ b/apps/webapp/app/routes/admin.llm-models.missing.$model.tsx @@ -0,0 +1,469 @@ +import { useState } from "react"; +import type { LoaderFunctionArgs } from "@remix-run/server-runtime"; +import { redirect } from "@remix-run/server-runtime"; +import { typedjson, useTypedLoaderData } from "remix-typedjson"; +import { Button, LinkButton } from "~/components/primitives/Buttons"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import { prisma } from "~/db.server"; +import { requireUserId } from "~/services/session.server"; +import { + getMissingModelSamples, + type MissingModelSample, +} from "~/services/admin/missingLlmModels.server"; + +export const loader = async ({ request, params }: LoaderFunctionArgs) => { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + // Model name is URL-encoded in the URL param + const modelName = decodeURIComponent(params.model ?? ""); + if (!modelName) throw new Response("Missing model param", { status: 400 }); + + const url = new URL(request.url); + const lookbackHours = parseInt(url.searchParams.get("lookbackHours") ?? "24", 10); + + let samples: MissingModelSample[] = []; + let error: string | undefined; + + try { + samples = await getMissingModelSamples({ model: modelName, lookbackHours, limit: 10 }); + } catch (e) { + error = e instanceof Error ? 
e.message : "Failed to query ClickHouse"; + } + + return typedjson({ modelName, samples, lookbackHours, error }); +}; + +export default function AdminMissingModelDetailRoute() { + const { modelName, samples, lookbackHours, error } = useTypedLoaderData(); + const [copied, setCopied] = useState(false); + const [expandedSpans, setExpandedSpans] = useState>(new Set()); + + const providerCosts = extractProviderCosts(samples); + const prompt = buildPrompt(modelName, samples, providerCosts); + + function handleCopy() { + navigator.clipboard.writeText(prompt).then(() => { + setCopied(true); + setTimeout(() => setCopied(false), 2000); + }); + } + + function toggleSpan(spanId: string) { + setExpandedSpans((prev) => { + const next = new Set(prev); + if (next.has(spanId)) next.delete(spanId); + else next.add(spanId); + return next; + }); + } + + // Extract key token fields from the first sample for quick summary + const tokenSummary = samples.length > 0 ? extractTokenTypes(samples) : []; + + return ( +
+
+ {/* Header */} +
+
+

{modelName}

+ + Missing pricing — {samples.length} sample span{samples.length !== 1 ? "s" : ""} from + last {lookbackHours}h + +
+
+ + Add pricing + + + Back to missing + +
+
+ + {error && ( +
+ {error} +
+ )} + + {/* Token types summary */} + {tokenSummary.length > 0 && ( +
+ + Token types seen across samples + +
+ {tokenSummary.map((t) => ( + + {t.key} + + {t.min === t.max ? t.min.toLocaleString() : `${t.min.toLocaleString()}-${t.max.toLocaleString()}`} + + + ))} +
+ + These are the token usage types that need pricing entries (at minimum: input, output). + +
+ )} + + {/* Provider-reported costs */} + {providerCosts.length > 0 && ( +
+ + Provider-reported cost data found in {providerCosts.length} span{providerCosts.length !== 1 ? "s" : ""} + +
+ {providerCosts.map((c, i) => ( +
+ {c.source} + ${c.cost.toFixed(6)} + + ({c.inputTokens.toLocaleString()} in + {c.outputTokens.toLocaleString()} out) + +
+ ))} +
+ {providerCosts[0]?.estimatedInputPrice != null && ( +
+ + Estimated per-token rates (assuming ~3x output/input ratio): + +
+ input: {providerCosts[0].estimatedInputPrice.toExponential(4)} + output: {(providerCosts[0].estimatedOutputPrice ?? 0).toExponential(4)} +
+ + Cross-reference with the provider's pricing page before using these estimates. + +
+ )} +
+ )} + + {/* Prompt section */} +
+
+ + Claude Code prompt — paste this to have it add pricing for this model + + +
+
+            {prompt}
+          
+
+ + {/* Sample spans */} +
+ + Sample spans ({samples.length}) + + {samples.map((s) => { + const expanded = expandedSpans.has(s.span_id); + let parsedAttrs: Record | null = null; + try { + parsedAttrs = JSON.parse(s.attributes_text) as Record; + } catch { + // ignore + } + + return ( +
+ + {expanded && parsedAttrs && ( +
+
+                      {JSON.stringify(parsedAttrs, null, 2)}
+                    
+
+ )} +
+ ); + })} +
+
+
+ ); +} + +// --------------------------------------------------------------------------- +// Extract unique token usage types across all samples +// --------------------------------------------------------------------------- + +type TokenTypeSummary = { key: string; min: number; max: number }; + +function extractTokenTypes(samples: MissingModelSample[]): TokenTypeSummary[] { + const stats = new Map(); + + for (const s of samples) { + let attrs: Record; + try { + attrs = JSON.parse(s.attributes_text) as Record; + } catch { + continue; + } + + // Collect from gen_ai.usage.* + const genAiUsage = getNestedObj(attrs, ["gen_ai", "usage"]); + if (genAiUsage) { + for (const [k, v] of Object.entries(genAiUsage)) { + if (typeof v === "number" && v > 0) { + const existing = stats.get(`gen_ai.usage.${k}`); + if (existing) { + existing.min = Math.min(existing.min, v); + existing.max = Math.max(existing.max, v); + } else { + stats.set(`gen_ai.usage.${k}`, { min: v, max: v }); + } + } + } + } + + // Collect from ai.usage.* + const aiUsage = getNestedObj(attrs, ["ai", "usage"]); + if (aiUsage) { + for (const [k, v] of Object.entries(aiUsage)) { + if (typeof v === "number" && v > 0) { + const existing = stats.get(`ai.usage.${k}`); + if (existing) { + existing.min = Math.min(existing.min, v); + existing.max = Math.max(existing.max, v); + } else { + stats.set(`ai.usage.${k}`, { min: v, max: v }); + } + } + } + } + } + + return Array.from(stats.entries()) + .map(([key, { min, max }]) => ({ key, min, max })) + .sort((a, b) => a.key.localeCompare(b.key)); +} + +function getNestedObj( + obj: Record, + path: string[] +): Record | null { + let current: unknown = obj; + for (const key of path) { + if (!current || typeof current !== "object") return null; + current = (current as Record)[key]; + } + return current && typeof current === "object" ? 
(current as Record) : null; +} + +// --------------------------------------------------------------------------- +// Extract provider-reported costs from providerMetadata +// --------------------------------------------------------------------------- + +type ProviderCostInfo = { + source: string; // "gateway" or "openrouter" + cost: number; + inputTokens: number; + outputTokens: number; + estimatedInputPrice?: number; // per-token estimate + estimatedOutputPrice?: number; // per-token estimate +}; + +function extractProviderCosts(samples: MissingModelSample[]): ProviderCostInfo[] { + const costs: ProviderCostInfo[] = []; + + for (const s of samples) { + let attrs: Record; + try { + attrs = JSON.parse(s.attributes_text) as Record; + } catch { + continue; + } + + // Parse providerMetadata — could be nested or stringified + let providerMeta: Record | null = null; + const aiResponse = getNestedObj(attrs, ["ai", "response"]); + const rawMeta = aiResponse?.providerMetadata; + if (typeof rawMeta === "string") { + try { providerMeta = JSON.parse(rawMeta) as Record; } catch {} + } else if (rawMeta && typeof rawMeta === "object") { + providerMeta = rawMeta as Record; + } + if (!providerMeta) continue; + + // Get token counts + const genAiUsage = getNestedObj(attrs, ["gen_ai", "usage"]); + const inputTokens = Number(genAiUsage?.input_tokens ?? 0); + const outputTokens = Number(genAiUsage?.output_tokens ?? 0); + if (inputTokens === 0 && outputTokens === 0) continue; + + // Gateway: { gateway: { cost: "0.0006615" } } + const gw = getNestedObj(providerMeta, ["gateway"]); + if (gw) { + const cost = parseFloat(String(gw.cost ?? "0")); + if (cost > 0) { + costs.push({ source: "gateway", cost, inputTokens, outputTokens }); + continue; + } + } + + // OpenRouter: { openrouter: { usage: { cost: 0.000135 } } } + const or = getNestedObj(providerMeta, ["openrouter"]); + const orUsage = or ? getNestedObj(or, ["usage"]) : null; + if (orUsage) { + const cost = Number(orUsage.cost ?? 
0); + if (cost > 0) { + costs.push({ source: "openrouter", cost, inputTokens, outputTokens }); + continue; + } + } + } + + // Estimate per-token prices from aggregate costs if we have enough data + if (costs.length > 0) { + // Use least-squares to estimate input/output price from cost = input*pi + output*po + // With 2+ samples we can solve; with 1 we can only estimate a blended rate + const totalInput = costs.reduce((s, c) => s + c.inputTokens, 0); + const totalOutput = costs.reduce((s, c) => s + c.outputTokens, 0); + const totalCost = costs.reduce((s, c) => s + c.cost, 0); + + if (totalInput > 0 && totalOutput > 0) { + // Simple approach: assume output is 2-5x input price (common ratio) + // Use ratio r where output_price = r * input_price + // totalCost = input_price * (totalInput + r * totalOutput) + // Try r=3 (common for many models) + const r = 3; + const estimatedInputPrice = totalCost / (totalInput + r * totalOutput); + const estimatedOutputPrice = estimatedInputPrice * r; + + for (const c of costs) { + c.estimatedInputPrice = estimatedInputPrice; + c.estimatedOutputPrice = estimatedOutputPrice; + } + } + } + + return costs; +} + +// --------------------------------------------------------------------------- +// Prompt builder — focused on figuring out pricing, not API mechanics +// --------------------------------------------------------------------------- + +function buildPrompt(modelName: string, samples: MissingModelSample[], providerCosts: ProviderCostInfo[]): string { + const hasPrefix = modelName.includes("/"); + const prefix = hasPrefix ? modelName.split("/")[0] : null; + const baseName = hasPrefix ? modelName.split("/").slice(1).join("/") : modelName; + + // Extract token types from samples + const tokenTypes = extractTokenTypes(samples); + const tokenTypeList = tokenTypes.length > 0 + ? tokenTypes.map((t) => ` - ${t.key}: ${t.min === t.max ? 
t.min : `${t.min}-${t.max}`}`).join("\n") + : " (no token data found in samples)"; + + // Get a compact sample of attributes for context + let sampleAttrs = ""; + if (samples.length > 0) { + try { + const attrs = JSON.parse(samples[0].attributes_text) as Record; + const ai = attrs.ai as Record | undefined; + const aiResponse = (ai?.response ?? {}) as Record; + // Extract just the relevant fields + const compact: Record = {}; + if (attrs.gen_ai) compact.gen_ai = attrs.gen_ai; + if (ai?.usage) compact["ai.usage"] = ai.usage; + if (aiResponse.providerMetadata) { + compact["ai.response.providerMetadata"] = aiResponse.providerMetadata; + } + sampleAttrs = JSON.stringify(compact, null, 2); + } catch { + // ignore + } + } + + // Build suggested regex + const escapedBase = baseName.replace(/[.*+?^${}()|[\]\\]/g, "\\$&"); + const suggestedPattern = prefix + ? `(?i)^(${prefix.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")}/)?(${escapedBase})$` + : `(?i)^(${escapedBase})$`; + + return `I need to add LLM pricing for the model "${modelName}". + +## Model info +- Full model string from spans: \`${modelName}\` +- Base model name: \`${baseName}\`${prefix ? `\n- Provider prefix: \`${prefix}\`` : ""} +- This model appears in production spans but has no pricing data. + +## Token types seen in spans +${tokenTypeList} + +## What I need you to do + +1. **Look up pricing**: Find the current per-token pricing for \`${baseName}\` from the provider's official pricing page. Search the web if needed. + +2. **Present the pricing to me** in the following format so I can review before adding: + +\`\`\` +Model name: ${baseName} +Match pattern: ${suggestedPattern} +Pricing tier: Standard + +Prices (per token): + input: + output: + (add any additional token types if applicable) +\`\`\` + +**IMPORTANT: Do NOT call the admin API or create the model yourself.** Just research the pricing and present it to me. I will add it via the admin dashboard or ask you to proceed once I've reviewed. 
+ +## Pricing research notes + +- All prices should be in **cost per token** (NOT per million). To convert: divide $/M by 1,000,000. + - Example: $3.00/M tokens = 0.000003 per token +- The \`matchPattern\` regex should match the model name both with and without the provider prefix. + - Suggested: \`${suggestedPattern}\` + - This matches both \`${baseName}\` and \`${modelName}\` +- Based on the token types seen in spans, check if the provider charges differently for: + - \`input\` and \`output\` — always required + - \`input_cached_tokens\` — if the provider offers prompt caching discounts + - \`cache_creation_input_tokens\` — if there's a cache write cost + - \`reasoning_tokens\` — if the model has chain-of-thought/reasoning tokens${providerCosts.length > 0 ? ` + +## Provider-reported costs (from ${providerCosts[0].source}) +The gateway/router is reporting costs for this model. Use these to cross-reference your pricing: +${providerCosts.map((c) => `- $${c.cost.toFixed(6)} for ${c.inputTokens.toLocaleString()} input + ${c.outputTokens.toLocaleString()} output tokens`).join("\n")}${providerCosts[0].estimatedInputPrice != null ? ` +- Estimated per-token rates (rough, assuming ~3x output/input ratio): + - input: ${providerCosts[0].estimatedInputPrice.toExponential(4)} (${(providerCosts[0].estimatedInputPrice * 1_000_000).toFixed(4)} $/M) + - output: ${(providerCosts[0].estimatedOutputPrice ?? 0).toExponential(4)} (${((providerCosts[0].estimatedOutputPrice ?? 0) * 1_000_000).toFixed(4)} $/M) +- Verify these against the official pricing page before using.` : ""}` : ""}${sampleAttrs ? 
` + +## Sample span attributes (first span) +\`\`\`json +${sampleAttrs} +\`\`\`` : ""}`; +} diff --git a/apps/webapp/app/routes/admin.llm-models.missing._index.tsx b/apps/webapp/app/routes/admin.llm-models.missing._index.tsx new file mode 100644 index 00000000000..fd933cd22e9 --- /dev/null +++ b/apps/webapp/app/routes/admin.llm-models.missing._index.tsx @@ -0,0 +1,158 @@ +import { useSearchParams } from "@remix-run/react"; +import type { LoaderFunctionArgs } from "@remix-run/server-runtime"; +import { redirect } from "@remix-run/server-runtime"; +import { typedjson, useTypedLoaderData } from "remix-typedjson"; +import { z } from "zod"; +import { LinkButton } from "~/components/primitives/Buttons"; +import { Paragraph } from "~/components/primitives/Paragraph"; +import { + Table, + TableBlankRow, + TableBody, + TableCell, + TableHeader, + TableHeaderCell, + TableRow, +} from "~/components/primitives/Table"; +import { prisma } from "~/db.server"; +import { requireUserId } from "~/services/session.server"; +import { getMissingLlmModels } from "~/services/admin/missingLlmModels.server"; + +const LOOKBACK_OPTIONS = [ + { label: "1 hour", value: 1 }, + { label: "6 hours", value: 6 }, + { label: "24 hours", value: 24 }, + { label: "7 days", value: 168 }, + { label: "30 days", value: 720 }, +]; + +const SearchParams = z.object({ + lookbackHours: z.coerce.number().optional(), +}); + +export const loader = async ({ request }: LoaderFunctionArgs) => { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + const url = new URL(request.url); + const lookbackHours = parseInt(url.searchParams.get("lookbackHours") ?? "24", 10); + + let models: Awaited> = []; + let error: string | undefined; + + try { + models = await getMissingLlmModels({ lookbackHours }); + } catch (e) { + error = e instanceof Error ? 
e.message : "Failed to query ClickHouse"; + } + + return typedjson({ models, lookbackHours, error }); +}; + +export default function AdminLlmModelsMissingRoute() { + const { models, lookbackHours, error } = useTypedLoaderData(); + const [searchParams, setSearchParams] = useSearchParams(); + + return ( +
+
+
+

Missing LLM Models

+ + Back to models + +
+ + + Models appearing in spans without cost enrichment. These models need pricing data added. + + + {/* Lookback selector */} +
+ Lookback: + {LOOKBACK_OPTIONS.map((opt) => ( + + {opt.label} + + ))} +
+ + {error && ( +
+ {error} +
+ )} + + + {models.length} unpriced model{models.length !== 1 ? "s" : ""} found in the last{" "} + {lookbackHours < 24 + ? `${lookbackHours}h` + : lookbackHours < 168 + ? `${lookbackHours / 24}d` + : `${Math.round(lookbackHours / 24)}d`} + + + + + + Model Name + Provider + Span Count + Actions + + + + {models.length === 0 ? ( + + All models have pricing data + + ) : ( + models.map((m) => ( + + )) + )} + +
+
+
+ ); +} + +// --------------------------------------------------------------------------- +// Row component with link to detail page +// --------------------------------------------------------------------------- + +function MissingModelRow({ model: m }: { model: { model: string; system: string; count: number } }) { + return ( + + + + {m.model} + + + + {m.system || "-"} + + + {m.count.toLocaleString()} + + + + Details + + + + ); +} diff --git a/apps/webapp/app/routes/admin.llm-models.new.tsx b/apps/webapp/app/routes/admin.llm-models.new.tsx new file mode 100644 index 00000000000..20c6e1461f2 --- /dev/null +++ b/apps/webapp/app/routes/admin.llm-models.new.tsx @@ -0,0 +1,397 @@ +import { Form, useActionData, useSearchParams } from "@remix-run/react"; +import type { ActionFunctionArgs, LoaderFunctionArgs } from "@remix-run/server-runtime"; +import { redirect } from "@remix-run/server-runtime"; +import { typedjson } from "remix-typedjson"; +import { z } from "zod"; +import { useState } from "react"; +import { Button, LinkButton } from "~/components/primitives/Buttons"; +import { Input } from "~/components/primitives/Input"; +import { prisma } from "~/db.server"; +import { requireUserId } from "~/services/session.server"; +import { generateFriendlyId } from "~/v3/friendlyIdentifiers"; +import { llmPricingRegistry } from "~/v3/llmPricingRegistry.server"; + +export const loader = async ({ request }: LoaderFunctionArgs) => { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + return typedjson({}); +}; + +const CreateSchema = z.object({ + modelName: z.string().min(1), + matchPattern: z.string().min(1), + pricingTiersJson: z.string(), +}); + +export async function action({ request }: ActionFunctionArgs) { + const userId = await requireUserId(request); + const user = await prisma.user.findUnique({ where: { id: userId } }); + if (!user?.admin) throw redirect("/"); + + 
const formData = await request.formData(); + const raw = Object.fromEntries(formData); + console.log("[admin] create model form data:", JSON.stringify(raw).slice(0, 500)); + const parsed = CreateSchema.safeParse(raw); + + if (!parsed.success) { + console.log("[admin] create model validation error:", JSON.stringify(parsed.error.issues)); + return typedjson({ error: "Invalid form data", details: parsed.error.issues }, { status: 400 }); + } + + const { modelName, matchPattern, pricingTiersJson } = parsed.data; + + // Validate regex — strip (?i) POSIX flag since our registry handles it + try { + const testPattern = matchPattern.startsWith("(?i)") ? matchPattern.slice(4) : matchPattern; + new RegExp(testPattern); + } catch { + return typedjson({ error: "Invalid regex in matchPattern" }, { status: 400 }); + } + + let pricingTiers: Array<{ + name: string; + isDefault: boolean; + priority: number; + conditions: Array<{ usageDetailPattern: string; operator: string; value: number }>; + prices: Record; + }>; + try { + pricingTiers = JSON.parse(pricingTiersJson) as typeof pricingTiers; + } catch { + return typedjson({ error: "Invalid pricing tiers JSON" }, { status: 400 }); + } + + const model = await prisma.llmModel.create({ + data: { + friendlyId: generateFriendlyId("llm_model"), + modelName, + matchPattern, + source: "admin", + }, + }); + + for (const tier of pricingTiers) { + await prisma.llmPricingTier.create({ + data: { + modelId: model.id, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: { + create: Object.entries(tier.prices).map(([usageType, price]) => ({ + modelId: model.id, + usageType, + price, + })), + }, + }, + }); + } + + await llmPricingRegistry?.reload(); + return redirect(`/admin/llm-models/${model.friendlyId}`); +} + +export default function AdminLlmModelNewRoute() { + const actionData = useActionData<{ error?: string; details?: unknown[] }>(); + const [params] = useSearchParams(); + const 
initialModelName = params.get("modelName") ?? ""; + const [modelName, setModelName] = useState(initialModelName); + const [matchPattern, setMatchPattern] = useState(""); + const [testInput, setTestInput] = useState(""); + const [tiers, setTiers] = useState([ + { name: "Standard", isDefault: true, priority: 0, conditions: [], prices: { input: 0, output: 0 } }, + ]); + + let testResult: boolean | null = null; + if (testInput && matchPattern) { + try { + const pattern = matchPattern.startsWith("(?i)") + ? matchPattern.slice(4) + : matchPattern; + testResult = new RegExp(pattern, "i").test(testInput); + } catch { + testResult = null; + } + } + + // Auto-generate match pattern from model name + function autoPattern() { + if (modelName) { + const escaped = modelName.replace(/[.*+?^${}()|[\]\\]/g, "\\$&"); + setMatchPattern(`(?i)^(${escaped})$`); + } + } + + return ( +
+
+
+

New LLM Model

+ + Back to list + +
+ +
+ + +
+
+ + setModelName(e.target.value)} + variant="medium" + fullWidth + placeholder="e.g. gemini-3-flash" + /> +
+ +
+
+ + +
+ setMatchPattern(e.target.value)} + variant="medium" + fullWidth + className="font-mono text-xs" + placeholder="(?i)^(google/)?(gemini-3-flash)$" + /> +
+ +
+ +
+ setTestInput(e.target.value)} + placeholder="Type a model name to test..." + variant="medium" + fullWidth + /> + {testInput && ( + + {testResult ? "Match" : "No match"} + + )} +
+
+ + {/* Pricing tiers */} +
+
+ + +
+ + {tiers.map((tier, tierIdx) => ( + { + const next = [...tiers]; + next[tierIdx] = updated; + setTiers(next); + }} + onRemove={() => setTiers(tiers.filter((_, i) => i !== tierIdx))} + /> + ))} +
+ + {actionData?.error && ( +
+ {actionData.error} + {actionData.details && ( +
+                    {JSON.stringify(actionData.details, null, 2)}
+                  
+ )} +
+ )} + +
+ + + Cancel + +
+
+
+
+
+ ); +} + +// --------------------------------------------------------------------------- +// Shared tier editor (duplicated from detail page — could be extracted later) +// --------------------------------------------------------------------------- + +type TierData = { + name: string; + isDefault: boolean; + priority: number; + conditions: Array<{ usageDetailPattern: string; operator: string; value: number }>; + prices: Record; +}; + +const COMMON_USAGE_TYPES = [ + "input", + "output", + "input_cached_tokens", + "cache_creation_input_tokens", + "reasoning_tokens", +]; + +function TierEditor({ + tier, + onChange, + onRemove, +}: { + tier: TierData; + onChange: (t: TierData) => void; + onRemove: () => void; +}) { + const [newUsageType, setNewUsageType] = useState(""); + + return ( +
+
+
+ onChange({ ...tier, name: e.target.value })} + placeholder="Tier name" + /> + + +
+ +
+ +
+ Prices (per token) +
+ {Object.entries(tier.prices).map(([usageType, price]) => ( +
+ {usageType} + { + const val = parseFloat(e.target.value); + if (!isNaN(val)) { + onChange({ ...tier, prices: { ...tier.prices, [usageType]: val } }); + } + }} + /> + +
+ ))} +
+ +
+ + {newUsageType && ( + + )} +
+
+
+ ); +} diff --git a/apps/webapp/app/routes/admin.tsx b/apps/webapp/app/routes/admin.tsx index ac8e56c855e..34792e66ee5 100644 --- a/apps/webapp/app/routes/admin.tsx +++ b/apps/webapp/app/routes/admin.tsx @@ -32,6 +32,10 @@ export default function Page() { label: "Concurrency", to: "/admin/concurrency", }, + { + label: "LLM Models", + to: "/admin/llm-models", + }, ]} layoutId={"admin"} /> diff --git a/apps/webapp/app/routes/resources.metric.tsx b/apps/webapp/app/routes/resources.metric.tsx index 3c19d3947f9..60d83f7a600 100644 --- a/apps/webapp/app/routes/resources.metric.tsx +++ b/apps/webapp/app/routes/resources.metric.tsx @@ -44,6 +44,7 @@ const MetricWidgetQuery = z.object({ to: z.string().nullable(), taskIdentifiers: z.array(z.string()).optional(), queues: z.array(z.string()).optional(), + responseModels: z.array(z.string()).optional(), tags: z.array(z.string()).optional(), }); @@ -74,6 +75,7 @@ export const action = async ({ request }: ActionFunctionArgs) => { to, taskIdentifiers, queues, + responseModels, tags, } = submission.data; @@ -107,6 +109,7 @@ export const action = async ({ request }: ActionFunctionArgs) => { to, taskIdentifiers, queues, + responseModels, // Set higher concurrency if many widgets are on screen at once customOrgConcurrencyLimit: env.METRIC_WIDGET_DEFAULT_ORG_CONCURRENCY_LIMIT, }); @@ -257,6 +260,7 @@ export function MetricWidget({ props.scope, JSON.stringify(props.taskIdentifiers), JSON.stringify(props.queues), + JSON.stringify(props.responseModels), ]); const data = response?.success diff --git a/apps/webapp/app/routes/resources.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam.spans.$spanParam/route.tsx b/apps/webapp/app/routes/resources.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam.spans.$spanParam/route.tsx index e46eaa5148f..8f7ae61b5d5 100644 --- 
a/apps/webapp/app/routes/resources.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam.spans.$spanParam/route.tsx +++ b/apps/webapp/app/routes/resources.orgs.$organizationSlug.projects.$projectParam.env.$envParam.runs.$runParam.spans.$spanParam/route.tsx @@ -19,7 +19,7 @@ import { taskRunErrorEnhancer, } from "@trigger.dev/core/v3"; import { assertNever } from "assert-never"; -import { useEffect } from "react"; +import { useEffect, useState } from "react"; import { typedjson, useTypedFetcher } from "remix-typedjson"; import { ExitIcon } from "~/assets/icons/ExitIcon"; import { FlagIcon } from "~/assets/icons/RegionIcons"; @@ -60,6 +60,7 @@ import { RunIcon } from "~/components/runs/v3/RunIcon"; import { RunTag } from "~/components/runs/v3/RunTag"; import { TruncatedCopyableValue } from "~/components/primitives/TruncatedCopyableValue"; import { SpanEvents } from "~/components/runs/v3/SpanEvents"; +import { AISpanDetails } from "~/components/runs/v3/ai"; import { SpanTitle } from "~/components/runs/v3/SpanTitle"; import { TaskRunAttemptStatusCombo } from "~/components/runs/v3/TaskRunAttemptStatus"; import { @@ -252,6 +253,8 @@ function SpanBody({ span = applySpanOverrides(span, spanOverrides); + const isAiGeneration = span.entity?.type === "ai-generation"; + return (
@@ -276,9 +279,13 @@ function SpanBody({ /> )}
-
+ {isAiGeneration ? ( -
+ ) : ( +
+ +
+ )}
); } @@ -1155,6 +1162,35 @@ function RunError({ error }: { error: TaskRunError }) { } } +function CollapsibleProperties({ code }: { code: string }) { + const [open, setOpen] = useState(false); + return ( +
+ + {open && ( +
+ +
+ )} +
+ ); +} + function SpanEntity({ span }: { span: Span }) { const isAdmin = useHasAdminAccess(); @@ -1352,6 +1388,14 @@ function SpanEntity({ span }: { span: Span }) { /> ); } + case "ai-generation": { + return ( + + ); + } default: { assertNever(span.entity); } diff --git a/apps/webapp/app/services/admin/missingLlmModels.server.ts b/apps/webapp/app/services/admin/missingLlmModels.server.ts new file mode 100644 index 00000000000..7ce6bc2ab7e --- /dev/null +++ b/apps/webapp/app/services/admin/missingLlmModels.server.ts @@ -0,0 +1,129 @@ +import { adminClickhouseClient } from "~/services/clickhouseInstance.server"; +import { llmPricingRegistry } from "~/v3/llmPricingRegistry.server"; + +export type MissingLlmModel = { + model: string; + system: string; + count: number; +}; + +export async function getMissingLlmModels(opts: { + lookbackHours?: number; +} = {}): Promise { + const lookbackHours = opts.lookbackHours ?? 24; + const since = new Date(Date.now() - lookbackHours * 60 * 60 * 1000); + + // queryBuilderFast returns a factory function — call it to get the builder + const createBuilder = adminClickhouseClient.reader.queryBuilderFast<{ + model: string; + system: string; + cnt: string; + }>({ + name: "missingLlmModels", + table: "trigger_dev.task_events_v2", + columns: [ + { name: "model", expression: "attributes.gen_ai.response.model.:String" }, + { name: "system", expression: "attributes.gen_ai.system.:String" }, + { name: "cnt", expression: "count()" }, + ], + }); + const qb = createBuilder(); + + // Partition pruning on inserted_at (partition key is toDate(inserted_at)) + qb.where("inserted_at >= {since: DateTime64(3)}", { + since: formatDateTime(since), + }); + + // Only spans that have a model set + qb.where("attributes.gen_ai.response.model.:String != {empty: String}", { empty: "" }); + + // Only spans that were NOT cost-enriched (trigger.llm.total_cost is NULL) + qb.where("attributes.trigger.llm.total_cost.:Float64 IS NULL", {}); + + // Only completed spans + 
qb.where("kind = {kind: String}", { kind: "SPAN" }); + qb.where("status = {status: String}", { status: "OK" }); + + qb.groupBy("model, system"); + qb.orderBy("cnt DESC"); + qb.limit(100); + + const [err, rows] = await qb.execute(); + + if (err) { + throw err; + } + + if (!rows) { + return []; + } + + const candidates = rows + .filter((r) => r.model) + .map((r) => ({ + model: r.model, + system: r.system, + count: parseInt(r.cnt, 10), + })); + + if (candidates.length === 0) return []; + + // Filter out models that now have pricing in the database (added after spans were inserted). + // The registry's match() handles prefix stripping for gateway/openrouter models. + if (!llmPricingRegistry || !llmPricingRegistry.isLoaded) return candidates; + const registry = llmPricingRegistry; + return candidates.filter((c) => !registry.match(c.model)); +} + +export type MissingModelSample = { + span_id: string; + run_id: string; + message: string; + attributes_text: string; + duration: string; + start_time: string; +}; + +export async function getMissingModelSamples(opts: { + model: string; + lookbackHours?: number; + limit?: number; +}): Promise { + const lookbackHours = opts.lookbackHours ?? 24; + const limit = opts.limit ?? 
10; + const since = new Date(Date.now() - lookbackHours * 60 * 60 * 1000); + + const createBuilder = adminClickhouseClient.reader.queryBuilderFast({ + name: "missingModelSamples", + table: "trigger_dev.task_events_v2", + columns: [ + "span_id", + "run_id", + "message", + "attributes_text", + "duration", + "start_time", + ], + }); + const qb = createBuilder(); + + qb.where("inserted_at >= {since: DateTime64(3)}", { since: formatDateTime(since) }); + qb.where("attributes.gen_ai.response.model.:String = {model: String}", { model: opts.model }); + qb.where("attributes.trigger.llm.total_cost.:Float64 IS NULL", {}); + qb.where("kind = {kind: String}", { kind: "SPAN" }); + qb.where("status = {status: String}", { status: "OK" }); + qb.orderBy("start_time DESC"); + qb.limit(limit); + + const [err, rows] = await qb.execute(); + + if (err) { + throw err; + } + + return rows ?? []; +} + +function formatDateTime(date: Date): string { + return date.toISOString().replace("T", " ").replace("Z", ""); +} diff --git a/apps/webapp/app/services/clickhouseInstance.server.ts b/apps/webapp/app/services/clickhouseInstance.server.ts index 61494811a0e..9c4941671f3 100644 --- a/apps/webapp/app/services/clickhouseInstance.server.ts +++ b/apps/webapp/app/services/clickhouseInstance.server.ts @@ -71,6 +71,34 @@ function initializeLogsClickhouseClient() { }); } +export const adminClickhouseClient = singleton( + "adminClickhouseClient", + initializeAdminClickhouseClient +); + +function initializeAdminClickhouseClient() { + if (!env.ADMIN_CLICKHOUSE_URL) { + throw new Error("ADMIN_CLICKHOUSE_URL is not set"); + } + + const url = new URL(env.ADMIN_CLICKHOUSE_URL); + url.searchParams.delete("secure"); + + return new ClickHouse({ + url: url.toString(), + name: "admin-clickhouse", + keepAlive: { + enabled: env.CLICKHOUSE_KEEP_ALIVE_ENABLED === "1", + idleSocketTtl: env.CLICKHOUSE_KEEP_ALIVE_IDLE_SOCKET_TTL_MS, + }, + logLevel: env.CLICKHOUSE_LOG_LEVEL, + compression: { + request: true, + }, + 
maxOpenConnections: env.CLICKHOUSE_MAX_OPEN_CONNECTIONS, + }); +} + export const queryClickhouseClient = singleton( "queryClickhouseClient", initializeQueryClickhouseClient diff --git a/apps/webapp/app/services/queryService.server.ts b/apps/webapp/app/services/queryService.server.ts index 6cd2af03b16..ce3444902d8 100644 --- a/apps/webapp/app/services/queryService.server.ts +++ b/apps/webapp/app/services/queryService.server.ts @@ -73,6 +73,8 @@ export type ExecuteQueryOptions = Omit< taskIdentifiers?: string[]; /** Filter to specific queues */ queues?: string[]; + /** Filter to specific response models */ + responseModels?: string[]; /** History options for saving query to billing/audit */ history?: { /** Where the query originated from */ @@ -127,6 +129,7 @@ export async function executeQuery( environmentId, taskIdentifiers, queues, + responseModels, history, customOrgConcurrencyLimit, ...baseOptions @@ -210,6 +213,10 @@ export async function executeQuery( ? { op: "in", values: taskIdentifiers } : undefined, queue: queues && queues.length > 0 ? { op: "in", values: queues } : undefined, + response_model: + responseModels && responseModels.length > 0 + ? 
{ op: "in", values: responseModels } + : undefined, } satisfies Record; // Compute the effective time range for timeBucket() interval calculation diff --git a/apps/webapp/app/tailwind.css b/apps/webapp/app/tailwind.css index 2e435a032b7..8ec29b91568 100644 --- a/apps/webapp/app/tailwind.css +++ b/apps/webapp/app/tailwind.css @@ -85,6 +85,10 @@ } @layer utilities { + .scrollbar-gutter-stable { + scrollbar-gutter: stable; + } + .animated-gradient-glow { position: relative; overflow: visible; diff --git a/apps/webapp/app/utils/columnFormat.ts b/apps/webapp/app/utils/columnFormat.ts index 731b42fdb9f..c11226123ab 100644 --- a/apps/webapp/app/utils/columnFormat.ts +++ b/apps/webapp/app/utils/columnFormat.ts @@ -39,6 +39,19 @@ export function formatQuantity(value: number): string { return value.toLocaleString(); } +/** + * Format a dollar amount with adaptive precision — avoids trailing zeros. + */ +function formatCostAdaptive(dollars: number): string { + if (dollars === 0) return "$0"; + const abs = Math.abs(dollars); + if (abs >= 1000) return `$${dollars.toFixed(2)}`; + if (abs >= 1) return `$${dollars.toFixed(2)}`; + if (abs >= 0.01) return `$${dollars.toFixed(4)}`; + if (abs >= 0.0001) return `$${dollars.toFixed(6)}`; + return formatCurrencyAccurate(dollars); +} + /** * Creates a value formatter function for a given column format type. * Used by chart tooltips, legend values, and big number cards. 
@@ -61,9 +74,9 @@ export function createValueFormatter( case "durationSeconds": return (v) => formatDurationMilliseconds(v * 1000, { style: "short" }); case "costInDollars": - return (v) => formatCurrencyAccurate(v); + return (v) => formatCostAdaptive(v); case "cost": - return (v) => formatCurrencyAccurate(v / 100); + return (v) => formatCostAdaptive(v / 100); default: return undefined; } diff --git a/apps/webapp/app/v3/eventRepository/clickhouseEventRepository.server.ts b/apps/webapp/app/v3/eventRepository/clickhouseEventRepository.server.ts index 9100ad84fec..de6d77835d0 100644 --- a/apps/webapp/app/v3/eventRepository/clickhouseEventRepository.server.ts +++ b/apps/webapp/app/v3/eventRepository/clickhouseEventRepository.server.ts @@ -1,5 +1,6 @@ import type { ClickHouse, + LlmMetricsV1Input, TaskEventDetailedSummaryV1Result, TaskEventDetailsV1Result, TaskEventSummaryV1Result, @@ -7,6 +8,7 @@ import type { TaskEventV2Input, } from "@internal/clickhouse"; import { Attributes, startSpan, trace, Tracer } from "@internal/tracing"; + import { createJsonErrorObject } from "@trigger.dev/core/v3/errors"; import { serializeTraceparent } from "@trigger.dev/core/v3/isomorphic"; import { @@ -84,6 +86,11 @@ export type ClickhouseEventRepositoryConfig = { * - "v2": Uses task_events_v2 (partitioned by inserted_at to avoid "too many parts" errors) */ version?: "v1" | "v2"; + /** LLM metrics flush scheduler config */ + llmMetricsBatchSize?: number; + llmMetricsFlushInterval?: number; + llmMetricsMaxBatchSize?: number; + llmMetricsMaxConcurrency?: number; }; /** @@ -94,6 +101,7 @@ export class ClickhouseEventRepository implements IEventRepository { private _clickhouse: ClickHouse; private _config: ClickhouseEventRepositoryConfig; private readonly _flushScheduler: DynamicFlushScheduler; + private readonly _llmMetricsFlushScheduler: DynamicFlushScheduler; private _tracer: Tracer; private _version: "v1" | "v2"; @@ -118,6 +126,17 @@ export class ClickhouseEventRepository implements 
IEventRepository { return event.kind === "DEBUG_EVENT"; }, }); + + this._llmMetricsFlushScheduler = new DynamicFlushScheduler({ + batchSize: config.llmMetricsBatchSize ?? 5000, + flushInterval: config.llmMetricsFlushInterval ?? 2000, + callback: this.#flushLlmMetricsBatch.bind(this), + minConcurrency: 1, + maxConcurrency: config.llmMetricsMaxConcurrency ?? 2, + maxBatchSize: config.llmMetricsMaxBatchSize ?? 10000, + memoryPressureThreshold: config.llmMetricsMaxBatchSize ?? 10000, + loadSheddingEnabled: false, + }); } get version() { @@ -216,6 +235,60 @@ export class ClickhouseEventRepository implements IEventRepository { }); } + async #flushLlmMetricsBatch(flushId: string, rows: LlmMetricsV1Input[]) { + + const [insertError] = await this._clickhouse.llmMetrics.insert(rows, { + params: { + clickhouse_settings: this.#getClickhouseInsertSettings(), + }, + }); + + if (insertError) { + throw insertError; + } + + logger.info("ClickhouseEventRepository.flushLlmMetricsBatch Inserted LLM metrics batch", { + rows: rows.length, + }); + } + + #createLlmMetricsInput(event: CreateEventInput): LlmMetricsV1Input { + const llmMetrics = event._llmMetrics!; + + return { + organization_id: event.organizationId, + project_id: event.projectId, + environment_id: event.environmentId, + run_id: event.runId, + task_identifier: event.taskSlug, + trace_id: event.traceId, + span_id: event.spanId, + gen_ai_system: llmMetrics.genAiSystem, + request_model: llmMetrics.requestModel, + response_model: llmMetrics.responseModel, + matched_model_id: llmMetrics.matchedModelId, + operation_id: llmMetrics.operationId, + finish_reason: llmMetrics.finishReason, + cost_source: llmMetrics.costSource, + pricing_tier_id: llmMetrics.pricingTierId, + pricing_tier_name: llmMetrics.pricingTierName, + input_tokens: llmMetrics.inputTokens, + output_tokens: llmMetrics.outputTokens, + total_tokens: llmMetrics.totalTokens, + usage_details: llmMetrics.usageDetails, + input_cost: llmMetrics.inputCost, + output_cost: 
llmMetrics.outputCost, + total_cost: llmMetrics.totalCost, + cost_details: llmMetrics.costDetails, + provider_cost: llmMetrics.providerCost, + ms_to_first_chunk: llmMetrics.msToFirstChunk, + tokens_per_second: llmMetrics.tokensPerSecond, + metadata: llmMetrics.metadata, + start_time: this.#clampAndFormatStartTime(event.startTime.toString()), + duration: formatClickhouseUnsignedIntegerString(event.duration ?? 0), + }; + } + #getClickhouseInsertSettings() { if (this._config.insertStrategy === "insert") { return {}; @@ -236,6 +309,15 @@ export class ClickhouseEventRepository implements IEventRepository { async insertMany(events: CreateEventInput[]): Promise { this.addToBatch(events.flatMap((event) => this.createEventToTaskEventV1Input(event))); + + // Dual-write LLM metrics records for spans with cost enrichment + const llmMetricsRows = events + .filter((e) => e._llmMetrics != null) + .map((e) => this.#createLlmMetricsInput(e)); + + if (llmMetricsRows.length > 0) { + this._llmMetricsFlushScheduler.addToBatch(llmMetricsRows); + } } async insertManyImmediate(events: CreateEventInput[]): Promise { @@ -1302,19 +1384,26 @@ export class ClickhouseEventRepository implements IEventRepository { } } - if ( - (span.properties == null || - (typeof span.properties === "object" && Object.keys(span.properties).length === 0)) && - typeof record.attributes_text === "string" - ) { - const parsedAttributes = this.#parseAttributes(record.attributes_text); - const resourceAttributes = parsedAttributes["$resource"]; - - // Remove the $resource key from the attributes - delete parsedAttributes["$resource"]; - - span.properties = parsedAttributes; - span.resourceProperties = resourceAttributes as Record | undefined; + // Parse attributes from the first record that has them, then re-parse for the + // completed SPAN record. The completed record's attributes are a superset of the + // partial's (includes enriched trigger.llm.* cost data added during ingestion). 
+ // This means at most 2x JSON.parse per span detail query, but only on this + // read path (span detail view), not on ingestion. + if (typeof record.attributes_text === "string") { + const shouldUpdate = + span.properties == null || + (typeof span.properties === "object" && Object.keys(span.properties).length === 0) || + (record.kind === "SPAN" && record.status !== "PARTIAL"); + + if (shouldUpdate) { + const parsedAttributes = this.#parseAttributes(record.attributes_text); + const resourceAttributes = parsedAttributes["$resource"]; + + delete parsedAttributes["$resource"]; + + span.properties = parsedAttributes; + span.resourceProperties = resourceAttributes as Record | undefined; + } } } @@ -1525,7 +1614,13 @@ export class ClickhouseEventRepository implements IEventRepository { } if (parsedMetadata && "style" in parsedMetadata && parsedMetadata.style) { - span.data.style = parsedMetadata.style as TaskEventStyle; + const newStyle = parsedMetadata.style as TaskEventStyle; + // Merge styles: prefer the most complete value for each field + span.data.style = { + icon: newStyle.icon ?? span.data.style.icon, + variant: newStyle.variant ?? span.data.style.variant, + accessory: newStyle.accessory ?? 
span.data.style.accessory, + }; } if (record.kind === "SPAN") { diff --git a/apps/webapp/app/v3/eventRepository/clickhouseEventRepositoryInstance.server.ts b/apps/webapp/app/v3/eventRepository/clickhouseEventRepositoryInstance.server.ts index 36fb13c6e96..d4e28c5841a 100644 --- a/apps/webapp/app/v3/eventRepository/clickhouseEventRepositoryInstance.server.ts +++ b/apps/webapp/app/v3/eventRepository/clickhouseEventRepositoryInstance.server.ts @@ -64,6 +64,10 @@ function initializeClickhouseRepository() { asyncInsertMaxDataSize: env.EVENTS_CLICKHOUSE_ASYNC_INSERT_MAX_DATA_SIZE, asyncInsertBusyTimeoutMs: env.EVENTS_CLICKHOUSE_ASYNC_INSERT_BUSY_TIMEOUT_MS, startTimeMaxAgeMs: env.EVENTS_CLICKHOUSE_START_TIME_MAX_AGE_MS, + llmMetricsBatchSize: env.LLM_METRICS_BATCH_SIZE, + llmMetricsFlushInterval: env.LLM_METRICS_FLUSH_INTERVAL_MS, + llmMetricsMaxBatchSize: env.LLM_METRICS_MAX_BATCH_SIZE, + llmMetricsMaxConcurrency: env.LLM_METRICS_MAX_CONCURRENCY, version: "v1", }); @@ -97,6 +101,10 @@ function initializeClickhouseRepositoryV2() { waitForAsyncInsert: env.EVENTS_CLICKHOUSE_WAIT_FOR_ASYNC_INSERT === "1", asyncInsertMaxDataSize: env.EVENTS_CLICKHOUSE_ASYNC_INSERT_MAX_DATA_SIZE, asyncInsertBusyTimeoutMs: env.EVENTS_CLICKHOUSE_ASYNC_INSERT_BUSY_TIMEOUT_MS, + llmMetricsBatchSize: env.LLM_METRICS_BATCH_SIZE, + llmMetricsFlushInterval: env.LLM_METRICS_FLUSH_INTERVAL_MS, + llmMetricsMaxBatchSize: env.LLM_METRICS_MAX_BATCH_SIZE, + llmMetricsMaxConcurrency: env.LLM_METRICS_MAX_CONCURRENCY, version: "v2", }); diff --git a/apps/webapp/app/v3/eventRepository/common.server.ts b/apps/webapp/app/v3/eventRepository/common.server.ts index 2e3bdf37c50..3ba8a50c7f7 100644 --- a/apps/webapp/app/v3/eventRepository/common.server.ts +++ b/apps/webapp/app/v3/eventRepository/common.server.ts @@ -140,7 +140,8 @@ export function createExceptionPropertiesFromError(error: TaskRunError): Excepti } } -// removes keys that start with a $ sign. 
If there are no keys left, return undefined +// Removes internal/private attribute keys from span properties. +// Filters: "$" prefixed keys (private metadata) and "ctx." prefixed keys (Trigger.dev run context) export function removePrivateProperties( attributes: Attributes | undefined | null ): Attributes | undefined { @@ -151,7 +152,7 @@ export function removePrivateProperties( const result: Attributes = {}; for (const [key, value] of Object.entries(attributes)) { - if (key.startsWith("$")) { + if (key.startsWith("$") || key.startsWith("ctx.")) { continue; } diff --git a/apps/webapp/app/v3/eventRepository/eventRepository.types.ts b/apps/webapp/app/v3/eventRepository/eventRepository.types.ts index 75664ad0525..fcef0010ee0 100644 --- a/apps/webapp/app/v3/eventRepository/eventRepository.types.ts +++ b/apps/webapp/app/v3/eventRepository/eventRepository.types.ts @@ -21,6 +21,30 @@ export type { ExceptionEventProperties }; // Event Creation Types // ============================================================================ +export type LlmMetricsData = { + genAiSystem: string; + requestModel: string; + responseModel: string; + matchedModelId: string; + operationId: string; + finishReason: string; + costSource: string; + pricingTierId: string; + pricingTierName: string; + inputTokens: number; + outputTokens: number; + totalTokens: number; + usageDetails: Record; + inputCost: number; + outputCost: number; + totalCost: number; + costDetails: Record; + providerCost: number; + msToFirstChunk: number; + tokensPerSecond: number; + metadata: Record; +}; + export type CreateEventInput = Omit< Prisma.TaskEventCreateInput, | "id" @@ -57,6 +81,9 @@ export type CreateEventInput = Omit< metadata: Attributes | undefined; style: Attributes | undefined; machineId?: string; + runTags?: string[]; + /** Side-channel data for LLM cost tracking, populated by enrichCreatableEvents */ + _llmMetrics?: LlmMetricsData; }; export type CreatableEventKind = TaskEventKind; diff --git 
a/apps/webapp/app/v3/llmPricingRegistry.server.ts b/apps/webapp/app/v3/llmPricingRegistry.server.ts new file mode 100644 index 00000000000..627609bb1d8 --- /dev/null +++ b/apps/webapp/app/v3/llmPricingRegistry.server.ts @@ -0,0 +1,62 @@ +import { ModelPricingRegistry, seedLlmPricing } from "@internal/llm-pricing"; +import { prisma, $replica } from "~/db.server"; +import { env } from "~/env.server"; +import { signalsEmitter } from "~/services/signals.server"; +import { singleton } from "~/utils/singleton"; +import { setLlmPricingRegistry } from "./utils/enrichCreatableEvents.server"; + +async function initRegistry(registry: ModelPricingRegistry) { + if (env.LLM_PRICING_SEED_ON_STARTUP) { + await seedLlmPricing(prisma); + } + + await registry.loadFromDatabase(); +} + +export const llmPricingRegistry = singleton("llmPricingRegistry", () => { + if (!env.LLM_COST_TRACKING_ENABLED) { + return null; + } + + const registry = new ModelPricingRegistry($replica); + + // Wire up the registry so enrichCreatableEvents can use it + setLlmPricingRegistry(registry); + + initRegistry(registry).catch((err) => { + console.error("Failed to initialize LLM pricing registry", err); + }); + + // Periodic reload + const reloadInterval = env.LLM_PRICING_RELOAD_INTERVAL_MS; + const interval = setInterval(() => { + registry.reload().catch((err) => { + console.error("Failed to reload LLM pricing registry", err); + }); + }, reloadInterval); + + signalsEmitter.on("SIGTERM", () => { + clearInterval(interval); + }); + signalsEmitter.on("SIGINT", () => { + clearInterval(interval); + }); + + return registry; +}); + +/** + * Wait for the LLM pricing registry to finish its initial load, with a timeout. + * After the first call resolves (or times out), subsequent calls are no-ops. 
+ */ +export async function waitForLlmPricingReady(): Promise { + if (!llmPricingRegistry || llmPricingRegistry.isLoaded) return; + + const timeoutMs = env.LLM_PRICING_READY_TIMEOUT_MS; + if (timeoutMs <= 0) return; + + await Promise.race([ + llmPricingRegistry.isReady, + new Promise((resolve) => setTimeout(resolve, timeoutMs)), + ]); +} diff --git a/apps/webapp/app/v3/otlpExporter.server.ts b/apps/webapp/app/v3/otlpExporter.server.ts index 837071b7de7..5fe2624557d 100644 --- a/apps/webapp/app/v3/otlpExporter.server.ts +++ b/apps/webapp/app/v3/otlpExporter.server.ts @@ -37,6 +37,7 @@ import type { } from "./eventRepository/eventRepository.types"; import { startSpan } from "./tracing.server"; import { enrichCreatableEvents } from "./utils/enrichCreatableEvents.server"; +import { waitForLlmPricingReady } from "./llmPricingRegistry.server"; import { env } from "~/env.server"; import { detectBadJsonStrings } from "~/utils/detectBadJsonStrings"; import { singleton } from "~/utils/singleton"; @@ -128,6 +129,7 @@ class OTLPExporter { for (const [store, events] of Object.entries(eventsGroupedByStore)) { const eventRepository = this.#getEventRepositoryForStore(store); + await waitForLlmPricingReady(); const enrichedEvents = enrichCreatableEvents(events); this.#logEventsVerbose(enrichedEvents, `exportEvents ${store}`); @@ -391,6 +393,8 @@ function convertSpansToCreateableEvents( SemanticInternalAttributes.METADATA ); + const runTags = extractArrayAttribute(span.attributes ?? [], SemanticInternalAttributes.RUN_TAGS); + const properties = truncateAttributes( convertKeyValueItemsToMap(span.attributes ?? [], [], undefined, [ @@ -439,6 +443,7 @@ function convertSpansToCreateableEvents( runId: spanProperties.runId ?? resourceProperties.runId ?? "unknown", taskSlug: spanProperties.taskSlug ?? resourceProperties.taskSlug ?? "unknown", machineId: spanProperties.machineId ?? resourceProperties.machineId, + runTags, attemptNumber: extractNumberAttribute( span.attributes ?? 
[], @@ -708,6 +713,8 @@ function convertKeyValueItemsToMap( ? attribute.value.boolValue : isBytesValue(attribute.value) ? binaryToHex(attribute.value.bytesValue) + : isArrayValue(attribute.value) + ? serializeArrayValue(attribute.value.arrayValue!.values) : undefined; return map; @@ -744,6 +751,8 @@ function convertSelectedKeyValueItemsToMap( ? attribute.value.boolValue : isBytesValue(attribute.value) ? binaryToHex(attribute.value.bytesValue) + : isArrayValue(attribute.value) + ? serializeArrayValue(attribute.value.arrayValue!.values) : undefined; return map; @@ -1000,6 +1009,21 @@ function extractBooleanAttribute( return isBoolValue(attribute?.value) ? attribute.value.boolValue : fallback; } +function extractArrayAttribute( + attributes: KeyValue[], + name: string | Array +): string[] | undefined { + const key = Array.isArray(name) ? name.filter(Boolean).join(".") : name; + + const attribute = attributes.find((attribute) => attribute.key === key); + + if (!attribute?.value?.arrayValue?.values) return undefined; + + return attribute.value.arrayValue.values + .filter((v): v is { stringValue: string } => isStringValue(v)) + .map((v) => v.stringValue); +} + function isPartialSpan(span: Span): boolean { if (!span.attributes) return false; @@ -1042,6 +1066,31 @@ function isBytesValue(value: AnyValue | undefined): value is { bytesValue: Buffe return Buffer.isBuffer(value.bytesValue); } +function isArrayValue( + value: AnyValue | undefined +): value is { arrayValue: { values: AnyValue[] } } { + if (!value) return false; + + return value.arrayValue != null && Array.isArray(value.arrayValue.values); +} + +/** + * Serialize an OTEL array value into a JSON string. + * For arrays of strings, produces a JSON array: `["item1","item2"]` + * For mixed types, extracts primitives and serializes. 
+ */ +function serializeArrayValue(values: AnyValue[]): string { + const items = values.map((v) => { + if (isStringValue(v)) return v.stringValue; + if (isIntValue(v)) return Number(v.intValue); + if (isDoubleValue(v)) return v.doubleValue; + if (isBoolValue(v)) return v.boolValue; + return null; + }); + + return JSON.stringify(items); +} + function binaryToHex(buffer: Buffer | string): string; function binaryToHex(buffer: Buffer | string | undefined): string | undefined; function binaryToHex(buffer: Buffer | string | undefined): string | undefined { diff --git a/apps/webapp/app/v3/querySchemas.ts b/apps/webapp/app/v3/querySchemas.ts index 53c3be60fa2..6a6c8758fdb 100644 --- a/apps/webapp/app/v3/querySchemas.ts +++ b/apps/webapp/app/v3/querySchemas.ts @@ -599,7 +599,240 @@ export const metricsSchema: TableSchema = { /** * All available schemas for the query editor */ -export const querySchemas: TableSchema[] = [runsSchema, metricsSchema]; +/** + * Schema definition for the llm_metrics table (trigger_dev.llm_metrics_v1) + */ +export const llmMetricsSchema: TableSchema = { + name: "llm_metrics", + clickhouseName: "trigger_dev.llm_metrics_v1", + description: "LLM metrics: token usage, cost, performance, and behavior from GenAI spans", + timeConstraint: "start_time", + tenantColumns: { + organizationId: "organization_id", + projectId: "project_id", + environmentId: "environment_id", + }, + columns: { + environment: { + name: "environment", + clickhouseName: "environment_id", + ...column("String", { description: "The environment slug", example: "prod" }), + fieldMapping: "environment", + customRenderType: "environment", + }, + project: { + name: "project", + clickhouseName: "project_id", + ...column("String", { + description: "The project reference, they always start with `proj_`.", + example: "proj_howcnaxbfxdmwmxazktx", + }), + fieldMapping: "project", + customRenderType: "project", + }, + run_id: { + name: "run_id", + ...column("String", { + description: "The run 
ID", + customRenderType: "runId", + coreColumn: true, + }), + }, + task_identifier: { + name: "task_identifier", + ...column("LowCardinality(String)", { + description: "The task identifier", + example: "my-task", + coreColumn: true, + }), + }, + gen_ai_system: { + name: "gen_ai_system", + ...column("LowCardinality(String)", { + description: "AI provider (e.g. openai, anthropic)", + example: "openai", + coreColumn: true, + }), + }, + request_model: { + name: "request_model", + ...column("String", { + description: "The model name requested", + example: "gpt-4o", + }), + }, + response_model: { + name: "response_model", + ...column("String", { + description: "The model name returned by the provider", + example: "gpt-4o-2024-08-06", + coreColumn: true, + }), + }, + operation_id: { + name: "operation_id", + ...column("LowCardinality(String)", { + description: "Operation type (e.g. ai.streamText.doStream, ai.generateText.doGenerate)", + example: "ai.streamText.doStream", + }), + }, + finish_reason: { + name: "finish_reason", + ...column("LowCardinality(String)", { + description: "Why the LLM stopped generating (e.g. stop, tool-calls, length)", + example: "stop", + coreColumn: true, + }), + }, + cost_source: { + name: "cost_source", + ...column("LowCardinality(String)", { + description: "Where cost data came from (registry, gateway, openrouter)", + example: "registry", + }), + }, + input_tokens: { + name: "input_tokens", + ...column("UInt64", { + description: "Number of input tokens", + example: "702", + }), + }, + output_tokens: { + name: "output_tokens", + ...column("UInt64", { + description: "Number of output tokens", + example: "22", + }), + }, + total_tokens: { + name: "total_tokens", + ...column("UInt64", { + description: "Total token count", + example: "724", + }), + }, + cached_read_tokens: { + name: "cached_read_tokens", + ...column("UInt64", { + description: + "Input tokens served from the provider's prompt cache (cheaper than regular input tokens). 
Supported by Anthropic and OpenAI.", + example: "8200", + }), + expression: "usage_details['input_cached_tokens']", + }, + cache_creation_tokens: { + name: "cache_creation_tokens", + ...column("UInt64", { + description: + "Input tokens written to create a new prompt cache entry. Supported by Anthropic.", + example: "1751", + }), + expression: "usage_details['cache_creation_input_tokens']", + }, + reasoning_tokens: { + name: "reasoning_tokens", + ...column("UInt64", { + description: + "Tokens used for chain-of-thought reasoning (e.g. OpenAI o-series, DeepSeek R1). These count toward output but are not visible in the response.", + example: "512", + }), + expression: "usage_details['reasoning_tokens']", + }, + input_cost: { + name: "input_cost", + ...column("Decimal64(12)", { + description: "Input cost in USD (from pricing registry)", + customRenderType: "costInDollars", + }), + }, + output_cost: { + name: "output_cost", + ...column("Decimal64(12)", { + description: "Output cost in USD (from pricing registry)", + customRenderType: "costInDollars", + }), + }, + total_cost: { + name: "total_cost", + ...column("Decimal64(12)", { + description: "Total cost in USD", + customRenderType: "costInDollars", + coreColumn: true, + }), + }, + cached_read_cost: { + name: "cached_read_cost", + ...column("Decimal64(12)", { + description: + "Cost of cached input tokens (discounted vs regular input). 
Only present when the pricing tier has a separate cached input price.", + customRenderType: "costInDollars", + }), + expression: "cost_details['input_cached_tokens']", + }, + cache_creation_cost: { + name: "cache_creation_cost", + ...column("Decimal64(12)", { + description: "Cost of tokens written to create a prompt cache entry.", + customRenderType: "costInDollars", + }), + expression: "cost_details['cache_creation_input_tokens']", + }, + provider_cost: { + name: "provider_cost", + ...column("Decimal64(12)", { + description: "Provider-reported cost in USD (from gateway or openrouter)", + customRenderType: "costInDollars", + }), + }, + ms_to_first_chunk: { + name: "ms_to_first_chunk", + ...column("Float64", { + description: "Time to first chunk in milliseconds (TTFC)", + example: "245.3", + coreColumn: true, + }), + }, + tokens_per_second: { + name: "tokens_per_second", + ...column("Float64", { + description: "Average output tokens per second", + example: "72.5", + }), + }, + pricing_tier_name: { + name: "pricing_tier_name", + ...column("LowCardinality(String)", { + description: "The matched pricing tier name", + example: "Standard", + }), + }, + start_time: { + name: "start_time", + ...column("DateTime64(9)", { + description: "When the LLM call started", + coreColumn: true, + }), + }, + duration: { + name: "duration", + ...column("UInt64", { + description: "Span duration in nanoseconds", + customRenderType: "durationNs", + }), + }, + metadata: { + name: "metadata", + ...column("Map(LowCardinality(String), String)", { + description: + "Key-value metadata from run tags (key:value format) and AI SDK telemetry metadata. 
Access keys with dot notation (metadata.userId) or bracket syntax (metadata['userId']).", + example: "{'userId':'user_123','org':'acme'}", + }), + }, + }, +}; + +export const querySchemas: TableSchema[] = [runsSchema, metricsSchema, llmMetricsSchema]; /** * Default query for the query editor diff --git a/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts b/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts index f718c13d2dd..06458c396f9 100644 --- a/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts +++ b/apps/webapp/app/v3/utils/enrichCreatableEvents.server.ts @@ -1,4 +1,30 @@ -import type { CreateEventInput } from "../eventRepository/eventRepository.types"; +import type { CreateEventInput, LlmMetricsData } from "../eventRepository/eventRepository.types"; + +// Registry interface — matches ModelPricingRegistry from @internal/llm-pricing +type CostRegistry = { + isLoaded: boolean; + calculateCost( + responseModel: string, + usageDetails: Record + ): { + matchedModelId: string; + matchedModelName: string; + pricingTierId: string; + pricingTierName: string; + inputCost: number; + outputCost: number; + totalCost: number; + costDetails: Record; + } | null; +}; + +let _registry: CostRegistry | undefined; + +const ENRICHABLE_KINDS = new Set(["INTERNAL", "SERVER", "CLIENT", "CONSUMER", "PRODUCER"]); + +export function setLlmPricingRegistry(registry: CostRegistry): void { + _registry = registry; +} export function enrichCreatableEvents(events: CreateEventInput[]) { return events.map((event) => { @@ -12,9 +38,205 @@ function enrichCreatableEvent(event: CreateEventInput): CreateEventInput { event.message = message; event.style = enrichStyle(event); + enrichLlmMetrics(event); + return event; } +function enrichLlmMetrics(event: CreateEventInput): void { + const props = event.properties; + if (!props) return; + + // Only enrich span-like events (INTERNAL, SERVER, CLIENT, CONSUMER, PRODUCER — not LOG, UNSPECIFIED) + if (!ENRICHABLE_KINDS.has(event.kind as 
string)) return; + + // Skip partial spans (they don't have final token counts) + if (event.isPartial) return; + + // Only use gen_ai.* attributes for model resolution to avoid double-counting. + // The Vercel AI SDK emits both a parent span (ai.streamText with ai.usage.*) + // and a child span (ai.streamText.doStream with gen_ai.*). We only enrich the + // child span that has the canonical gen_ai.response.model attribute. + const responseModel = + typeof props["gen_ai.response.model"] === "string" + ? props["gen_ai.response.model"] + : typeof props["gen_ai.request.model"] === "string" + ? props["gen_ai.request.model"] + : null; + + if (!responseModel) { + return; + } + + // Extract usage details, normalizing attribute names + const usageDetails = extractUsageDetails(props); + + // Need at least some token usage + const hasTokens = Object.values(usageDetails).some((v) => v > 0); + if (!hasTokens) { + return; + } + + // Add style accessories for model and tokens (even without cost data) + const inputTokens = usageDetails["input"] ?? 0; + const outputTokens = usageDetails["output"] ?? 0; + const totalTokens = usageDetails["total"] ?? inputTokens + outputTokens; + + const pillItems: Array<{ text: string; icon: string }> = [ + { text: responseModel, icon: "tabler-cube" }, + { text: formatTokenCount(totalTokens), icon: "tabler-hash" }, + ]; + + // Try cost enrichment if the registry is loaded. + // The registry handles prefix stripping (e.g. "mistral/mistral-large-3" → "mistral-large-3") + // for gateway/openrouter models automatically in its match() method. 
+ let cost: ReturnType["calculateCost"]> | null = null; + if (_registry?.isLoaded) { + cost = _registry.calculateCost(responseModel, usageDetails); + } + + // Fallback: extract cost from provider metadata (gateway/openrouter report per-request cost) + let providerCost: { totalCost: number; source: string } | null = null; + if (!cost) { + providerCost = extractProviderCost(props); + } + + if (cost) { + // Add trigger.llm.* attributes to the span from our pricing registry + event.properties = { + ...props, + "trigger.llm.input_cost": cost.inputCost, + "trigger.llm.output_cost": cost.outputCost, + "trigger.llm.total_cost": cost.totalCost, + "trigger.llm.matched_model": cost.matchedModelName, + "trigger.llm.matched_model_id": cost.matchedModelId, + "trigger.llm.pricing_tier": cost.pricingTierName, + "trigger.llm.pricing_tier_id": cost.pricingTierId, + }; + + pillItems.push({ text: formatCost(cost.totalCost), icon: "tabler-currency-dollar" }); + } else if (providerCost) { + // Use provider-reported cost as fallback (no input/output breakdown available) + event.properties = { + ...props, + "trigger.llm.total_cost": providerCost.totalCost, + "trigger.llm.cost_source": providerCost.source, + }; + + pillItems.push({ text: formatCost(providerCost.totalCost), icon: "tabler-currency-dollar" }); + } + + event.style = { + ...(event.style as Record | undefined), + accessory: { + style: "pills", + items: pillItems, + }, + } as unknown as typeof event.style; + + // Only write llm_metrics when cost data is available + if (!cost && !providerCost) return; + + // Build metadata map from run tags and ai.telemetry.metadata.* + const metadata: Record = {}; + + if (event.runTags) { + for (const tag of event.runTags) { + const colonIdx = tag.indexOf(":"); + if (colonIdx > 0) { + metadata[tag.substring(0, colonIdx)] = tag.substring(colonIdx + 1); + } + } + } + + for (const [key, value] of Object.entries(props)) { + if (key.startsWith("ai.telemetry.metadata.") && typeof value === "string") { 
+      metadata[key.slice("ai.telemetry.metadata.".length)] = value;
+    }
+  }
+
+  // Extract new performance/behavioral fields
+  // NOTE(review): per the OTel GenAI semantic conventions, gen_ai.response.finish_reasons
+  // is a string[] — a string-typed read here may never match; confirm how attributes are
+  // flattened upstream before relying on this fallback.
+  const finishReason = typeof props["ai.response.finishReason"] === "string"
+    ? props["ai.response.finishReason"]
+    : typeof props["gen_ai.response.finish_reasons"] === "string"
+      ? props["gen_ai.response.finish_reasons"]
+      : "";
+  const operationId = typeof props["ai.operationId"] === "string"
+    ? props["ai.operationId"]
+    : typeof props["gen_ai.operation.name"] === "string"
+      ? props["gen_ai.operation.name"]
+      : typeof props["operation.name"] === "string"
+        ? props["operation.name"]
+        : "";
+  const msToFirstChunk = typeof props["ai.response.msToFirstChunk"] === "number"
+    ? props["ai.response.msToFirstChunk"]
+    : 0;
+  const avgTokensPerSec = typeof props["ai.response.avgOutputTokensPerSecond"] === "number"
+    ? props["ai.response.avgOutputTokensPerSecond"]
+    : 0;
+  // Registry-computed cost wins over provider-reported cost for attribution.
+  const costSource = cost ? "registry" : providerCost ? providerCost.source : "";
+  const providerCostValue = providerCost?.totalCost ?? 0;
+
+  // Set _llmMetrics side-channel for dual-write to llm_metrics_v1
+  const llmMetrics: LlmMetricsData = {
+    genAiSystem: typeof props["gen_ai.system"] === "string" ? props["gen_ai.system"] : "unknown",
+    requestModel: typeof props["gen_ai.request.model"] === "string" ? props["gen_ai.request.model"] : responseModel,
+    responseModel,
+    matchedModelId: cost?.matchedModelId ?? "",
+    operationId,
+    finishReason,
+    costSource,
+    pricingTierId: cost?.pricingTierId ?? (providerCost ? `provider:${providerCost.source}` : ""),
+    pricingTierName: cost?.pricingTierName ?? (providerCost ? `${providerCost.source} reported` : ""),
+    inputTokens: usageDetails["input"] ?? 0,
+    outputTokens: usageDetails["output"] ?? 0,
+    totalTokens: usageDetails["total"] ?? (usageDetails["input"] ?? 0) + (usageDetails["output"] ?? 0),
+    usageDetails,
+    inputCost: cost?.inputCost ?? 0,
+    outputCost: cost?.outputCost ?? 0,
+    totalCost: cost?.totalCost ?? providerCost?.totalCost ?? 0,
+    costDetails: cost?.costDetails ?? {},
+    providerCost: providerCostValue,
+    msToFirstChunk,
+    tokensPerSecond: avgTokensPerSec,
+    metadata,
+  };
+
+  event._llmMetrics = llmMetrics;
+}
+
+// NOTE(review): generic type arguments (e.g. Record<string, ...>) appear to have been
+// stripped from this patch rendering; verify the parameter/return types against the
+// original file before applying.
+function extractUsageDetails(props: Record): Record {
+  const details: Record = {};
+
+  // Only map gen_ai.usage.* attributes — NOT ai.usage.* from parent spans.
+  // This prevents double-counting when both parent (ai.streamText) and child
+  // (ai.streamText.doStream) spans carry token counts.
+  const mappings: Record = {
+    "gen_ai.usage.input_tokens": "input",
+    "gen_ai.usage.output_tokens": "output",
+    "gen_ai.usage.prompt_tokens": "input",
+    "gen_ai.usage.completion_tokens": "output",
+    "gen_ai.usage.total_tokens": "total",
+    "gen_ai.usage.cache_read_input_tokens": "input_cached_tokens",
+    "gen_ai.usage.input_tokens_cache_read": "input_cached_tokens",
+    "gen_ai.usage.cache_creation_input_tokens": "cache_creation_input_tokens",
+    "gen_ai.usage.input_tokens_cache_write": "cache_creation_input_tokens",
+    "gen_ai.usage.reasoning_tokens": "reasoning_tokens",
+  };
+
+  for (const [attrKey, usageKey] of Object.entries(mappings)) {
+    const value = props[attrKey];
+    if (typeof value === "number" && value > 0) {
+      // Don't overwrite if already set (first mapping wins)
+      if (details[usageKey] === undefined) {
+        details[usageKey] = value;
+      }
+    }
+  }
+
+  return details;
+}
+
 function enrichStyle(event: CreateEventInput) {
   const baseStyle = event.style ?? {};
   const props = event.properties;
@@ -23,11 +245,16 @@ function enrichStyle(event: CreateEventInput) {
     return baseStyle;
   }
 
-  // Direct property access and early returns
-  // GenAI System check
   const system = props["gen_ai.system"];
-  if (typeof system === "string") {
-    return { ...baseStyle, icon: `tabler-brand-${system.split(".")[0]}` };
+  const modelId = props["gen_ai.request.model"] ?? props["ai.model.id"];
+
+  const provider = resolveAiProvider(
+    typeof system === "string" ? system : undefined,
+    typeof modelId === "string" ? modelId : undefined
+  );
+
+  if (provider) {
+    return { ...baseStyle, icon: `ai-provider-${provider}` };
   }
 
   // Agent workflow check
@@ -39,16 +266,69 @@
   const message = event.message;
 
   if (typeof message === "string" && message === "ai.toolCall") {
-    return { ...baseStyle, icon: "tabler-tool" };
+    return { ...baseStyle, icon: "hero-wrench" };
   }
 
   if (typeof message === "string" && message.startsWith("ai.")) {
-    return { ...baseStyle, icon: "tabler-sparkles" };
+    return { ...baseStyle, icon: "hero-sparkles" };
   }
 
   return baseStyle;
 }
 
+// NOTE(review): values just under a unit boundary (e.g. 999,950–999,999) render as
+// "1000.0k" because toFixed rounds after the division; cosmetic only.
+function formatTokenCount(tokens: number): string {
+  if (tokens >= 1_000_000) return `${(tokens / 1_000_000).toFixed(1)}M`;
+  if (tokens >= 1_000) return `${(tokens / 1_000).toFixed(1)}k`;
+  return tokens.toString();
+}
+
+/**
+ * Extract provider-reported cost from ai.response.providerMetadata.
+ * Gateway and OpenRouter include per-request cost in their metadata.
+ */
+function extractProviderCost(
+  props: Record
+): { totalCost: number; source: string } | null {
+  const rawMeta = props["ai.response.providerMetadata"];
+  if (typeof rawMeta !== "string") return null;
+
+  let meta: Record;
+  try {
+    meta = JSON.parse(rawMeta) as Record;
+  } catch {
+    return null;
+  }
+
+  if (!meta || typeof meta !== "object") return null;
+
+  // Gateway: { gateway: { cost: "0.0006615" } }
+  // Cost arrives as a string; parseFloat of malformed input yields NaN, which the
+  // `> 0` guard filters out.
+  const gateway = meta.gateway;
+  if (gateway && typeof gateway === "object") {
+    const gw = gateway as Record;
+    const cost = parseFloat(String(gw.cost ?? "0"));
+    if (cost > 0) return { totalCost: cost, source: "gateway" };
+  }
+
+  // OpenRouter: { openrouter: { usage: { cost: 0.000135 } } }
+  const openrouter = meta.openrouter;
+  if (openrouter && typeof openrouter === "object") {
+    const or = openrouter as Record;
+    const usage = or.usage;
+    if (usage && typeof usage === "object") {
+      const cost = Number((usage as Record).cost ?? 0);
+      if (cost > 0) return { totalCost: cost, source: "openrouter" };
+    }
+  }
+
+  return null;
+}
+
+// Three precision tiers so sub-cent LLM costs stay legible.
+function formatCost(cost: number): string {
+  if (cost >= 1) return `$${cost.toFixed(2)}`;
+  if (cost >= 0.01) return `$${cost.toFixed(4)}`;
+  return `$${cost.toFixed(6)}`;
+}
+
 function repr(value: any): string {
   if (typeof value === "string") {
     return `'${value}'`;
@@ -79,3 +359,65 @@ function formatPythonStyle(template: string, values: Record): strin
     return hasRepr ? repr(value) : String(value);
   });
 }
+
+type AiProvider =
+  | "anthropic"
+  | "openai"
+  | "gemini"
+  | "llama"
+  | "deepseek"
+  | "xai"
+  | "perplexity"
+  | "cerebras"
+  | "azure"
+  | "mistral";
+
+const systemToProvider: Record = {
+  anthropic: "anthropic",
+  openai: "openai",
+  azure: "azure",
+  "google.generative-ai": "gemini",
+  google: "gemini",
+  xai: "xai",
+  deepseek: "deepseek",
+  cerebras: "cerebras",
+  perplexity: "perplexity",
+  "meta-llama": "llama",
+  mistral: "mistral",
+};
+
+const modelPatterns: [RegExp, AiProvider][] = [
+  [/\banthropic\b|claude/i, "anthropic"],
+  [/\bopenai\b|gpt-|o[134]-|chatgpt/i, "openai"],
+  [/gemini/i, "gemini"],
+  [/llama/i, "llama"],
+  [/deepseek/i, "deepseek"],
+  [/grok/i, "xai"],
+  [/sonar/i, "perplexity"],
+  [/cerebras/i, "cerebras"],
+  [/mistral|mixtral|codestral|pixtral/i, "mistral"],
+];
+
+// Model-id evidence (slash-prefix lookup, then regex patterns) takes precedence over
+// gen_ai.system; the system string falls back to a raw lookup, then a lowercased
+// dot-normalized lookup (e.g. "openai.responses" -> "openai").
+function resolveAiProvider(
+  system: string | undefined,
+  modelId: string | undefined
+): AiProvider | undefined {
+  if (modelId) {
+    if (modelId.includes("/")) {
+      const prefix = modelId.split("/")[0].toLowerCase();
+      const fromPrefix = systemToProvider[prefix];
+      if (fromPrefix) return fromPrefix;
+    }
+
+    for (const [pattern, provider] of modelPatterns) {
+      if (pattern.test(modelId)) return provider;
+    }
+  }
+
+  if (system) {
+    const normalized = system.toLowerCase().split(".")[0];
+    return systemToProvider[system] ?? systemToProvider[normalized];
+  }
+
+  return undefined;
+}
diff --git a/apps/webapp/package.json b/apps/webapp/package.json
index 139a0ce2d0d..48994376066 100644
--- a/apps/webapp/package.json
+++ b/apps/webapp/package.json
@@ -16,6 +16,7 @@
     "start:local": "cross-env node --max-old-space-size=8192 ./build/server.js",
     "typecheck": "cross-env NODE_OPTIONS=\"--max-old-space-size=8192\" tsc --noEmit -p ./tsconfig.check.json",
     "db:seed": "tsx seed.mts",
+    "db:seed:ai-spans": "tsx seed-ai-spans.mts",
     "upload:sourcemaps": "bash ./upload-sourcemaps.sh",
     "test": "vitest --no-file-parallelism",
     "eval:dev": "evalite watch"
@@ -56,6 +57,7 @@
     "@heroicons/react": "^2.0.12",
     "@jsonhero/schema-infer": "^0.1.5",
     "@internal/cache": "workspace:*",
+    "@internal/llm-pricing": "workspace:*",
     "@internal/redis": "workspace:*",
     "@internal/run-engine": "workspace:*",
     "@internal/schedule-engine": "workspace:*",
diff --git a/apps/webapp/seed-ai-spans.mts b/apps/webapp/seed-ai-spans.mts
new file mode 100644
index 00000000000..35ec3d5851e
--- /dev/null
+++ b/apps/webapp/seed-ai-spans.mts
@@ -0,0 +1,1797 @@
+import { prisma } from "./app/db.server";
+import { createOrganization } from "./app/models/organization.server";
+import { createProject } from "./app/models/project.server";
+import { ClickHouse } from "@internal/clickhouse";
+import type { TaskEventV2Input, LlmMetricsV1Input } from "@internal/clickhouse";
+import {
+  generateTraceId,
+  generateSpanId,
+} from "./app/v3/eventRepository/common.server";
+import {
+  enrichCreatableEvents,
+  setLlmPricingRegistry,
+} from "./app/v3/utils/enrichCreatableEvents.server";
+import { ModelPricingRegistry, seedLlmPricing } from "@internal/llm-pricing";
+import { nanoid } from "nanoid";
+import { unflattenAttributes } from "@trigger.dev/core/v3/utils/flattenAttributes";
+import type { Attributes } from "@opentelemetry/api";
+import type { CreateEventInput } from "./app/v3/eventRepository/eventRepository.types";
+
+const ORG_TITLE = "AI Spans Dev";
+const PROJECT_NAME = "ai-chat-demo";
+const TASK_SLUG = "ai-chat";
+const QUEUE_NAME = "task/ai-chat";
+const WORKER_VERSION = "seed-ai-spans-v1";
+
+const SEED_USER_IDS = [
+  "user_alice", "user_bob", "user_carol", "user_dave",
+  "user_eve", "user_frank", "user_grace", "user_heidi",
+  "user_ivan", "user_judy", "user_karl", "user_liam",
+];
+
+function randomUserId(): string {
+  return SEED_USER_IDS[Math.floor(Math.random() * SEED_USER_IDS.length)];
+}
+
+// ---------------------------------------------------------------------------
+// ClickHouse formatting helpers (replicated from clickhouseEventRepository)
+// ---------------------------------------------------------------------------
+
+// Converts a 19-digit nanosecond epoch into ClickHouse's "seconds.fraction"
+// string; other lengths pass through unchanged.
+function formatStartTime(startTimeNs: bigint): string {
+  const str = startTimeNs.toString();
+  if (str.length !== 19) return str;
+  return str.substring(0, 10) + "." + str.substring(10);
+}
+
+// Negative durations clamp to "0"; bigint values are stringified as-is,
+// numbers are floored. (bigint/number relational comparison is valid TS.)
+function formatDuration(value: number | bigint): string {
+  if (value < 0) return "0";
+  if (typeof value === "bigint") return value.toString();
+  return Math.floor(value).toString();
+}
+
+function formatClickhouseDateTime(date: Date): string {
+  return date.toISOString().replace("T", " ").replace("Z", "");
+}
+
+// Drops $-prefixed internal and ctx.* attributes; returns undefined when
+// nothing remains so callers can skip empty attribute maps.
+function removePrivateProperties(attributes: Attributes): Attributes | undefined {
+  const result: Attributes = {};
+  for (const [key, value] of Object.entries(attributes)) {
+    if (key.startsWith("$") || key.startsWith("ctx.")) continue;
+    result[key] = value;
+  }
+  return Object.keys(result).length === 0 ? undefined : result;
+}
+
+function eventToClickhouseRow(event: CreateEventInput): TaskEventV2Input {
+  // kind
+  let kind: string;
+  if (event.kind === "UNSPECIFIED") kind = "ANCESTOR_OVERRIDE";
+  else if (event.level === "TRACE") kind = "SPAN";
+  else if (event.isDebug) kind = "DEBUG_EVENT";
+  else kind = `LOG_${(event.level ?? "LOG").toString().toUpperCase()}`;
+
+  // status
+  let status: string;
+  if (event.isPartial) status = "PARTIAL";
+  else if (event.isError) status = "ERROR";
+  else if (event.isCancelled) status = "CANCELLED";
+  else status = "OK";
+
+  // attributes
+  const publicAttrs = removePrivateProperties(event.properties as Attributes);
+  const unflattened = publicAttrs ? unflattenAttributes(publicAttrs) : {};
+  const attributes =
+    unflattened && typeof unflattened === "object" ? { ...unflattened } : {};
+
+  // metadata — mirrors createEventToTaskEventV1InputMetadata
+  const metadataObj: Record = {};
+  if (event.style) {
+    metadataObj.style = unflattenAttributes(event.style as Attributes);
+  }
+  if (event.attemptNumber) {
+    metadataObj.attemptNumber = event.attemptNumber;
+  }
+  // Extract entity from properties (SemanticInternalAttributes)
+  const entityType = event.properties?.["$entity.type"];
+  if (typeof entityType === "string") {
+    metadataObj.entity = {
+      entityType,
+      entityId: event.properties?.["$entity.id"] as string | undefined,
+      entityMetadata: event.properties?.["$entity.metadata"] as string | undefined,
+    };
+  }
+  const metadata = JSON.stringify(metadataObj);
+
+  return {
+    environment_id: event.environmentId,
+    organization_id: event.organizationId,
+    project_id: event.projectId,
+    task_identifier: event.taskSlug,
+    run_id: event.runId,
+    start_time: formatStartTime(BigInt(event.startTime)),
+    duration: formatDuration(event.duration ?? 0),
+    trace_id: event.traceId,
+    span_id: event.spanId,
+    parent_span_id: event.parentId ?? "",
+    message: event.message,
+    kind,
+    status,
+    attributes,
+    metadata,
+    expires_at: formatClickhouseDateTime(
+      new Date(Date.now() + 365 * 24 * 60 * 60 * 1000)
+    ),
+    machine_id: "",
+  };
+}
+
+// Maps the _llmMetrics side-channel onto an llm_metrics_v1 row. The non-null
+// assertion is safe only because callers filter on `_llmMetrics != null` first.
+function eventToLlmMetricsRow(event: CreateEventInput): LlmMetricsV1Input {
+  const llm = event._llmMetrics!;
+  return {
+    organization_id: event.organizationId,
+    project_id: event.projectId,
+    environment_id: event.environmentId,
+    run_id: event.runId,
+    task_identifier: event.taskSlug,
+    trace_id: event.traceId,
+    span_id: event.spanId,
+    gen_ai_system: llm.genAiSystem,
+    request_model: llm.requestModel,
+    response_model: llm.responseModel,
+    matched_model_id: llm.matchedModelId,
+    operation_id: llm.operationId,
+    finish_reason: llm.finishReason,
+    cost_source: llm.costSource,
+    pricing_tier_id: llm.pricingTierId,
+    pricing_tier_name: llm.pricingTierName,
+    input_tokens: llm.inputTokens,
+    output_tokens: llm.outputTokens,
+    total_tokens: llm.totalTokens,
+    usage_details: llm.usageDetails,
+    input_cost: llm.inputCost,
+    output_cost: llm.outputCost,
+    total_cost: llm.totalCost,
+    cost_details: llm.costDetails,
+    provider_cost: llm.providerCost,
+    ms_to_first_chunk: llm.msToFirstChunk,
+    tokens_per_second: llm.tokensPerSecond,
+    metadata: llm.metadata,
+    start_time: formatStartTime(BigInt(event.startTime)),
+    duration: formatDuration(event.duration ?? 0),
+  };
+}
+
+// ---------------------------------------------------------------------------
+// Main
+// ---------------------------------------------------------------------------
+
+async function seedAiSpans() {
+  const seedUserId = randomUserId();
+  console.log(`Starting AI span seed (userId: ${seedUserId})...\n`);
+
+  // 1. Find user
+  const user = await prisma.user.findUnique({
+    where: { email: "local@trigger.dev" },
+  });
+  if (!user) {
+    console.error("User local@trigger.dev not found. Run `pnpm run db:seed` first.");
+    process.exit(1);
+  }
+
+  // 2. Find or create org
+  let org = await prisma.organization.findFirst({
+    where: { title: ORG_TITLE, members: { some: { userId: user.id } } },
+  });
+  if (!org) {
+    org = await createOrganization({ title: ORG_TITLE, userId: user.id, companySize: "1-10" });
+    console.log(`Created org: ${org.title} (${org.slug})`);
+  } else {
+    console.log(`Org exists: ${org.title} (${org.slug})`);
+  }
+
+  // 3. Find or create project
+  let project = await prisma.project.findFirst({
+    where: { name: PROJECT_NAME, organizationId: org.id },
+  });
+  if (!project) {
+    project = await createProject({
+      organizationSlug: org.slug,
+      name: PROJECT_NAME,
+      userId: user.id,
+      version: "v3",
+    });
+    console.log(`Created project: ${project.name} (${project.externalRef})`);
+  } else {
+    console.log(`Project exists: ${project.name} (${project.externalRef})`);
+  }
+
+  // 4. Get DEVELOPMENT environment
+  const runtimeEnv = await prisma.runtimeEnvironment.findFirst({
+    where: { projectId: project.id, type: "DEVELOPMENT" },
+  });
+  if (!runtimeEnv) {
+    console.error("No DEVELOPMENT environment found for project.");
+    process.exit(1);
+  }
+
+  // 5. Upsert background worker
+  const worker = await prisma.backgroundWorker.upsert({
+    where: {
+      projectId_runtimeEnvironmentId_version: {
+        projectId: project.id,
+        runtimeEnvironmentId: runtimeEnv.id,
+        version: WORKER_VERSION,
+      },
+    },
+    update: {},
+    create: {
+      friendlyId: `worker_${nanoid()}`,
+      engine: "V2",
+      contentHash: `seed-ai-spans-${Date.now()}`,
+      sdkVersion: "3.0.0",
+      cliVersion: "3.0.0",
+      projectId: project.id,
+      runtimeEnvironmentId: runtimeEnv.id,
+      version: WORKER_VERSION,
+      metadata: {},
+    },
+  });
+
+  // 6. 
Upsert task + await prisma.backgroundWorkerTask.upsert({ + where: { workerId_slug: { workerId: worker.id, slug: TASK_SLUG } }, + update: {}, + create: { + friendlyId: `task_${nanoid()}`, + slug: TASK_SLUG, + filePath: "src/trigger/ai-chat.ts", + exportName: "aiChat", + workerId: worker.id, + projectId: project.id, + runtimeEnvironmentId: runtimeEnv.id, + }, + }); + + // 7. Upsert queue + await prisma.taskQueue.upsert({ + where: { + runtimeEnvironmentId_name: { + runtimeEnvironmentId: runtimeEnv.id, + name: QUEUE_NAME, + }, + }, + update: {}, + create: { + friendlyId: `queue_${nanoid()}`, + name: QUEUE_NAME, + projectId: project.id, + runtimeEnvironmentId: runtimeEnv.id, + }, + }); + + // 8. Create the TaskRun + const traceId = generateTraceId(); + const rootSpanId = generateSpanId(); + const now = Date.now(); + // Spans start at `now` and extend into the future. completedAt must cover + // the full span tree so getSpan's start_time <= completedAt filter works. + const startedAt = new Date(now); + const completedAt = new Date(now + 150_000); // 2.5 min to cover all spans + + const run = await prisma.taskRun.create({ + data: { + friendlyId: `run_${nanoid()}`, + engine: "V2", + status: "COMPLETED_SUCCESSFULLY", + taskIdentifier: TASK_SLUG, + payload: JSON.stringify({ + message: `I need a comprehensive analysis of the current Federal Reserve interest rate policy and its broader economic implications. Please cover all of the following areas in detail: + +## 1. Current Rate Policy + +- What is the **current federal funds target rate** range? +- When was it last changed, and by how much? +- What was the FOMC vote breakdown — were there any dissents? +- What key language changes appeared in the most recent FOMC statement compared to the prior meeting? + +## 2. 
Rate History & Trajectory + +- Provide a complete timeline of rate decisions over the past **18 months**, including the size of each move +- How does the current rate compare to the **pre-pandemic neutral rate** estimate? +- What does the latest **dot plot** (Summary of Economic Projections) show for 2025, 2026, and the longer-run rate? +- How has the **median longer-run rate estimate** shifted over the past year? + +## 3. Inflation & Economic Data Context + +- What are the latest readings for **Core PCE**, **headline CPI**, and **trimmed mean CPI**? +- How does current inflation compare to the Fed's 2% symmetric target? +- What does the **breakeven inflation rate** (5-year and 10-year TIPS spreads) suggest about market inflation expectations? +- Are there any notable divergences between goods inflation and services inflation? + +## 4. Labor Market Assessment + +- What is the current **unemployment rate**, and how has it trended over the past 6 months? +- What do **nonfarm payrolls**, **JOLTs job openings**, and **initial jobless claims** indicate about labor market health? +- Is wage growth (via the **Employment Cost Index** and **Average Hourly Earnings**) still running above levels consistent with 2% inflation? +- How does the Fed view the balance between its **maximum employment** and **price stability** mandates right now? + +## 5. Forward Guidance & Market Expectations + +- What are the upcoming **FOMC meeting dates** for the next 6 months? +- What does the **CME FedWatch Tool** show for the probability of rate changes at each upcoming meeting? +- How do **fed funds futures** and **OIS swaps** price the terminal rate for this cycle? +- Are there any notable divergences between Fed guidance and market pricing? + +## 6. Global Context & Risk Factors + +- How do US rates compare to the **ECB**, **Bank of England**, and **Bank of Japan** policy rates? +- What role are **tariff and trade policy** uncertainties playing in Fed deliberations? 
+- How might **fiscal policy** changes (tax cuts, spending proposals) impact the rate outlook? +- What are the key **upside and downside risks** to the current rate path? + +## 7. Financial Conditions + +- What is the current reading of the **Goldman Sachs Financial Conditions Index** and the **Chicago Fed National Financial Conditions Index**? +- How have **10-year Treasury yields**, **corporate credit spreads**, and **equity valuations** responded to recent policy signals? +- Is the **yield curve** currently inverted, and what does that historically signal? + +Please structure your response with clear headings, use tables for comparative data, include specific numbers and dates, and cite your sources. Flag any data points that may be stale or subject to revision.`, + }), + payloadType: "application/json", + traceId, + spanId: rootSpanId, + runtimeEnvironmentId: runtimeEnv.id, + projectId: project.id, + organizationId: org.id, + queue: QUEUE_NAME, + lockedToVersionId: worker.id, + startedAt, + completedAt, + runTags: [`user:${seedUserId}`, "chat:seed_session"], + taskEventStore: "clickhouse_v2", + }, + }); + + console.log(`Created TaskRun: ${run.friendlyId}`); + + // 9. Build span tree + const events = buildAiSpanTree({ + traceId, + rootSpanId, + runId: run.friendlyId, + environmentId: runtimeEnv.id, + projectId: project.id, + organizationId: org.id, + taskSlug: TASK_SLUG, + baseTimeMs: now, + seedUserId, + }); + + console.log(`Built ${events.length} spans`); + + // 10. 
Seed LLM pricing and enrich
+  const seedResult = await seedLlmPricing(prisma);
+  console.log(
+    `LLM pricing: ${seedResult.modelsCreated} created, ${seedResult.modelsSkipped} skipped`
+  );
+
+  // Register the registry globally, then load pricing rows before enrichment runs.
+  const registry = new ModelPricingRegistry(prisma);
+  setLlmPricingRegistry(registry);
+  await registry.loadFromDatabase();
+
+  const enriched = enrichCreatableEvents(events);
+
+  const enrichedCount = enriched.filter((e) => e._llmMetrics != null).length;
+  const totalCost = enriched.reduce((sum, e) => sum + (e._llmMetrics?.totalCost ?? 0), 0);
+  console.log(
+    `Enriched ${enrichedCount} spans with LLM cost (total: $${totalCost.toFixed(6)})`
+  );
+
+  // 11. Insert into ClickHouse
+  const clickhouseUrl = process.env.CLICKHOUSE_URL ?? process.env.EVENTS_CLICKHOUSE_URL;
+  if (!clickhouseUrl) {
+    console.error("CLICKHOUSE_URL or EVENTS_CLICKHOUSE_URL not set");
+    process.exit(1);
+  }
+
+  const url = new URL(clickhouseUrl);
+  url.searchParams.delete("secure");
+  const clickhouse = new ClickHouse({ url: url.toString() });
+
+  // Convert to ClickHouse rows and insert
+  const chRows = enriched.map(eventToClickhouseRow);
+  await clickhouse.taskEventsV2.insert(chRows);
+
+  // Insert LLM usage rows
+  const llmRows = enriched.filter((e) => e._llmMetrics != null).map(eventToLlmMetricsRow);
+  if (llmRows.length > 0) {
+    await clickhouse.llmMetrics.insert(llmRows);
+  }
+
+  // 12. Output
+  console.log("\nDone!\n");
+  console.log(
+    `Run URL: http://localhost:3030/orgs/${org.slug}/projects/${project.slug}/env/dev/runs/${run.friendlyId}`
+  );
+  console.log(`Spans: ${events.length}`);
+  console.log(`LLM cost enriched: ${enrichedCount}`);
+  console.log(`Total cost: $${totalCost.toFixed(6)}`);
+  // NOTE(review): process.exit(0) ends the script without an explicit Prisma
+  // disconnect — presumably acceptable for a one-shot seed; confirm.
+  process.exit(0);
+}
+
+// ---------------------------------------------------------------------------
+// Span tree builder
+// ---------------------------------------------------------------------------
+
+type SpanTreeParams = {
+  traceId: string;
+  rootSpanId: string;
+  runId: string;
+  environmentId: string;
+  projectId: string;
+  organizationId: string;
+  taskSlug: string;
+  baseTimeMs: number;
+  seedUserId: string;
+};
+
+function buildAiSpanTree(params: SpanTreeParams): CreateEventInput[] {
+  const {
+    traceId,
+    rootSpanId,
+    runId,
+    environmentId,
+    projectId,
+    organizationId,
+    taskSlug,
+    baseTimeMs,
+    seedUserId,
+  } = params;
+
+  const events: CreateEventInput[] = [];
+  const runTags = [`user:${seedUserId}`, "chat:seed_session"];
+
+  // Timing cursor — each span advances this
+  let cursor = baseTimeMs;
+  function next(durationMs: number) {
+    const start = cursor;
+    cursor += durationMs + 50; // 50ms gap between spans
+    return { startMs: start, durationMs };
+  }
+
+  function makeEvent(opts: {
+    message: string;
+    spanId: string;
+    parentId: string | undefined;
+    startMs: number;
+    durationMs: number;
+    properties: Record;
+    style?: Record;
+    attemptNumber?: number;
+  }): CreateEventInput {
+    const startNs = BigInt(opts.startMs) * BigInt(1_000_000);
+    const durationNs = opts.durationMs * 1_000_000;
+    return {
+      traceId,
+      spanId: opts.spanId,
+      parentId: opts.parentId,
+      message: opts.message,
+      kind: "INTERNAL" as any,
+      status: "OK" as any,
+      level: "TRACE" as any,
+      startTime: startNs,
+      duration: durationNs,
+      isError: false,
+      isPartial: false,
+      isCancelled: false,
+      isDebug: false,
+      runId,
+      environmentId,
+      projectId,
+      
organizationId, + taskSlug, + properties: opts.properties, + metadata: undefined, + style: opts.style as any, + events: undefined, + runTags, + attemptNumber: opts.attemptNumber, + }; + } + + // --- Shared prompt content --- + const userMessage = `I need a detailed analysis of the current Federal Reserve interest rate policy, including: + +1. The **current target rate** range +2. How it compares to rates over the past 12 months +3. Any upcoming FOMC meetings and market expectations + +Please include relevant data points and sources where possible.`; + + const systemPrompt = `You are a senior financial analyst AI assistant with expertise in monetary policy, macroeconomics, and Federal Reserve operations. + +## Your Capabilities +- Access to real-time web search for current financial data +- Deep knowledge of FOMC meeting schedules, dot plots, and forward guidance +- Ability to interpret economic indicators (CPI, PCE, employment data) + +## Response Guidelines +- Always cite specific dates and data sources +- Use tables for comparative data when appropriate +- Flag any uncertainty or conflicting signals in the data +- Present information in a structured, scannable format + +## Important Notes +> Never provide investment advice. Present factual analysis only. +> When data is older than 48 hours, note the timestamp explicitly.`; + + const assistantResponse = `## Current Federal Reserve Interest Rate + +The Federal Open Market Committee (FOMC) has set the **federal funds target rate** at a range of **4.25% to 4.50%**, effective since the December 18, 2024 meeting. 
+ +### Rate Trajectory (Past 12 Months) + +| Meeting Date | Decision | Target Range | +|:---|:---|:---| +| Dec 18, 2024 | -25 bps | 4.25% – 4.50% | +| Nov 7, 2024 | -25 bps | 4.50% – 4.75% | +| Sep 18, 2024 | -50 bps | 4.75% – 5.00% | +| Jul 31, 2024 | Hold | 5.25% – 5.50% | +| Jun 12, 2024 | Hold | 5.25% – 5.50% | +| May 1, 2024 | Hold | 5.25% – 5.50% | +| Mar 20, 2024 | Hold | 5.25% – 5.50% | + +### Key Observations + +1. **Easing Cycle Began**: The Fed started cutting rates in September 2024 with an aggressive 50 bps cut, followed by two 25 bps cuts +2. **Cumulative Reduction**: Rates have been lowered by **100 basis points** total from the cycle peak of 5.25%–5.50% +3. **Pause Signals**: Recent FOMC language suggests a *cautious approach* to further cuts, citing: + - Persistent core inflation above the 2% target + - Strong labor market conditions + - Uncertainty around fiscal policy changes + +### Upcoming FOMC Schedule + +The next scheduled meeting is **January 28–29, 2025**. Market expectations via CME FedWatch: + +\`\`\` +Hold (no change): 89.3% +Cut (-25 bps): 10.7% +\`\`\` + +> **Note**: Market pricing strongly favors a hold at the January meeting, with the first expected cut pushed to mid-2025. 
+ +### Sources +- [Federal Reserve Board – Policy Actions](https://federalreserve.gov) +- CME FedWatch Tool (as of Jan 15, 2025) +- FOMC Statement, December 18, 2024`; + const toolCallResult = JSON.stringify({ + status: 200, + contentType: "text/html", + body: "...Federal Reserve maintains the target range for the federal funds rate at 4-1/4 to 4-1/2 percent...", + truncated: true, + }); + const promptMessages = JSON.stringify([ + { role: "system", content: systemPrompt }, + { role: "user", content: userMessage }, + ]); + const toolDefs = JSON.stringify([ + JSON.stringify({ + type: "function", + name: "webSearch", + description: "Search the web for information", + inputSchema: { + type: "object", + properties: { + query: { type: "string" }, + num: { type: "number" }, + }, + required: ["query"], + }, + }), + ]); + const toolCallsJson = JSON.stringify([ + { + id: "call_seed_001", + type: "function", + function: { + name: "webSearch", + arguments: '{"query":"federal reserve interest rate 2024","num":5}', + }, + }, + ]); + + // --- Span IDs --- + const attemptId = generateSpanId(); + const runFnId = generateSpanId(); + + // streamText sub-tree IDs + const streamWrapId = generateSpanId(); + const stream1Id = generateSpanId(); + const toolCall1Id = generateSpanId(); + const stream2Id = generateSpanId(); + + // generateText sub-tree IDs (Anthropic with cache) + const genTextWrapId = generateSpanId(); + const genTextDoId = generateSpanId(); + const toolCall2Id = generateSpanId(); + + // generateObject sub-tree IDs (gateway → xAI) + const genObjWrapId = generateSpanId(); + const genObjDoId = generateSpanId(); + + // generateObject sub-tree IDs (Google Gemini) + const genObjGeminiWrapId = generateSpanId(); + const genObjGeminiDoId = generateSpanId(); + + // ===================================================================== + // Structural spans: root → attempt → run() + // ===================================================================== + const rootStart = 
baseTimeMs; + const totalDuration = 120_000; // 2 minutes to cover all ~18 scenarios + + events.push( + makeEvent({ + message: taskSlug, + spanId: rootSpanId, + parentId: undefined, + startMs: rootStart, + durationMs: totalDuration, + properties: {}, + }) + ); + + events.push( + makeEvent({ + message: "Attempt 1", + spanId: attemptId, + parentId: rootSpanId, + startMs: rootStart + 30, + durationMs: totalDuration - 60, + properties: { "$entity.type": "attempt" }, + style: { icon: "attempt", variant: "cold" }, + attemptNumber: 1, + }) + ); + + events.push( + makeEvent({ + message: "run()", + spanId: runFnId, + parentId: attemptId, + startMs: rootStart + 60, + durationMs: totalDuration - 120, + properties: {}, + style: { icon: "task-fn-run" }, + attemptNumber: 1, + }) + ); + + // ===================================================================== + // 1) ai.streamText — OpenAI gpt-4o-mini with tool use (2 LLM calls) + // ===================================================================== + cursor = rootStart + 100; + const stWrap = next(9_500); + + events.push( + makeEvent({ + message: "ai.streamText", + spanId: streamWrapId, + parentId: runFnId, + ...stWrap, + properties: { + "ai.operationId": "ai.streamText", + "ai.model.id": "gpt-4o-mini", + "ai.model.provider": "openai.responses", + "ai.response.finishReason": "stop", + "ai.response.text": assistantResponse, + "ai.usage.inputTokens": 807, + "ai.usage.outputTokens": 242, + "ai.usage.totalTokens": 1049, + "ai.telemetry.metadata.userId": seedUserId, + "ai.telemetry.functionId": "ai-chat", + "operation.name": "ai.streamText", + }, + }) + ); + + cursor = stWrap.startMs + 50; + const st1 = next(2_500); + events.push( + makeEvent({ + message: "ai.streamText.doStream", + spanId: stream1Id, + parentId: streamWrapId, + ...st1, + properties: { + "gen_ai.system": "openai.responses", + "gen_ai.request.model": "gpt-4o-mini", + "gen_ai.response.model": "gpt-4o-mini-2024-07-18", + "gen_ai.usage.input_tokens": 284, + 
"gen_ai.usage.output_tokens": 55, + "ai.model.id": "gpt-4o-mini", + "ai.model.provider": "openai.responses", + "ai.operationId": "ai.streamText.doStream", + "ai.prompt.messages": promptMessages, + "ai.prompt.tools": toolDefs, + "ai.prompt.toolChoice": '{"type":"auto"}', + "ai.settings.maxRetries": 2, + "ai.response.finishReason": "tool-calls", + "ai.response.toolCalls": toolCallsJson, + "ai.response.text": "", + "ai.response.id": "resp_seed_001", + "ai.response.model": "gpt-4o-mini-2024-07-18", + "ai.response.msToFirstChunk": 891.37, + "ai.response.msToFinish": 2321.12, + "ai.response.timestamp": new Date(st1.startMs + st1.durationMs).toISOString(), + "ai.usage.inputTokens": 284, + "ai.usage.outputTokens": 55, + "ai.usage.totalTokens": 339, + "ai.telemetry.metadata.userId": seedUserId, + "ai.telemetry.functionId": "ai-chat", + "operation.name": "ai.streamText.doStream", + }, + }) + ); + + const tc1 = next(3_000); + events.push( + makeEvent({ + message: "ai.toolCall", + spanId: toolCall1Id, + parentId: streamWrapId, + ...tc1, + properties: { + "ai.operationId": "ai.toolCall", + "ai.toolCall.name": "webSearch", + "ai.toolCall.id": "call_seed_001", + "ai.toolCall.args": '{"query":"federal reserve interest rate 2024","num":5}', + "ai.toolCall.result": toolCallResult, + "operation.name": "ai.toolCall", + }, + }) + ); + + const st2 = next(3_500); + events.push( + makeEvent({ + message: "ai.streamText.doStream", + spanId: stream2Id, + parentId: streamWrapId, + ...st2, + properties: { + "gen_ai.system": "openai.responses", + "gen_ai.request.model": "gpt-4o-mini", + "gen_ai.response.model": "gpt-4o-mini-2024-07-18", + "gen_ai.usage.input_tokens": 523, + "gen_ai.usage.output_tokens": 187, + "ai.model.id": "gpt-4o-mini", + "ai.model.provider": "openai.responses", + "ai.operationId": "ai.streamText.doStream", + "ai.prompt.messages": promptMessages, + "ai.settings.maxRetries": 2, + "ai.response.finishReason": "stop", + "ai.response.text": assistantResponse, + 
"ai.response.reasoning": + "Let me analyze the Federal Reserve data to provide the current rate.", + "ai.response.id": "resp_seed_002", + "ai.response.model": "gpt-4o-mini-2024-07-18", + "ai.response.msToFirstChunk": 672.45, + "ai.response.msToFinish": 3412.89, + "ai.response.timestamp": new Date(st2.startMs + st2.durationMs).toISOString(), + "ai.usage.inputTokens": 523, + "ai.usage.outputTokens": 187, + "ai.usage.totalTokens": 710, + "ai.usage.reasoningTokens": 42, + "ai.telemetry.metadata.userId": seedUserId, + "ai.telemetry.functionId": "ai-chat", + "operation.name": "ai.streamText.doStream", + }, + }) + ); + + // ===================================================================== + // 2) ai.generateText — Anthropic claude-haiku-4-5 with tool call + cache + // ===================================================================== + const gtWrap = next(4_200); + + events.push( + makeEvent({ + message: "ai.generateText", + spanId: genTextWrapId, + parentId: runFnId, + ...gtWrap, + properties: { + "ai.operationId": "ai.generateText", + "ai.model.id": "claude-haiku-4-5", + "ai.model.provider": "anthropic.messages", + "ai.response.finishReason": "stop", + "ai.response.text": "Based on the search results, the current rate is 4.25%-4.50%.", + "ai.usage.promptTokens": 9951, + "ai.usage.completionTokens": 803, + "ai.telemetry.metadata.agentName": "research-agent", + "ai.telemetry.functionId": "ai-chat", + "operation.name": "ai.generateText", + }, + }) + ); + + cursor = gtWrap.startMs + 50; + const gtDo = next(3_200); + events.push( + makeEvent({ + message: "ai.generateText.doGenerate", + spanId: genTextDoId, + parentId: genTextWrapId, + ...gtDo, + properties: { + "gen_ai.system": "anthropic.messages", + "gen_ai.request.model": "claude-haiku-4-5", + "gen_ai.response.model": "claude-haiku-4-5-20251001", + "gen_ai.usage.input_tokens": 9951, + "gen_ai.usage.output_tokens": 803, + "gen_ai.usage.cache_read_input_tokens": 8200, + "gen_ai.usage.cache_creation_input_tokens": 
1751, + "ai.model.id": "claude-haiku-4-5", + "ai.model.provider": "anthropic.messages", + "ai.operationId": "ai.generateText.doGenerate", + "ai.prompt.messages": promptMessages, + "ai.prompt.toolChoice": '{"type":"auto"}', + "ai.settings.maxRetries": 2, + "ai.response.finishReason": "tool-calls", + "ai.response.id": "msg_seed_003", + "ai.response.model": "claude-haiku-4-5-20251001", + "ai.response.text": + "I'll search for the latest Federal Reserve interest rate information.", + "ai.response.toolCalls": JSON.stringify([ + { + toolCallId: "toolu_seed_001", + toolName: "webSearch", + input: '{"query":"federal reserve interest rate current"}', + }, + ]), + "ai.response.providerMetadata": JSON.stringify({ + anthropic: { + usage: { + input_tokens: 9951, + output_tokens: 803, + cache_creation_input_tokens: 1751, + cache_read_input_tokens: 8200, + service_tier: "standard", + }, + }, + }), + "ai.response.timestamp": new Date(gtDo.startMs + gtDo.durationMs).toISOString(), + "ai.usage.promptTokens": 9951, + "ai.usage.completionTokens": 803, + "ai.telemetry.metadata.agentName": "research-agent", + "ai.telemetry.functionId": "ai-chat", + "operation.name": "ai.generateText.doGenerate", + }, + }) + ); + + const tc2 = next(500); + events.push( + makeEvent({ + message: "ai.toolCall", + spanId: toolCall2Id, + parentId: genTextWrapId, + ...tc2, + properties: { + "ai.operationId": "ai.toolCall", + "ai.toolCall.name": "webSearch", + "ai.toolCall.id": "toolu_seed_001", + "ai.toolCall.args": '{"query":"federal reserve interest rate current"}', + "ai.toolCall.result": + '[{"title":"Federal Reserve Board - Policy Rate","link":"https://federalreserve.gov/rates","snippet":"The target range is 4.25% to 4.50%"}]', + "operation.name": "ai.toolCall", + "resource.name": "ai-chat", + }, + }) + ); + + // ===================================================================== + // 3) ai.generateObject — Gateway → xAI/grok with structured output + // 
===================================================================== + const goWrap = next(1_800); + + events.push( + makeEvent({ + message: "ai.generateObject", + spanId: genObjWrapId, + parentId: runFnId, + ...goWrap, + properties: { + "ai.operationId": "ai.generateObject", + "ai.model.id": "xai/grok-4.1-fast-non-reasoning", + "ai.model.provider": "gateway", + "ai.response.finishReason": "stop", + "ai.response.object": JSON.stringify({ + summary: "Fed rate at 4.25%-4.50%", + confidence: 0.95, + sources: ["federalreserve.gov"], + }), + "ai.telemetry.metadata.model": "xai/grok-4.1-fast-non-reasoning", + "ai.telemetry.metadata.schemaType": "schema", + "ai.telemetry.functionId": "generateObject", + "operation.name": "ai.generateObject", + }, + }) + ); + + cursor = goWrap.startMs + 50; + const goDo = next(1_600); + events.push( + makeEvent({ + message: "ai.generateObject.doGenerate", + spanId: genObjDoId, + parentId: genObjWrapId, + ...goDo, + properties: { + "gen_ai.system": "gateway", + "gen_ai.request.model": "xai/grok-4.1-fast-non-reasoning", + "gen_ai.response.model": "xai/grok-4.1-fast-non-reasoning", + "gen_ai.usage.input_tokens": 1629, + "gen_ai.usage.output_tokens": 158, + "ai.model.id": "xai/grok-4.1-fast-non-reasoning", + "ai.model.provider": "gateway", + "ai.operationId": "ai.generateObject.doGenerate", + "ai.prompt.messages": promptMessages, + "ai.settings.maxRetries": 3, + "ai.response.finishReason": "stop", + "ai.response.id": "aiobj_seed_001", + "ai.response.model": "xai/grok-4.1-fast-non-reasoning", + "ai.response.object": JSON.stringify({ + summary: "Fed rate at 4.25%-4.50%", + confidence: 0.95, + sources: ["federalreserve.gov"], + }), + "ai.response.providerMetadata": JSON.stringify({ + gateway: { + routing: { + originalModelId: "xai/grok-4.1-fast-non-reasoning", + resolvedProvider: "xai", + canonicalSlug: "xai/grok-4.1-fast-non-reasoning", + finalProvider: "xai", + modelAttemptCount: 1, + }, + cost: "0.0002905", + generationId: "gen_seed_001", + 
}, + }), + "ai.response.timestamp": new Date(goDo.startMs + goDo.durationMs).toISOString(), + "ai.usage.completionTokens": 158, + "ai.usage.promptTokens": 1629, + "ai.request.headers.user-agent": "ai/5.0.60", + "operation.name": "ai.generateObject.doGenerate", + }, + }) + ); + + // ===================================================================== + // 4) ai.generateObject — Google Gemini (generative-ai) with thinking tokens + // ===================================================================== + const goGemWrap = next(2_200); + + events.push( + makeEvent({ + message: "ai.generateObject", + spanId: genObjGeminiWrapId, + parentId: runFnId, + ...goGemWrap, + properties: { + "ai.operationId": "ai.generateObject", + "ai.model.id": "gemini-2.5-flash", + "ai.model.provider": "google.generative-ai", + "ai.response.finishReason": "stop", + "ai.response.object": JSON.stringify({ + category: "financial_data", + label: "interest_rate", + }), + "ai.telemetry.functionId": "classify-content", + "operation.name": "ai.generateObject", + }, + }) + ); + + cursor = goGemWrap.startMs + 50; + const goGemDo = next(2_000); + events.push( + makeEvent({ + message: "ai.generateObject.doGenerate", + spanId: genObjGeminiDoId, + parentId: genObjGeminiWrapId, + ...goGemDo, + properties: { + "gen_ai.system": "google.generative-ai", + "gen_ai.request.model": "gemini-2.5-flash", + "gen_ai.response.model": "gemini-2.5-flash", + "gen_ai.usage.input_tokens": 898, + "gen_ai.usage.output_tokens": 521, + "ai.model.id": "gemini-2.5-flash", + "ai.model.provider": "google.generative-ai", + "ai.operationId": "ai.generateObject.doGenerate", + "ai.prompt.messages": JSON.stringify([ + { + role: "user", + content: [ + { + type: "text", + text: "Classify this content: Federal Reserve interest rate analysis", + }, + ], + }, + ]), + "ai.settings.maxRetries": 3, + "ai.response.finishReason": "stop", + "ai.response.id": "aiobj_seed_gemini", + "ai.response.model": "gemini-2.5-flash", + "ai.response.object": 
JSON.stringify({ + category: "financial_data", + label: "interest_rate", + }), + "ai.response.providerMetadata": JSON.stringify({ + google: { + usageMetadata: { + thoughtsTokenCount: 510, + promptTokenCount: 898, + candidatesTokenCount: 11, + totalTokenCount: 1419, + }, + }, + }), + "ai.response.timestamp": new Date(goGemDo.startMs + goGemDo.durationMs).toISOString(), + "ai.usage.completionTokens": 521, + "ai.usage.promptTokens": 898, + "operation.name": "ai.generateObject.doGenerate", + }, + }) + ); + + // ===================================================================== + // Helper: add a wrapper + doGenerate/doStream pair + // ===================================================================== + function addLlmPair(opts: { + wrapperMsg: string; // e.g. "ai.generateText" + doMsg: string; // e.g. "ai.generateText.doGenerate" + system: string; + reqModel: string; + respModel: string; + inputTokens: number; + outputTokens: number; + finishReason: string; + wrapperDurationMs: number; + doDurationMs: number; + responseText?: string; + responseObject?: string; + responseReasoning?: string; + toolCallsJson?: string; + providerMetadata?: Record; + telemetryMetadata?: Record; + settings?: Record; + /** Use completionTokens/promptTokens instead of inputTokens/outputTokens */ + useCompletionStyle?: boolean; + cacheReadTokens?: number; + cacheCreationTokens?: number; + reasoningTokens?: number; + extraDoProps?: Record; + }) { + const wId = generateSpanId(); + const dId = generateSpanId(); + + const wrap = next(opts.wrapperDurationMs); + const wrapperProps: Record = { + "ai.operationId": opts.wrapperMsg, + "ai.model.id": opts.reqModel, + "ai.model.provider": opts.system, + "ai.response.finishReason": opts.finishReason, + "operation.name": opts.wrapperMsg, + }; + if (opts.responseText) wrapperProps["ai.response.text"] = opts.responseText; + if (opts.responseObject) wrapperProps["ai.response.object"] = opts.responseObject; + if (opts.telemetryMetadata) { + for (const [k, 
v] of Object.entries(opts.telemetryMetadata)) { + wrapperProps[`ai.telemetry.metadata.${k}`] = v; + } + } + + events.push(makeEvent({ message: opts.wrapperMsg, spanId: wId, parentId: runFnId, ...wrap, properties: wrapperProps })); + + cursor = wrap.startMs + 50; + const doTiming = next(opts.doDurationMs); + + const doProps: Record = { + "gen_ai.system": opts.system, + "gen_ai.request.model": opts.reqModel, + "gen_ai.response.model": opts.respModel, + "gen_ai.usage.input_tokens": opts.inputTokens, + "gen_ai.usage.output_tokens": opts.outputTokens, + "ai.model.id": opts.reqModel, + "ai.model.provider": opts.system, + "ai.operationId": opts.doMsg, + "ai.prompt.messages": promptMessages, + "ai.response.finishReason": opts.finishReason, + "ai.response.id": `resp_seed_${generateSpanId().slice(0, 8)}`, + "ai.response.model": opts.respModel, + "ai.response.timestamp": new Date(doTiming.startMs + doTiming.durationMs).toISOString(), + "operation.name": opts.doMsg, + }; + + // Token style + if (opts.useCompletionStyle) { + doProps["ai.usage.completionTokens"] = opts.outputTokens; + doProps["ai.usage.promptTokens"] = opts.inputTokens; + } else { + doProps["ai.usage.inputTokens"] = opts.inputTokens; + doProps["ai.usage.outputTokens"] = opts.outputTokens; + doProps["ai.usage.totalTokens"] = opts.inputTokens + opts.outputTokens; + } + + if (opts.responseText) doProps["ai.response.text"] = opts.responseText; + if (opts.responseObject) doProps["ai.response.object"] = opts.responseObject; + if (opts.responseReasoning) doProps["ai.response.reasoning"] = opts.responseReasoning; + if (opts.toolCallsJson) doProps["ai.response.toolCalls"] = opts.toolCallsJson; + if (opts.cacheReadTokens) { + doProps["gen_ai.usage.cache_read_input_tokens"] = opts.cacheReadTokens; + } + if (opts.cacheCreationTokens) { + doProps["gen_ai.usage.cache_creation_input_tokens"] = opts.cacheCreationTokens; + } + if (opts.reasoningTokens) { + doProps["ai.usage.reasoningTokens"] = opts.reasoningTokens; + } + if 
(opts.providerMetadata) { + doProps["ai.response.providerMetadata"] = JSON.stringify(opts.providerMetadata); + } + if (opts.settings) { + for (const [k, v] of Object.entries(opts.settings)) { + doProps[`ai.settings.${k}`] = v; + } + } + if (opts.telemetryMetadata) { + for (const [k, v] of Object.entries(opts.telemetryMetadata)) { + doProps[`ai.telemetry.metadata.${k}`] = v; + } + } + if (opts.extraDoProps) Object.assign(doProps, opts.extraDoProps); + + events.push(makeEvent({ message: opts.doMsg, spanId: dId, parentId: wId, ...doTiming, properties: doProps })); + + return { wrapperId: wId, doId: dId }; + } + + // Helper: add a tool call span + function addToolCall(parentId: string, name: string, args: string, result: string, durationMs = 500) { + const id = generateSpanId(); + const timing = next(durationMs); + events.push(makeEvent({ + message: "ai.toolCall", + spanId: id, + parentId, + ...timing, + properties: { + "ai.operationId": "ai.toolCall", + "ai.toolCall.name": name, + "ai.toolCall.id": `call_${generateSpanId().slice(0, 8)}`, + "ai.toolCall.args": args, + "ai.toolCall.result": result, + "operation.name": "ai.toolCall", + }, + })); + return id; + } + + // ===================================================================== + // 5) Gateway → Mistral mistral-large-3 + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "gateway", + reqModel: "mistral/mistral-large-3", + respModel: "mistral/mistral-large-3", + inputTokens: 1179, + outputTokens: 48, + finishReason: "stop", + wrapperDurationMs: 1_400, + doDurationMs: 1_200, + responseText: `### Document Analysis + +The document primarily discusses **quarterly earnings guidance** for the technology sector, with the following key themes: + +- Revenue growth projections of *12–15%* YoY +- Margin compression due to increased R&D spending +- Forward guidance citing \`macroeconomic headwinds\` + 
+**Confidence**: High (0.92)`, + useCompletionStyle: true, + providerMetadata: { + gateway: { + routing: { + originalModelId: "mistral/mistral-large-3", + resolvedProvider: "mistral", + resolvedProviderApiModelId: "mistral-large-latest", + canonicalSlug: "mistral/mistral-large-3", + finalProvider: "mistral", + modelAttemptCount: 1, + }, + cost: "0.0006615", + marketCost: "0.0006615", + generationId: "gen_seed_mistral_001", + }, + }, + extraDoProps: { "ai.request.headers.user-agent": "ai/5.0.60" }, + }); + + // ===================================================================== + // 6) Gateway → OpenAI gpt-5-mini (with fallback metadata) + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "gateway", + reqModel: "openai/gpt-5-mini", + respModel: "openai/gpt-5-mini", + inputTokens: 2450, + outputTokens: 312, + finishReason: "stop", + wrapperDurationMs: 5_000, + doDurationMs: 4_800, + responseText: "NO", + useCompletionStyle: true, + providerMetadata: { + openai: { responseId: "resp_seed_gw_openai", serviceTier: "default" }, + gateway: { + routing: { + originalModelId: "openai/gpt-5-mini", + resolvedProvider: "openai", + resolvedProviderApiModelId: "gpt-5-mini-2025-08-07", + canonicalSlug: "openai/gpt-5-mini", + finalProvider: "openai", + fallbacksAvailable: ["azure"], + planningReasoning: "System credentials planned for: openai, azure. 
Total execution order: openai(system) → azure(system)", + modelAttemptCount: 1, + }, + cost: "0.000482", + generationId: "gen_seed_gpt5mini_001", + }, + }, + extraDoProps: { "ai.request.headers.user-agent": "ai/6.0.49" }, + }); + + // ===================================================================== + // 7) Gateway → DeepSeek deepseek-v3.2 (tool-calls) + // ===================================================================== + const ds = addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: "ai.generateObject.doGenerate", + system: "gateway", + reqModel: "deepseek/deepseek-v3.2", + respModel: "deepseek/deepseek-v3.2", + inputTokens: 3200, + outputTokens: 420, + finishReason: "tool-calls", + wrapperDurationMs: 2_800, + doDurationMs: 2_500, + responseObject: JSON.stringify({ action: "search", query: "fed rate history" }), + useCompletionStyle: true, + providerMetadata: { + gateway: { + routing: { + originalModelId: "deepseek/deepseek-v3.2", + resolvedProvider: "deepseek", + canonicalSlug: "deepseek/deepseek-v3.2", + finalProvider: "deepseek", + modelAttemptCount: 1, + }, + cost: "0.000156", + generationId: "gen_seed_deepseek_001", + }, + }, + }); + addToolCall(ds.wrapperId, "classifyContent", '{"text":"Federal Reserve rate analysis"}', '{"category":"finance","confidence":0.98}'); + + // ===================================================================== + // 8) Gateway → Anthropic claude-haiku via gateway prefix + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "gateway", + reqModel: "anthropic/claude-haiku-4-5-20251001", + respModel: "anthropic/claude-haiku-4-5-20251001", + inputTokens: 5400, + outputTokens: 220, + finishReason: "stop", + wrapperDurationMs: 1_800, + doDurationMs: 1_500, + responseText: `## Content Classification Report + +**Category**: Financial News Article +**Risk Level**: SAFE ✓ + +### Analysis Breakdown + +| 
Criteria | Result | Score | +|:---|:---|---:| +| Factual accuracy | Verified | 0.94 | +| Bias detection | Minimal | 0.12 | +| Misinformation risk | Low | 0.08 | +| Regulatory sensitivity | None detected | 0.02 | + +> This content follows standard financial journalism conventions and references official Federal Reserve communications directly.`, + useCompletionStyle: true, + providerMetadata: { + gateway: { + routing: { + originalModelId: "anthropic/claude-haiku-4-5-20251001", + resolvedProvider: "anthropic", + canonicalSlug: "anthropic/claude-haiku-4-5-20251001", + finalProvider: "anthropic", + modelAttemptCount: 1, + }, + cost: "0.00312", + generationId: "gen_seed_gw_anthropic_001", + }, + }, + }); + + // ===================================================================== + // 9) Gateway → Google gemini-3-flash-preview (structured output) + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: "ai.generateObject.doGenerate", + system: "gateway", + reqModel: "google/gemini-3-flash-preview", + respModel: "google/gemini-3-flash-preview", + inputTokens: 720, + outputTokens: 85, + finishReason: "stop", + wrapperDurationMs: 1_200, + doDurationMs: 1_000, + responseObject: JSON.stringify({ sentiment: "neutral", topics: ["monetary_policy", "interest_rates"] }), + useCompletionStyle: true, + providerMetadata: { + gateway: { + routing: { + originalModelId: "google/gemini-3-flash-preview", + resolvedProvider: "google", + canonicalSlug: "google/gemini-3-flash-preview", + finalProvider: "google", + modelAttemptCount: 1, + }, + cost: "0.0000803", + generationId: "gen_seed_gw_gemini_001", + }, + }, + }); + + // ===================================================================== + // 10) OpenRouter → x-ai/grok-4-fast (with reasoning_details) + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: 
"ai.generateObject.doGenerate", + system: "openrouter", + reqModel: "x-ai/grok-4-fast", + respModel: "x-ai/grok-4-fast", + inputTokens: 375, + outputTokens: 226, + finishReason: "stop", + wrapperDurationMs: 1_600, + doDurationMs: 1_400, + responseObject: JSON.stringify({ hook: "Breaking: Fed holds rates steady", isValidHook: true }), + useCompletionStyle: true, + telemetryMetadata: { model: "x-ai/grok-4-fast", schemaType: "schema", temperature: "1" }, + settings: { maxRetries: 2, temperature: 1 }, + providerMetadata: { + openrouter: { + provider: "xAI", + reasoning_details: [{ type: "reasoning.encrypted", data: "encrypted_seed_data..." }], + usage: { + promptTokens: 375, + promptTokensDetails: { cachedTokens: 343 }, + completionTokens: 226, + completionTokensDetails: { reasoningTokens: 210 }, + totalTokens: 601, + cost: 0.0001351845, + costDetails: { upstreamInferenceCost: 0.00013655 }, + }, + }, + }, + }); + + // ===================================================================== + // 11) OpenRouter → google/gemini-2.5-flash + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "openrouter", + reqModel: "google/gemini-2.5-flash", + respModel: "google/gemini-2.5-flash", + inputTokens: 1840, + outputTokens: 320, + finishReason: "stop", + wrapperDurationMs: 2_000, + doDurationMs: 1_800, + responseText: `Based on the latest FOMC minutes, the committee voted **unanimously** to maintain rates at the current target range. + +### Key Takeaways from the Minutes + +1. **Labor Market**: Participants noted that employment conditions remain *"solid"* but acknowledged some cooling in job openings +2. **Inflation Outlook**: Core PCE inflation running at 2.8% — still above the 2% target +3. 
**Forward Guidance**: Several participants emphasized the need for \`patience\` before additional rate adjustments + +#### Notable Quotes + +> "The Committee judges that the risks to achieving its employment and inflation goals are roughly in balance." — *FOMC Statement* + +The next decision point will hinge on incoming data, particularly: +- January CPI release (Feb 12) +- January employment report (Feb 7) +- Q4 GDP second estimate (Feb 27)`, + useCompletionStyle: true, + providerMetadata: { + openrouter: { + provider: "Google AI Studio", + usage: { + promptTokens: 1840, + completionTokens: 320, + totalTokens: 2160, + cost: 0.000264, + costDetails: { upstreamInferenceCost: 0.000232 }, + }, + }, + }, + }); + + // ===================================================================== + // 12) OpenRouter → openai/gpt-4.1-mini (req ≠ resp model name) + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: "ai.generateObject.doGenerate", + system: "openrouter", + reqModel: "openai/gpt-4.1-mini", + respModel: "openai/gpt-4.1-mini-2025-04-14", + inputTokens: 890, + outputTokens: 145, + finishReason: "stop", + wrapperDurationMs: 1_400, + doDurationMs: 1_200, + responseObject: JSON.stringify({ summary: "Rate unchanged at 4.25-4.50%", date: "2024-12-18" }), + useCompletionStyle: true, + providerMetadata: { + openrouter: { + provider: "OpenAI", + usage: { + promptTokens: 890, + completionTokens: 145, + totalTokens: 1035, + cost: 0.0000518, + }, + }, + }, + }); + + // ===================================================================== + // 13) Azure → gpt-5 with tool-calls + // ===================================================================== + const az = addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "azure.responses", + reqModel: "gpt-5-2025-08-07", + respModel: "gpt-5-2025-08-07", + inputTokens: 2038, + outputTokens: 239, + finishReason: 
"tool-calls", + wrapperDurationMs: 3_500, + doDurationMs: 3_000, + responseText: "Let me look up the latest rate decision.", + toolCallsJson: JSON.stringify([{ + toolCallId: "call_azure_001", + toolName: "lookupRate", + input: '{"source":"federal_reserve","metric":"funds_rate"}', + }]), + providerMetadata: { + azure: { responseId: "resp_seed_azure_001", serviceTier: "default" }, + }, + }); + addToolCall(az.wrapperId, "lookupRate", '{"source":"federal_reserve","metric":"funds_rate"}', '{"rate":"4.25-4.50%","effectiveDate":"2024-12-18"}'); + + // ===================================================================== + // 14) Perplexity → sonar-pro + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "perplexity", + reqModel: "sonar-pro", + respModel: "sonar-pro", + inputTokens: 151, + outputTokens: 428, + finishReason: "stop", + wrapperDurationMs: 4_500, + doDurationMs: 4_200, + responseText: `According to the Federal Reserve's most recent announcement on **December 18, 2024**, the federal funds rate target range was maintained at **4.25% to 4.50%**. 
+ +### Context + +This decision was made during the December FOMC meeting, where the committee: + +- Acknowledged *"solid"* economic activity and a labor market that has *"generally eased"* +- Noted inflation remains *"somewhat elevated"* relative to the 2% target +- Projected only **two rate cuts** in 2025 (down from four projected in September) + +### Market Impact + +The announcement triggered a sharp market reaction: + +\`\`\` +S&P 500: -2.95% (largest FOMC-day drop since 2001) +10Y Yield: +11 bps to 4.52% +DXY Index: +1.2% to 108.3 +\`\`\` + +> **Sources**: Federal Reserve Board press release, CME FedWatch, Bloomberg Terminal`, + }); + + // ===================================================================== + // 15) openai.chat → gpt-4o-mini (legacy chat completions, mode: "tool") + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: "ai.generateObject.doGenerate", + system: "openai.chat", + reqModel: "gpt-4o-mini", + respModel: "gpt-4o-mini-2024-07-18", + inputTokens: 573, + outputTokens: 11, + finishReason: "stop", + wrapperDurationMs: 800, + doDurationMs: 600, + responseObject: JSON.stringify({ title: "Fed Rate Hold", emoji: "🏦" }), + settings: { maxRetries: 2, mode: "tool", temperature: 0.3 }, + providerMetadata: { + openai: { reasoningTokens: 0, cachedPromptTokens: 0 }, + }, + }); + + // ===================================================================== + // 16) Anthropic claude-sonnet-4-5 → streamText with reasoning + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.streamText", + doMsg: "ai.streamText.doStream", + system: "anthropic.messages", + reqModel: "claude-sonnet-4-5-20250929", + respModel: "claude-sonnet-4-5-20250929", + inputTokens: 15200, + outputTokens: 2840, + finishReason: "stop", + wrapperDurationMs: 12_000, + doDurationMs: 11_500, + responseText: `The Federal Reserve has maintained its target range 
for the federal funds rate at **4.25% to 4.50%** since December 2024. + +## Rate Cycle Overview + +This represents a **pause** in the rate-cutting cycle that began in September 2024: + +| Phase | Period | Action | +|:---|:---|:---| +| Peak hold | Jul 2023 – Sep 2024 | Held at 5.25%–5.50% | +| Easing begins | Sep 2024 | Cut 50 bps | +| Continued easing | Nov 2024 | Cut 25 bps | +| Final cut (so far) | Dec 2024 | Cut 25 bps | +| Current pause | Jan 2025 – present | Hold | + +### What's Driving the Pause? + +The FOMC has cited three primary factors: + +1. **Sticky inflation**: Core PCE at 2.8% remains above the 2% symmetric target +2. **Resilient growth**: GDP growth of 3.1% in Q3 2024 exceeded expectations +3. **Policy uncertainty**: New administration trade and fiscal policies create *"unusually elevated"* uncertainty + +> The Committee has indicated it will continue to assess incoming data, the evolving outlook, and the balance of risks when considering further adjustments to the target range. + +### Technical Note + +The effective federal funds rate (\`EFFR\`) currently sits at **4.33%**, near the midpoint of the target range. The overnight reverse repo facility (ON RRP) rate is set at **4.25%**.`, + responseReasoning: "The user is asking about the current Federal Reserve interest rate. Let me provide a comprehensive answer based on the most recent FOMC decision. I should include context about the rate trajectory and forward guidance. 
I'll structure this with a table showing the recent rate changes and explain the pause rationale.", + cacheReadTokens: 12400, + cacheCreationTokens: 2800, + providerMetadata: { + anthropic: { + usage: { + input_tokens: 15200, + output_tokens: 2840, + cache_creation_input_tokens: 2800, + cache_read_input_tokens: 12400, + service_tier: "standard", + inference_geo: "us-east-1", + }, + }, + }, + }); + + // ===================================================================== + // 17) google.vertex.chat → gemini-3.1-pro-preview with tool-calls + // ===================================================================== + const vt = addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "google.vertex.chat", + reqModel: "gemini-3.1-pro-preview", + respModel: "gemini-3.1-pro-preview", + inputTokens: 4200, + outputTokens: 680, + finishReason: "tool-calls", + wrapperDurationMs: 6_000, + doDurationMs: 5_500, + responseText: "I'll search for the latest FOMC decision and rate information.", + toolCallsJson: JSON.stringify([{ + toolCallId: "call_vertex_001", + toolName: "searchFOMC", + input: '{"query":"latest FOMC decision december 2024"}', + }]), + providerMetadata: { + google: { + usageMetadata: { + thoughtsTokenCount: 320, + promptTokenCount: 4200, + candidatesTokenCount: 680, + totalTokenCount: 5200, + }, + }, + }, + }); + addToolCall(vt.wrapperId, "searchFOMC", '{"query":"latest FOMC decision december 2024"}', '{"decision":"hold","rate":"4.25-4.50%","date":"2024-12-18","vote":"unanimous"}', 800); + + // ===================================================================== + // 18) openai.responses → gpt-5.4 with reasoning tokens + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.streamText", + doMsg: "ai.streamText.doStream", + system: "openai.responses", + reqModel: "gpt-5.4", + respModel: "gpt-5.4-2026-03-05", + inputTokens: 8900, + outputTokens: 1250, + finishReason: "stop", 
+ wrapperDurationMs: 8_000, + doDurationMs: 7_500, + responseText: `## Federal Funds Rate — Current Status + +The Federal Reserve's current target range is **4.25% to 4.50%**, established at the **December 18, 2024** FOMC meeting. + +### Policy Stance + +The committee has signaled a *cautious approach* to further rate cuts. Key considerations include: + +- **Inflation**: Core PCE remains at 2.8%, above the 2% target +- **Employment**: Unemployment rate stable at 4.2%, with 256K jobs added in December +- **Growth**: Real GDP tracking at ~2.5% annualized + +### Dot Plot Summary (Dec 2024 SEP) + +The median dot plot projections: + +\`\`\`python +# Median FOMC projections +rates = { + "2025": 3.75, # implies 2 cuts of 25bps + "2026": 3.25, # implies 2 additional cuts + "longer_run": 3.00 # neutral rate estimate (up from 2.5%) +} +\`\`\` + +### Risk Assessment + +| Risk Factor | Direction | Magnitude | +|:---|:---:|:---:| +| Tariff-driven inflation | ↑ Upside | Medium | +| Labor market softening | ↓ Downside | Low | +| Fiscal expansion | ↑ Upside | High | +| Global growth slowdown | ↓ Downside | Medium | + +> *"The committee remains attentive to the risks to both sides of its dual mandate."* — Chair Powell, Dec 18 press conference`, + responseReasoning: "I need to provide accurate, up-to-date information about the Federal Reserve interest rate. The last FOMC meeting was in December 2024 where they cut rates by 25 bps after two previous cuts. 
Let me include the dot plot projections and a risk assessment table for a comprehensive view.", + reasoningTokens: 516, + providerMetadata: { + openai: { + responseId: "resp_seed_gpt54_001", + serviceTier: "default", + }, + }, + extraDoProps: { + "ai.response.msToFirstChunk": 1842.5, + "ai.response.msToFinish": 7234.8, + "ai.response.avgOutputTokensPerSecond": 172.8, + }, + }); + + // ===================================================================== + // 19) Cerebras cerebras-gpt-13b — no pricing, no provider cost + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "cerebras.chat", + reqModel: "cerebras-gpt-13b", + respModel: "cerebras-gpt-13b", + inputTokens: 450, + outputTokens: 120, + finishReason: "stop", + wrapperDurationMs: 600, + doDurationMs: 400, + responseText: `The Federal Reserve rate is currently at **4.25–4.50%**. + +Key details: +- *Effective date*: December 18, 2024 +- *Next meeting*: January 28–29, 2025 +- *Market expectation*: Hold (\`89.3%\` probability per CME FedWatch)`, + }); + + // ===================================================================== + // 20) Amazon Bedrock — no pricing in registry + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateText", + doMsg: "ai.generateText.doGenerate", + system: "amazon-bedrock", + reqModel: "us.anthropic.claude-sonnet-4-20250514-v1:0", + respModel: "us.anthropic.claude-sonnet-4-20250514-v1:0", + inputTokens: 3200, + outputTokens: 890, + finishReason: "stop", + wrapperDurationMs: 4_000, + doDurationMs: 3_500, + responseText: `Based on the latest FOMC statement, the target rate range remains at **4.25% to 4.50%**. 
+ +### Additional Context + +The committee's statement included notable language changes: +- Removed reference to *"gaining greater confidence"* on inflation +- Added emphasis on monitoring \`both sides\` of the dual mandate +- Acknowledged *"uncertainty around the economic outlook has increased"* + +Governor Bowman dissented, preferring a **hold** rather than the 25 bps cut — the first governor dissent since 2005.`, + }); + + // ===================================================================== + // 21) Groq — fast inference, no pricing + // ===================================================================== + addLlmPair({ + wrapperMsg: "ai.generateObject", + doMsg: "ai.generateObject.doGenerate", + system: "groq.chat", + reqModel: "llama-4-scout-17b-16e-instruct", + respModel: "llama-4-scout-17b-16e-instruct", + inputTokens: 820, + outputTokens: 95, + finishReason: "stop", + wrapperDurationMs: 300, + doDurationMs: 200, + responseObject: JSON.stringify({ rate: "4.25-4.50%", source: "FOMC", date: "2024-12-18" }), + }); + + return events; +} + +// --------------------------------------------------------------------------- + +seedAiSpans() + .catch((e) => { + console.error("Seed failed:"); + console.error(e); + process.exit(1); + }) + .finally(async () => { + await prisma.$disconnect(); + }); diff --git a/apps/webapp/seed.mts b/apps/webapp/seed.mts index aa08eaaeec0..9eb30cd2503 100644 --- a/apps/webapp/seed.mts +++ b/apps/webapp/seed.mts @@ -75,6 +75,7 @@ async function seed() { } await createBatchLimitOrgs(user); + await ensureDefaultWorkerGroup(); console.log("\n🎉 Seed complete!\n"); console.log("Summary:"); @@ -249,3 +250,62 @@ async function findOrCreateProject( return { project, environments }; } + +async function ensureDefaultWorkerGroup() { + // Check if the feature flag already exists + const existingFlag = await prisma.featureFlag.findUnique({ + where: { key: "defaultWorkerInstanceGroupId" }, + }); + + if (existingFlag) { + console.log(`✅ Default 
worker instance group already configured`); + return; + } + + // Check if a managed worker group already exists + let workerGroup = await prisma.workerInstanceGroup.findFirst({ + where: { type: "MANAGED" }, + }); + + if (!workerGroup) { + console.log("Creating default worker instance group..."); + + const { createHash, randomBytes } = await import("crypto"); + const tokenValue = `tr_wgt_${randomBytes(20).toString("hex")}`; + const tokenHash = createHash("sha256").update(tokenValue).digest("hex"); + + const token = await prisma.workerGroupToken.create({ + data: { tokenHash }, + }); + + workerGroup = await prisma.workerInstanceGroup.create({ + data: { + type: "MANAGED", + name: "local-dev", + masterQueue: "local-dev", + description: "Local development worker group", + tokenId: token.id, + }, + }); + + console.log(`✅ Created worker instance group: ${workerGroup.name} (${workerGroup.id})`); + } else { + console.log( + `✅ Worker instance group already exists: ${workerGroup.name} (${workerGroup.id})` + ); + } + + // Set the feature flag + await prisma.featureFlag.upsert({ + where: { key: "defaultWorkerInstanceGroupId" }, + create: { + key: "defaultWorkerInstanceGroupId", + value: workerGroup.id, + }, + update: { + value: workerGroup.id, + }, + }); + + console.log(`✅ Set defaultWorkerInstanceGroupId feature flag`); +} diff --git a/apps/webapp/test/otlpExporter.test.ts b/apps/webapp/test/otlpExporter.test.ts index 98380f2a596..f07019b4a25 100644 --- a/apps/webapp/test/otlpExporter.test.ts +++ b/apps/webapp/test/otlpExporter.test.ts @@ -1,5 +1,8 @@ -import { describe, it, expect } from "vitest"; -import { enrichCreatableEvents } from "../app/v3/utils/enrichCreatableEvents.server.js"; +import { describe, it, expect, beforeEach, afterEach } from "vitest"; +import { + enrichCreatableEvents, + setLlmPricingRegistry, +} from "../app/v3/utils/enrichCreatableEvents.server.js"; import { RuntimeEnvironmentType, TaskEventKind, @@ -83,8 +86,8 @@ describe("OTLPExporter", () => { const 
event = $events[0]; expect(event.message).toBe("Responses API with 'gpt-4o'"); - expect(event.style).toEqual({ - icon: "tabler-brand-openai", + expect(event.style).toMatchObject({ + icon: "ai-provider-openai", }); }); @@ -161,8 +164,17 @@ describe("OTLPExporter", () => { const event = $events[0]; expect(event.message).toBe("Responses API with gpt-4o"); - expect(event.style).toEqual({ - icon: "tabler-brand-openai", + expect(event.style).toMatchObject({ + icon: "ai-provider-openai", + }); + // Enrichment also adds model/token pills as accessories + const style = event.style as Record; + expect(style.accessory).toMatchObject({ + style: "pills", + items: expect.arrayContaining([ + expect.objectContaining({ text: "gpt-4o-2024-08-06" }), + expect.objectContaining({ text: "724" }), + ]), }); }); @@ -218,7 +230,7 @@ describe("OTLPExporter", () => { const $events = enrichCreatableEvents(events); expect($events[0].message).toBe("Using 'gpt-4' with temperature 0.7"); expect($events[0].style).toEqual({ - icon: "tabler-brand-openai", + icon: "ai-provider-openai", }); }); @@ -249,7 +261,7 @@ describe("OTLPExporter", () => { const $events = enrichCreatableEvents(events); expect($events[0].message).toBe("Count is 42 and enabled is true"); expect($events[0].style).toEqual({ - icon: "tabler-brand-anthropic", + icon: "ai-provider-anthropic", }); }); @@ -278,7 +290,7 @@ describe("OTLPExporter", () => { const $events = enrichCreatableEvents(events); expect($events[0].message).toBe("Plain message without variables"); expect($events[0].style).toEqual({ - icon: "tabler-brand-openai", + icon: "ai-provider-openai", }); }); @@ -334,7 +346,7 @@ describe("OTLPExporter", () => { const $events = enrichCreatableEvents(events); expect($events[0].style).toEqual({ existingStyle: "value", - icon: "tabler-brand-openai", // GenAI enricher wins because it's first + icon: "ai-provider-openai", // GenAI enricher wins because it's first }); }); @@ -394,4 +406,301 @@ describe("OTLPExporter", () => { }); }); 
}); + + describe("LLM cost enrichment", () => { + const mockRegistry = { + isLoaded: true, + calculateCost: (responseModel: string, usageDetails: Record) => { + if (responseModel.startsWith("gpt-4o")) { + const inputCost = (usageDetails["input"] ?? 0) * 0.0000025; + const outputCost = (usageDetails["output"] ?? 0) * 0.00001; + return { + matchedModelId: "llm_model_gpt4o", + matchedModelName: "gpt-4o", + pricingTierId: "tier-standard", + pricingTierName: "Standard", + inputCost, + outputCost, + totalCost: inputCost + outputCost, + costDetails: { input: inputCost, output: outputCost }, + }; + } + return null; + }, + }; + + beforeEach(() => { + setLlmPricingRegistry(mockRegistry); + }); + + afterEach(() => { + setLlmPricingRegistry(undefined as any); + }); + + function makeGenAiEvent(overrides: Record = {}) { + return { + message: "ai.streamText.doStream", + traceId: "test-trace", + spanId: "test-span", + parentId: "test-parent", + isPartial: false, + isError: false, + kind: TaskEventKind.INTERNAL, + level: TaskEventLevel.TRACE, + status: TaskEventStatus.UNSET, + startTime: BigInt(1), + duration: 5000000000, + style: {}, + serviceName: "test", + environmentId: "env-1", + environmentType: RuntimeEnvironmentType.DEVELOPMENT, + organizationId: "org-1", + projectId: "proj-1", + projectRef: "proj_test", + runId: "run_test", + runIsTest: false, + taskSlug: "my-task", + metadata: undefined, + properties: { + "gen_ai.system": "openai", + "gen_ai.request.model": "gpt-4o", + "gen_ai.response.model": "gpt-4o-2024-08-06", + "gen_ai.usage.input_tokens": 702, + "gen_ai.usage.output_tokens": 22, + "operation.name": "ai.streamText.doStream", + ...overrides, + }, + }; + } + + it("should enrich spans with cost attributes and accessories", () => { + const events = [makeGenAiEvent()]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + const event = $events[0]; + + // Cost attributes + expect(event.properties["trigger.llm.total_cost"]).toBeCloseTo(0.001975); + 
expect(event.properties["trigger.llm.input_cost"]).toBeCloseTo(0.001755); + expect(event.properties["trigger.llm.output_cost"]).toBeCloseTo(0.00022); + expect(event.properties["trigger.llm.matched_model"]).toBe("gpt-4o"); + expect(event.properties["trigger.llm.pricing_tier"]).toBe("Standard"); + + // Accessories (pills style) + expect(event.style.accessory).toBeDefined(); + expect(event.style.accessory.style).toBe("pills"); + expect(event.style.accessory.items).toHaveLength(3); + expect(event.style.accessory.items[0]).toEqual({ + text: "gpt-4o-2024-08-06", + icon: "tabler-cube", + }); + expect(event.style.accessory.items[1]).toEqual({ + text: "724", + icon: "tabler-hash", + }); + expect(event.style.accessory.items[2]).toEqual({ + text: "$0.001975", + icon: "tabler-currency-dollar", + }); + }); + + it("should set _llmMetrics side-channel for dual-write", () => { + const events = [makeGenAiEvent()]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + const event = $events[0]; + + expect(event._llmMetrics).toBeDefined(); + expect(event._llmMetrics.genAiSystem).toBe("openai"); + expect(event._llmMetrics.responseModel).toBe("gpt-4o-2024-08-06"); + expect(event._llmMetrics.inputTokens).toBe(702); + expect(event._llmMetrics.outputTokens).toBe(22); + expect(event._llmMetrics.totalCost).toBeCloseTo(0.001975); + expect(event._llmMetrics.operationId).toBe("ai.streamText.doStream"); + }); + + it("should skip partial spans", () => { + const events = [makeGenAiEvent()]; + events[0].isPartial = true; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + expect($events[0]._llmMetrics).toBeUndefined(); + }); + + it("should skip spans without gen_ai.response.model or gen_ai.request.model", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.response.model": undefined, + "gen_ai.request.model": undefined, + }), + ]; + + // @ts-expect-error + const $events = 
enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + }); + + it("should fall back to gen_ai.request.model when response.model is missing", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.response.model": undefined, + "gen_ai.request.model": "gpt-4o", + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.matched_model"]).toBe("gpt-4o"); + }); + + it("should skip spans with no token usage", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": 0, + "gen_ai.usage.output_tokens": 0, + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + }); + + it("should skip spans with unknown models", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.response.model": "unknown-model-xyz", + "gen_ai.request.model": "unknown-model-xyz", + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + }); + + it("should not enrich non-span kinds like SPAN_EVENT or LOG", () => { + const events = [makeGenAiEvent()]; + events[0].kind = "SPAN_EVENT" as any; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + }); + + it("should enrich SERVER kind events", () => { + const events = [makeGenAiEvent()]; + events[0].kind = TaskEventKind.SERVER; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeCloseTo(0.001975); + }); + + it("should not enrich when registry is not loaded", () => { + setLlmPricingRegistry({ isLoaded: false, calculateCost: () => null }); + const events = [makeGenAiEvent()]; + + // @ts-expect-error + const $events = 
enrichCreatableEvents(events); + expect($events[0].properties["trigger.llm.total_cost"]).toBeUndefined(); + }); + + it("should format token counts with k/M suffixes in accessories", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": 150000, + "gen_ai.usage.output_tokens": 2000, + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0].style.accessory.items[1].text).toBe("152.0k"); + }); + + it("should normalize alternate token attribute names", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": undefined, + "gen_ai.usage.output_tokens": undefined, + "gen_ai.usage.prompt_tokens": 500, + "gen_ai.usage.completion_tokens": 100, + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + expect($events[0]._llmMetrics.inputTokens).toBe(500); + expect($events[0]._llmMetrics.outputTokens).toBe(100); + }); + + it("should prefer gen_ai.usage.total_tokens over input+output sum", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": 100, + "gen_ai.usage.output_tokens": 50, + "gen_ai.usage.total_tokens": 200, // higher than 100+50 (e.g. 
includes cached/reasoning) + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + const event = $events[0]; + + // Pills should show the explicit total, not input+output + expect(event.style.accessory.items[1]).toEqual({ + text: "200", + icon: "tabler-hash", + }); + + // LLM usage should also use the explicit total + expect(event._llmMetrics.totalTokens).toBe(200); + expect(event._llmMetrics.inputTokens).toBe(100); + expect(event._llmMetrics.outputTokens).toBe(50); + }); + + it("should fall back to input+output when total_tokens is absent", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": 300, + "gen_ai.usage.output_tokens": 75, + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + const event = $events[0]; + + expect(event.style.accessory.items[1]).toEqual({ + text: "375", + icon: "tabler-hash", + }); + expect(event._llmMetrics.totalTokens).toBe(375); + }); + + it("should use total_tokens when only total is present without input/output breakdown", () => { + const events = [ + makeGenAiEvent({ + "gen_ai.usage.input_tokens": undefined, + "gen_ai.usage.output_tokens": undefined, + "gen_ai.usage.total_tokens": 500, + }), + ]; + + // @ts-expect-error + const $events = enrichCreatableEvents(events); + const event = $events[0]; + + // Pills should show 500, not 0 + expect(event.style.accessory.items[1]).toEqual({ + text: "500", + icon: "tabler-hash", + }); + }); + }); }); diff --git a/internal-packages/clickhouse/schema/024_create_llm_usage_v1.sql b/internal-packages/clickhouse/schema/024_create_llm_usage_v1.sql new file mode 100644 index 00000000000..7cfbc0cea98 --- /dev/null +++ b/internal-packages/clickhouse/schema/024_create_llm_usage_v1.sql @@ -0,0 +1,64 @@ +-- +goose Up +CREATE TABLE IF NOT EXISTS trigger_dev.llm_metrics_v1 +( + -- Tenant context + organization_id LowCardinality(String), + project_id LowCardinality(String), + environment_id String CODEC(ZSTD(1)), + run_id 
String CODEC(ZSTD(1)), + task_identifier LowCardinality(String), + trace_id String CODEC(ZSTD(1)), + span_id String CODEC(ZSTD(1)), + + -- Model & provider + gen_ai_system LowCardinality(String), + request_model String CODEC(ZSTD(1)), + response_model String CODEC(ZSTD(1)), + matched_model_id String CODEC(ZSTD(1)), + operation_id LowCardinality(String), + finish_reason LowCardinality(String), + cost_source LowCardinality(String), + + -- Pricing + pricing_tier_id String CODEC(ZSTD(1)), + pricing_tier_name LowCardinality(String), + + -- Token usage + input_tokens UInt64 DEFAULT 0, + output_tokens UInt64 DEFAULT 0, + total_tokens UInt64 DEFAULT 0, + usage_details Map(LowCardinality(String), UInt64), + + -- Cost + input_cost Decimal64(12) DEFAULT 0, + output_cost Decimal64(12) DEFAULT 0, + total_cost Decimal64(12) DEFAULT 0, + cost_details Map(LowCardinality(String), Decimal64(12)), + provider_cost Decimal64(12) DEFAULT 0, + + -- Performance + ms_to_first_chunk Float64 DEFAULT 0, + tokens_per_second Float64 DEFAULT 0, + + -- Attribution + metadata Map(LowCardinality(String), String), + + -- Timing + start_time DateTime64(9) CODEC(Delta(8), ZSTD(1)), + duration UInt64 DEFAULT 0 CODEC(ZSTD(1)), + inserted_at DateTime64(3) DEFAULT now64(3), + + -- Indexes + INDEX idx_run_id run_id TYPE bloom_filter(0.001) GRANULARITY 1, + INDEX idx_span_id span_id TYPE bloom_filter(0.001) GRANULARITY 1, + INDEX idx_response_model response_model TYPE bloom_filter(0.01) GRANULARITY 1, + INDEX idx_metadata_keys mapKeys(metadata) TYPE bloom_filter(0.01) GRANULARITY 1 +) +ENGINE = MergeTree +PARTITION BY toDate(inserted_at) +ORDER BY (organization_id, project_id, environment_id, toDate(inserted_at), run_id) +TTL toDateTime(inserted_at) + INTERVAL 365 DAY +SETTINGS ttl_only_drop_parts = 1; + +-- +goose Down +DROP TABLE IF EXISTS trigger_dev.llm_metrics_v1; diff --git a/internal-packages/clickhouse/src/index.ts b/internal-packages/clickhouse/src/index.ts index b6fbd92177b..18e52483627 100644 --- 
a/internal-packages/clickhouse/src/index.ts +++ b/internal-packages/clickhouse/src/index.ts @@ -27,6 +27,7 @@ import { getLogsSearchListQueryBuilder, } from "./taskEvents.js"; import { insertMetrics } from "./metrics.js"; +import { insertLlmMetrics } from "./llmMetrics.js"; import { getErrorGroups, getErrorInstances, @@ -44,6 +45,7 @@ import type { Agent as HttpsAgent } from "https"; export type * from "./taskRuns.js"; export type * from "./taskEvents.js"; export type * from "./metrics.js"; +export type * from "./llmMetrics.js"; export type * from "./errors.js"; export type * from "./client/queryBuilder.js"; @@ -225,6 +227,12 @@ export class ClickHouse { }; } + get llmMetrics() { + return { + insert: insertLlmMetrics(this.writer), + }; + } + get taskEventsV2() { return { insert: insertTaskEventsV2(this.writer), diff --git a/internal-packages/clickhouse/src/llmMetrics.ts b/internal-packages/clickhouse/src/llmMetrics.ts new file mode 100644 index 00000000000..1f830b707d8 --- /dev/null +++ b/internal-packages/clickhouse/src/llmMetrics.ts @@ -0,0 +1,51 @@ +import { z } from "zod"; +import { ClickhouseWriter } from "./client/types.js"; + +export const LlmMetricsV1Input = z.object({ + organization_id: z.string(), + project_id: z.string(), + environment_id: z.string(), + run_id: z.string(), + task_identifier: z.string(), + trace_id: z.string(), + span_id: z.string(), + + gen_ai_system: z.string(), + request_model: z.string(), + response_model: z.string(), + matched_model_id: z.string(), + operation_id: z.string(), + finish_reason: z.string(), + cost_source: z.string(), + + pricing_tier_id: z.string(), + pricing_tier_name: z.string(), + + input_tokens: z.number(), + output_tokens: z.number(), + total_tokens: z.number(), + usage_details: z.record(z.string(), z.number()), + + input_cost: z.number(), + output_cost: z.number(), + total_cost: z.number(), + cost_details: z.record(z.string(), z.number()), + provider_cost: z.number(), + + ms_to_first_chunk: z.number(), + 
tokens_per_second: z.number(), + + metadata: z.record(z.string(), z.string()), + + start_time: z.string(), + duration: z.string(), +}); + +export type LlmMetricsV1Input = z.input<typeof LlmMetricsV1Input>; + +export function insertLlmMetrics(ch: ClickhouseWriter) { + return ch.insertUnsafe<LlmMetricsV1Input>({ + name: "insertLlmMetrics", + table: "trigger_dev.llm_metrics_v1", + }); +} diff --git a/internal-packages/database/prisma/migrations/20260310155049_add_llm_pricing_tables/migration.sql b/internal-packages/database/prisma/migrations/20260310155049_add_llm_pricing_tables/migration.sql new file mode 100644 index 00000000000..286de6eacfb --- /dev/null +++ b/internal-packages/database/prisma/migrations/20260310155049_add_llm_pricing_tables/migration.sql @@ -0,0 +1,67 @@ +-- CreateTable +CREATE TABLE "public"."llm_models" ( + "id" TEXT NOT NULL, + "friendly_id" TEXT NOT NULL, + "project_id" TEXT, + "model_name" TEXT NOT NULL, + "match_pattern" TEXT NOT NULL, + "start_date" TIMESTAMP(3), + "source" TEXT NOT NULL DEFAULT 'default', + "created_at" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP, + "updated_at" TIMESTAMP(3) NOT NULL, + + CONSTRAINT "llm_models_pkey" PRIMARY KEY ("id") +); + +-- CreateTable +CREATE TABLE "public"."llm_pricing_tiers" ( + "id" TEXT NOT NULL, + "model_id" TEXT NOT NULL, + "name" TEXT NOT NULL, + "is_default" BOOLEAN NOT NULL DEFAULT true, + "priority" INTEGER NOT NULL DEFAULT 0, + "conditions" JSONB NOT NULL DEFAULT '[]', + + CONSTRAINT "llm_pricing_tiers_pkey" PRIMARY KEY ("id") +); + +-- CreateTable +CREATE TABLE "public"."llm_prices" ( + "id" TEXT NOT NULL, + "model_id" TEXT NOT NULL, + "pricing_tier_id" TEXT NOT NULL, + "usage_type" TEXT NOT NULL, + "price" DECIMAL(20,12) NOT NULL, + + CONSTRAINT "llm_prices_pkey" PRIMARY KEY ("id") +); + +-- CreateIndex +CREATE UNIQUE INDEX "llm_models_friendly_id_key" ON "public"."llm_models"("friendly_id"); + +-- CreateIndex +CREATE INDEX "llm_models_project_id_idx" ON "public"."llm_models"("project_id"); + +-- CreateIndex +CREATE UNIQUE 
INDEX "llm_models_project_id_model_name_start_date_key" ON "public"."llm_models"("project_id", "model_name", "start_date"); + +-- CreateIndex +CREATE UNIQUE INDEX "llm_pricing_tiers_model_id_priority_key" ON "public"."llm_pricing_tiers"("model_id", "priority"); + +-- CreateIndex +CREATE UNIQUE INDEX "llm_pricing_tiers_model_id_name_key" ON "public"."llm_pricing_tiers"("model_id", "name"); + +-- CreateIndex +CREATE UNIQUE INDEX "llm_prices_model_id_usage_type_pricing_tier_id_key" ON "public"."llm_prices"("model_id", "usage_type", "pricing_tier_id"); + +-- AddForeignKey +ALTER TABLE "public"."llm_models" ADD CONSTRAINT "llm_models_project_id_fkey" FOREIGN KEY ("project_id") REFERENCES "public"."Project"("id") ON DELETE CASCADE ON UPDATE CASCADE; + +-- AddForeignKey +ALTER TABLE "public"."llm_pricing_tiers" ADD CONSTRAINT "llm_pricing_tiers_model_id_fkey" FOREIGN KEY ("model_id") REFERENCES "public"."llm_models"("id") ON DELETE CASCADE ON UPDATE CASCADE; + +-- AddForeignKey +ALTER TABLE "public"."llm_prices" ADD CONSTRAINT "llm_prices_model_id_fkey" FOREIGN KEY ("model_id") REFERENCES "public"."llm_models"("id") ON DELETE CASCADE ON UPDATE CASCADE; + +-- AddForeignKey +ALTER TABLE "public"."llm_prices" ADD CONSTRAINT "llm_prices_pricing_tier_id_fkey" FOREIGN KEY ("pricing_tier_id") REFERENCES "public"."llm_pricing_tiers"("id") ON DELETE CASCADE ON UPDATE CASCADE; diff --git a/internal-packages/database/prisma/schema.prisma b/internal-packages/database/prisma/schema.prisma index f6986be42c0..9e91fc70f14 100644 --- a/internal-packages/database/prisma/schema.prisma +++ b/internal-packages/database/prisma/schema.prisma @@ -417,6 +417,7 @@ model Project { onboardingData Json? 
taskScheduleInstances TaskScheduleInstance[] metricsDashboards MetricsDashboard[] + llmModels LlmModel[] } enum ProjectVersion { @@ -2577,3 +2578,59 @@ model MetricsDashboard { /// Fast lookup for the list @@index([projectId, createdAt(sort: Desc)]) } + +// ==================================================== +// LLM Pricing Models +// ==================================================== + +/// A known LLM model or model pattern for cost tracking +model LlmModel { + id String @id @default(cuid()) + friendlyId String @unique @map("friendly_id") + projectId String? @map("project_id") + project Project? @relation(fields: [projectId], references: [id], onDelete: Cascade) + modelName String @map("model_name") + matchPattern String @map("match_pattern") + startDate DateTime? @map("start_date") + source String @default("default") // "default", "admin", "project" + createdAt DateTime @default(now()) @map("created_at") + updatedAt DateTime @updatedAt @map("updated_at") + + pricingTiers LlmPricingTier[] + prices LlmPrice[] + + @@unique([projectId, modelName, startDate]) + @@index([projectId]) + @@map("llm_models") +} + +/// A pricing tier for a model (supports volume-based or conditional pricing) +model LlmPricingTier { + id String @id @default(cuid()) + modelId String @map("model_id") + model LlmModel @relation(fields: [modelId], references: [id], onDelete: Cascade) + name String + isDefault Boolean @default(true) @map("is_default") + priority Int @default(0) + conditions Json @default("[]") @db.JsonB + + prices LlmPrice[] + + @@unique([modelId, priority]) + @@unique([modelId, name]) + @@map("llm_pricing_tiers") +} + +/// A price point for a usage type within a pricing tier +model LlmPrice { + id String @id @default(cuid()) + modelId String @map("model_id") + model LlmModel @relation(fields: [modelId], references: [id], onDelete: Cascade) + pricingTierId String @map("pricing_tier_id") + pricingTier LlmPricingTier @relation(fields: [pricingTierId], references: [id], 
onDelete: Cascade) + usageType String @map("usage_type") + price Decimal @db.Decimal(20, 12) + + @@unique([modelId, usageType, pricingTierId]) + @@map("llm_prices") +} diff --git a/internal-packages/llm-pricing/package.json b/internal-packages/llm-pricing/package.json new file mode 100644 index 00000000000..8cf9e366f2c --- /dev/null +++ b/internal-packages/llm-pricing/package.json @@ -0,0 +1,18 @@ +{ + "name": "@internal/llm-pricing", + "private": true, + "version": "0.0.1", + "main": "./src/index.ts", + "types": "./src/index.ts", + "type": "module", + "dependencies": { + "@trigger.dev/core": "workspace:*", + "@trigger.dev/database": "workspace:*" + }, + "scripts": { + "typecheck": "tsc --noEmit", + "generate": "echo 'defaultPrices.ts is pre-committed — run sync-prices to update'", + "sync-prices": "bash scripts/sync-model-prices.sh", + "sync-prices:check": "bash scripts/sync-model-prices.sh --check" + } +} diff --git a/internal-packages/llm-pricing/scripts/sync-model-prices.sh b/internal-packages/llm-pricing/scripts/sync-model-prices.sh new file mode 100755 index 00000000000..d72aa6714c6 --- /dev/null +++ b/internal-packages/llm-pricing/scripts/sync-model-prices.sh @@ -0,0 +1,77 @@ +#!/usr/bin/env bash +set -euo pipefail + +# Sync default model prices from Langfuse's repository and generate the TS module. +# Usage: ./scripts/sync-model-prices.sh [--check] +# --check: Exit 1 if prices are outdated (for CI) + +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +PACKAGE_DIR="$(dirname "$SCRIPT_DIR")" +JSON_TARGET="$PACKAGE_DIR/src/default-model-prices.json" +TS_TARGET="$PACKAGE_DIR/src/defaultPrices.ts" +SOURCE_URL="https://raw.githubusercontent.com/langfuse/langfuse/main/worker/src/constants/default-model-prices.json" + +CHECK_MODE=false +if [[ "${1:-}" == "--check" ]]; then + CHECK_MODE=true +fi + +echo "Fetching latest model prices from Langfuse..." +TMPFILE=$(mktemp) +trap 'rm -f "$TMPFILE"' EXIT + +if ! 
curl -fsSL "$SOURCE_URL" -o "$TMPFILE"; then + echo "ERROR: Failed to fetch from $SOURCE_URL" + exit 1 +fi + +# Validate it's valid JSON with at least some models +MODEL_COUNT=$(node -e "console.log(JSON.parse(require('fs').readFileSync('$TMPFILE','utf-8')).length)" 2>/dev/null || echo "0") +if [[ "$MODEL_COUNT" -lt 10 ]]; then + echo "ERROR: Downloaded file has only $MODEL_COUNT models (expected 100+). Aborting." + exit 1 +fi + +if $CHECK_MODE; then + if diff -q "$JSON_TARGET" "$TMPFILE" > /dev/null 2>&1; then + echo "Model prices are up to date ($MODEL_COUNT models)" + exit 0 + else + echo "Model prices are OUTDATED. Run 'pnpm run sync-prices' in @internal/llm-pricing to update." + exit 1 + fi +fi + +cp "$TMPFILE" "$JSON_TARGET" +echo "Updated default-model-prices.json ($MODEL_COUNT models)" + +# Generate the TypeScript module from the JSON +echo "Generating defaultPrices.ts..." +node -e " +const data = JSON.parse(require('fs').readFileSync('$JSON_TARGET', 'utf-8')); +const stripped = data.map(e => ({ + modelName: e.modelName.trim(), + matchPattern: e.matchPattern, + startDate: e.createdAt, + pricingTiers: e.pricingTiers.map(t => ({ + name: t.name, + isDefault: t.isDefault, + priority: t.priority, + conditions: t.conditions.map(c => ({ + usageDetailPattern: c.usageDetailPattern, + operator: c.operator, + value: c.value, + })), + prices: t.prices, + })), +})); + +let out = 'import type { DefaultModelDefinition } from \"./types.js\";\n\n'; +out += '// Auto-generated from Langfuse default-model-prices.json — do not edit manually.\n'; +out += '// Run \`pnpm run sync-prices\` to update from upstream.\n'; +out += '// Source: https://github.com/langfuse/langfuse\n\n'; +out += 'export const defaultModelPrices: DefaultModelDefinition[] = '; +out += JSON.stringify(stripped, null, 2) + ';\n'; +require('fs').writeFileSync('$TS_TARGET', out); +console.log('Generated defaultPrices.ts with ' + stripped.length + ' models'); +" diff --git 
a/internal-packages/llm-pricing/src/default-model-prices.json b/internal-packages/llm-pricing/src/default-model-prices.json new file mode 100644 index 00000000000..4d2394ec082 --- /dev/null +++ b/internal-packages/llm-pricing/src/default-model-prices.json @@ -0,0 +1,3863 @@ +[ + { + "id": "b9854a5c92dc496b997d99d20", + "modelName": "gpt-4o", + "matchPattern": "(?i)^(openai\/)?(gpt-4o)$", + "createdAt": "2024-05-13T23:15:07.670Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "b9854a5c92dc496b997d99d20_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + { + "id": "b9854a5c92dc496b997d99d21", + "modelName": "gpt-4o-2024-05-13", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-2024-05-13)$", + "createdAt": "2024-05-13T23:15:07.670Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o-2024-05-13", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "b9854a5c92dc496b997d99d21_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000005, + "output": 0.000015 + } + } + ] + }, + { + "id": "clrkvq6iq000008ju6c16gynt", + "modelName": "gpt-4-1106-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4-1106-preview)$", + "createdAt": "2024-04-23T10:37:17.092Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-1106-preview", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkvq6iq000008ju6c16gynt_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + 
"conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "clrkvx5gp000108juaogs54ea", + "modelName": "gpt-4-turbo-vision", + "matchPattern": "(?i)^(openai\/)?(gpt-4(-\\d{4})?-vision-preview)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-vision-preview", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkvx5gp000108juaogs54ea_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "clrkvyzgw000308jue4hse4j9", + "modelName": "gpt-4-32k", + "matchPattern": "(?i)^(openai\/)?(gpt-4-32k)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-32k", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkvyzgw000308jue4hse4j9_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "id": "clrkwk4cb000108l5hwwh3zdi", + "modelName": "gpt-4-32k-0613", + "matchPattern": "(?i)^(openai\/)?(gpt-4-32k-0613)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-32k-0613", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkwk4cb000108l5hwwh3zdi_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "id": "clrkwk4cb000208l59yvb9yq8", + "modelName": "gpt-3.5-turbo-1106", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-1106)$", + "createdAt": 
"2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-1106", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkwk4cb000208l59yvb9yq8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000001, + "output": 0.000002 + } + } + ] + }, + { + "id": "clrkwk4cc000808l51xmk4uic", + "modelName": "gpt-3.5-turbo-0613", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-0613)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-0613", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkwk4cc000808l51xmk4uic_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000015, + "output": 0.000002 + } + } + ] + }, + { + "id": "clrkwk4cc000908l537kl0rx3", + "modelName": "gpt-4-0613", + "matchPattern": "(?i)^(openai\/)?(gpt-4-0613)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-0613", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrkwk4cc000908l537kl0rx3_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "id": "clrkwk4cc000a08l562uc3s9g", + "modelName": "gpt-3.5-turbo-instruct", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-instruct)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + 
"pricingTiers": [ + { + "id": "clrkwk4cc000a08l562uc3s9g_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000015, + "output": 0.000002 + } + } + ] + }, + { + "id": "clrntjt89000108jwcou1af71", + "modelName": "text-ada-001", + "matchPattern": "(?i)^(text-ada-001)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-ada-001" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000108jwcou1af71_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.000004 + } + } + ] + }, + { + "id": "clrntjt89000208jwawjr894q", + "modelName": "text-babbage-001", + "matchPattern": "(?i)^(text-babbage-001)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-babbage-001" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000208jwawjr894q_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 5e-7 + } + } + ] + }, + { + "id": "clrntjt89000308jw0jtfa4rs", + "modelName": "text-curie-001", + "matchPattern": "(?i)^(text-curie-001)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-curie-001" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000308jw0jtfa4rs_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "id": "clrntjt89000408jwc2c93h6i", + "modelName": "text-davinci-001", + "matchPattern": "(?i)^(text-davinci-001)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-davinci-001" + }, 
+ "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000408jwc2c93h6i_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "id": "clrntjt89000508jw192m64qi", + "modelName": "text-davinci-002", + "matchPattern": "(?i)^(text-davinci-002)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-davinci-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000508jw192m64qi_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "id": "clrntjt89000608jw4m3x5s55", + "modelName": "text-davinci-003", + "matchPattern": "(?i)^(text-davinci-003)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-davinci-003" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000608jw4m3x5s55_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "id": "clrntjt89000908jwhvkz5crg", + "modelName": "text-embedding-ada-002-v2", + "matchPattern": "(?i)^(text-embedding-ada-002-v2)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + "tokenizerConfig": { + "tokenizerModel": "text-embedding-ada-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000908jwhvkz5crg_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "id": "clrntjt89000908jwhvkz5crm", + "modelName": "text-embedding-ada-002", + "matchPattern": "(?i)^(text-embedding-ada-002)$", + "createdAt": "2024-01-24T18:18:50.861Z", + "updatedAt": "2024-01-24T18:18:50.861Z", + 
"tokenizerConfig": { + "tokenizerModel": "text-embedding-ada-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000908jwhvkz5crm_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "id": "clrntjt89000a08jw0gcdbd5a", + "modelName": "gpt-3.5-turbo-16k-0613", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-16k-0613)$", + "createdAt": "2024-02-03T17:29:57.350Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-16k-0613", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntjt89000a08jw0gcdbd5a_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "output": 0.000004 + } + } + ] + }, + { + "id": "clrntkjgy000a08jx4e062mr0", + "modelName": "gpt-3.5-turbo-0301", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-0301)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": -1, + "tokenizerModel": "gpt-3.5-turbo-0301", + "tokensPerMessage": 4 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntkjgy000a08jx4e062mr0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "output": 0.000002 + } + } + ] + }, + { + "id": "clrntkjgy000d08jx0p4y9h4l", + "modelName": "gpt-4-32k-0314", + "matchPattern": "(?i)^(openai\/)?(gpt-4-32k-0314)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-32k-0314", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntkjgy000d08jx0p4y9h4l_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, 
+ "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "id": "clrntkjgy000e08jx4x6uawoo", + "modelName": "gpt-4-0314", + "matchPattern": "(?i)^(openai\/)?(gpt-4-0314)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-0314", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntkjgy000e08jx4x6uawoo_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "id": "clrntkjgy000f08jx79v9g1xj", + "modelName": "gpt-4", + "matchPattern": "(?i)^(openai\/)?(gpt-4)$", + "createdAt": "2024-01-24T10:19:21.693Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrntkjgy000f08jx79v9g1xj_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "id": "clrnwb41q000308jsfrac9uh6", + "modelName": "claude-instant-1.2", + "matchPattern": "(?i)^(anthropic\/)?(claude-instant-1.2)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwb41q000308jsfrac9uh6_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000163, + "output": 0.00000551 + } + } + ] + }, + { + "id": "clrnwb836000408jsallr6u11", + "modelName": "claude-2.0", + "matchPattern": "(?i)^(anthropic\/)?(claude-2.0)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": 
"clrnwb836000408jsallr6u11_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "id": "clrnwbd1m000508js4hxu6o7n", + "modelName": "claude-2.1", + "matchPattern": "(?i)^(anthropic\/)?(claude-2.1)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwbd1m000508js4hxu6o7n_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "id": "clrnwbg2b000608jse2pp4q2d", + "modelName": "claude-1.3", + "matchPattern": "(?i)^(anthropic\/)?(claude-1.3)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwbg2b000608jse2pp4q2d_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "id": "clrnwbi9d000708jseiy44k26", + "modelName": "claude-1.2", + "matchPattern": "(?i)^(anthropic\/)?(claude-1.2)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwbi9d000708jseiy44k26_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "id": "clrnwblo0000808jsc1385hdp", + "modelName": "claude-1.1", + "matchPattern": "(?i)^(anthropic\/)?(claude-1.1)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwblo0000808jsc1385hdp_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + 
"input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "id": "clrnwbota000908jsgg9mb1ml", + "modelName": "claude-instant-1", + "matchPattern": "(?i)^(anthropic\/)?(claude-instant-1)$", + "createdAt": "2024-01-30T15:44:13.447Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clrnwbota000908jsgg9mb1ml_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000163, + "output": 0.00000551 + } + } + ] + }, + { + "id": "clrs2dnql000108l46vo0gp2t", + "modelName": "babbage-002", + "matchPattern": "(?i)^(babbage-002)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": "2024-01-26T17:35:21.129Z", + "tokenizerConfig": { + "tokenizerModel": "babbage-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrs2dnql000108l46vo0gp2t_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "output": 0.0000016 + } + } + ] + }, + { + "id": "clrs2ds35000208l4g4b0hi3u", + "modelName": "davinci-002", + "matchPattern": "(?i)^(davinci-002)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": "2024-01-26T17:35:21.129Z", + "tokenizerConfig": { + "tokenizerModel": "davinci-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clrs2ds35000208l4g4b0hi3u_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000006, + "output": 0.000012 + } + } + ] + }, + { + "id": "clruwn3pc00010al7bl611c8o", + "modelName": "text-embedding-3-small", + "matchPattern": "(?i)^(text-embedding-3-small)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": "2024-01-26T17:35:21.129Z", + "tokenizerConfig": { + "tokenizerModel": "text-embedding-ada-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clruwn3pc00010al7bl611c8o_tier_default", + "name": "Standard", + "isDefault": true, 
+ "priority": 0, + "conditions": [], + "prices": { + "total": 2e-8 + } + } + ] + }, + { + "id": "clruwn76700020al7gp8e4g4l", + "modelName": "text-embedding-3-large", + "matchPattern": "(?i)^(text-embedding-3-large)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": "2024-01-26T17:35:21.129Z", + "tokenizerConfig": { + "tokenizerModel": "text-embedding-ada-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clruwn76700020al7gp8e4g4l_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1.3e-7 + } + } + ] + }, + { + "id": "clruwnahl00030al7ab9rark7", + "modelName": "gpt-3.5-turbo-0125", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-0125)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clruwnahl00030al7ab9rark7_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "id": "clruwnahl00040al78f1lb0at", + "modelName": "gpt-3.5-turbo", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo)$", + "createdAt": "2024-02-13T12:00:37.424Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clruwnahl00040al78f1lb0at_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "id": "clruwnahl00050al796ck3p44", + "modelName": "gpt-4-0125-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4-0125-preview)$", + "createdAt": "2024-01-26T17:35:21.129Z", + "updatedAt": 
"2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clruwnahl00050al796ck3p44_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "cls08r8sq000308jq14ae96f0", + "modelName": "ft:gpt-3.5-turbo-1106", + "matchPattern": "(?i)^(ft:)(gpt-3.5-turbo-1106:)(.+)(:)(.*)(:)(.+)$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-1106", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cls08r8sq000308jq14ae96f0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "output": 0.000006 + } + } + ] + }, + { + "id": "cls08rp99000408jqepxoakjv", + "modelName": "ft:gpt-3.5-turbo-0613", + "matchPattern": "(?i)^(ft:)(gpt-3.5-turbo-0613:)(.+)(:)(.*)(:)(.+)$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-0613", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cls08rp99000408jqepxoakjv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000012, + "output": 0.000016 + } + } + ] + }, + { + "id": "cls08rv9g000508jq5p4z4nlr", + "modelName": "ft:davinci-002", + "matchPattern": "(?i)^(ft:)(davinci-002:)(.+)(:)(.*)(:)(.+)$$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "tokenizerConfig": { + "tokenizerModel": "davinci-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cls08rv9g000508jq5p4z4nlr_tier_default", + "name": 
"Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000012, + "output": 0.000012 + } + } + ] + }, + { + "id": "cls08s2bw000608jq57wj4un2", + "modelName": "ft:babbage-002", + "matchPattern": "(?i)^(ft:)(babbage-002:)(.+)(:)(.*)(:)(.+)$$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "tokenizerConfig": { + "tokenizerModel": "babbage-002" + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cls08s2bw000608jq57wj4un2_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000016, + "output": 0.0000016 + } + } + ] + }, + { + "id": "cls0iv12d000108l251gf3038", + "modelName": "chat-bison", + "matchPattern": "(?i)^(chat-bison)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0iv12d000108l251gf3038_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls0j33v1000008joagkc4lql", + "modelName": "codechat-bison-32k", + "matchPattern": "(?i)^(codechat-bison-32k)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0j33v1000008joagkc4lql_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls0jmc9v000008l8ee6r3gsd", + "modelName": "codechat-bison", + "matchPattern": "(?i)^(codechat-bison)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0jmc9v000008l8ee6r3gsd_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + 
} + ] + }, + { + "id": "cls0jmjt3000108l83ix86w0d", + "modelName": "text-bison-32k", + "matchPattern": "(?i)^(text-bison-32k)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0jmjt3000108l83ix86w0d_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls0jni4t000008jk3kyy803r", + "modelName": "chat-bison-32k", + "matchPattern": "(?i)^(chat-bison-32k)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0jni4t000008jk3kyy803r_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls0jungb000208jk12gm4gk1", + "modelName": "text-unicorn", + "matchPattern": "(?i)^(text-unicorn)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0jungb000208jk12gm4gk1_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "output": 0.0000075 + } + } + ] + }, + { + "id": "cls0juygp000308jk2a6x9my2", + "modelName": "text-bison", + "matchPattern": "(?i)^(text-bison)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls0juygp000308jk2a6x9my2_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls1nyj5q000208l33ne901d8", + "modelName": "textembedding-gecko", + "matchPattern": "(?i)^(textembedding-gecko)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": 
"2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls1nyj5q000208l33ne901d8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "id": "cls1nyyjp000308l31gxy1bih", + "modelName": "textembedding-gecko-multilingual", + "matchPattern": "(?i)^(textembedding-gecko-multilingual)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls1nyyjp000308l31gxy1bih_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "id": "cls1nzjt3000508l3dnwad3g0", + "modelName": "code-gecko", + "matchPattern": "(?i)^(code-gecko)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls1nzjt3000508l3dnwad3g0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls1nzwx4000608l38va7e4tv", + "modelName": "code-bison", + "matchPattern": "(?i)^(code-bison)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls1nzwx4000608l38va7e4tv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cls1o053j000708l39f8g4bgs", + "modelName": "code-bison-32k", + "matchPattern": "(?i)^(code-bison-32k)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-01-31T13:25:02.141Z", + "updatedAt": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "id": "cls1o053j000708l39f8g4bgs_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + 
"id": "clsk9lntu000008jwfc51bbqv", + "modelName": "gpt-3.5-turbo-16k", + "matchPattern": "(?i)^(openai\/)?(gpt-)(35|3.5)(-turbo-16k)$", + "createdAt": "2024-02-13T12:00:37.424Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-3.5-turbo-16k", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clsk9lntu000008jwfc51bbqv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "id": "clsnq07bn000008l4e46v1ll8", + "modelName": "gpt-4-turbo-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4-turbo-preview)$", + "createdAt": "2024-02-15T21:21:50.947Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clsnq07bn000008l4e46v1ll8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "cltgy0iuw000008le3vod1hhy", + "modelName": "claude-3-opus-20240229", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-opus-20240229|anthropic\\.claude-3-opus-20240229-v1:0|claude-3-opus@20240229)$", + "createdAt": "2024-03-07T17:55:38.139Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cltgy0iuw000008le3vod1hhy_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.000075 + } + } + ] + }, + { + "id": "cltgy0pp6000108le56se7bl3", + "modelName": "claude-3-sonnet-20240229", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-sonnet-20240229|anthropic\\.claude-3-sonnet-20240229-v1:0|claude-3-sonnet@20240229)$", + "createdAt": "2024-03-07T17:55:38.139Z", + "updatedAt": 
"2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cltgy0pp6000108le56se7bl3_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "cltr0w45b000008k1407o9qv1", + "modelName": "claude-3-haiku-20240307", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-haiku-20240307|anthropic\\.claude-3-haiku-20240307-v1:0|claude-3-haiku@20240307)$", + "createdAt": "2024-03-14T09:41:18.736Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cltr0w45b000008k1407o9qv1_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 0.00000125 + } + } + ] + }, + { + "id": "cluv2sjeo000008ih0fv23hi0", + "modelName": "gemini-1.0-pro-latest", + "matchPattern": "(?i)^(google\/)?(gemini-1.0-pro-latest)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-04-11T10:27:46.517Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cluv2sjeo000008ih0fv23hi0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "id": "cluv2subq000108ih2mlrga6a", + "modelName": "gemini-1.0-pro", + "matchPattern": "(?i)^(google\/)?(gemini-1.0-pro)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-04-11T10:27:46.517Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cluv2subq000108ih2mlrga6a_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 
1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "id": "cluv2sx04000208ihbek75lsz", + "modelName": "gemini-1.0-pro-001", + "matchPattern": "(?i)^(google\/)?(gemini-1.0-pro-001)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-04-11T10:27:46.517Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cluv2sx04000208ihbek75lsz_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "id": "cluv2szw0000308ihch3n79x7", + "modelName": "gemini-pro", + "matchPattern": "(?i)^(google\/)?(gemini-pro)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-04-11T10:27:46.517Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cluv2szw0000308ihch3n79x7_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "id": "cluv2t2x0000408ihfytl45l1", + "modelName": "gemini-1.5-pro-latest", + "matchPattern": "(?i)^(google\/)?(gemini-1.5-pro-latest)(@[a-zA-Z0-9]+)?$", + "createdAt": "2024-04-11T10:27:46.517Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cluv2t2x0000408ihfytl45l1_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "output": 0.0000075 + } + } + ] + }, + { + "id": "cluv2t5k3000508ih5kve9zag", + "modelName": "gpt-4-turbo-2024-04-09", + "matchPattern": "(?i)^(openai\/)?(gpt-4-turbo-2024-04-09)$", + "createdAt": "2024-04-23T10:37:17.092Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-turbo-2024-04-09", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cluv2t5k3000508ih5kve9zag_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + 
"output": 0.00003 + } + } + ] + }, + { + "id": "cluvpl4ls000008l6h2gx3i07", + "modelName": "gpt-4-turbo", + "matchPattern": "(?i)^(openai\/)?(gpt-4-turbo)$", + "createdAt": "2024-04-11T21:13:44.989Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-1106-preview", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cluvpl4ls000008l6h2gx3i07_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "clv2o2x0p000008jsf9afceau", + "modelName": " gpt-4-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4-preview)$", + "createdAt": "2024-04-23T10:37:17.092Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4-turbo-preview", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clv2o2x0p000008jsf9afceau_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "id": "clxt0n0m60000pumz1j5b7zsf", + "modelName": "claude-3-5-sonnet-20240620", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-5-sonnet-20240620|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-sonnet-20240620-v1:0|claude-3-5-sonnet@20240620)$", + "createdAt": "2024-06-25T11:47:24.475Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "clxt0n0m60000pumz1j5b7zsf_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + 
"cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "clyrjp56f0000t0mzapoocd7u", + "modelName": "gpt-4o-mini", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-mini)$", + "createdAt": "2024-07-18T17:56:09.591Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clyrjp56f0000t0mzapoocd7u_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.5e-7, + "output": 6e-7, + "input_cached_tokens": 7.5e-8, + "input_cache_read": 7.5e-8 + } + } + ] + }, + { + "id": "clyrjpbe20000t0mzcbwc42rg", + "modelName": "gpt-4o-mini-2024-07-18", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-mini-2024-07-18)$", + "createdAt": "2024-07-18T17:56:09.591Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clyrjpbe20000t0mzcbwc42rg_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.5e-7, + "input_cached_tokens": 7.5e-8, + "input_cache_read": 7.5e-8, + "output": 6e-7 + } + } + ] + }, + { + "id": "clzjr85f70000ymmzg7hqffra", + "modelName": "gpt-4o-2024-08-06", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-2024-08-06)$", + "createdAt": "2024-08-07T11:54:31.298Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "clzjr85f70000ymmzg7hqffra_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + 
{ + "id": "cm10ivcdp0000gix7lelmbw80", + "modelName": "o1-preview", + "matchPattern": "(?i)^(openai\/)?(o1-preview)$", + "createdAt": "2024-09-13T10:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm10ivcdp0000gix7lelmbw80_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "id": "cm10ivo130000n8x7qopcjjcg", + "modelName": "o1-preview-2024-09-12", + "matchPattern": "(?i)^(openai\/)?(o1-preview-2024-09-12)$", + "createdAt": "2024-09-13T10:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm10ivo130000n8x7qopcjjcg_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "id": "cm10ivwo40000r1x7gg3syjq0", + "modelName": "o1-mini", + "matchPattern": "(?i)^(openai\/)?(o1-mini)$", + "createdAt": "2024-09-13T10:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm10ivwo40000r1x7gg3syjq0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm10iw6p20000wgx7it1hlb22", + "modelName": "o1-mini-2024-09-12", + "matchPattern": "(?i)^(openai\/)?(o1-mini-2024-09-12)$", + "createdAt": "2024-09-13T10:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": 
"cm10iw6p20000wgx7it1hlb22_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm2krz1uf000208jjg5653iud", + "modelName": "claude-3.5-sonnet-20241022", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-5-sonnet-20241022|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-sonnet-20241022-v2:0|claude-3-5-sonnet-V2@20241022)$", + "createdAt": "2024-10-22T18:48:01.676Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm2krz1uf000208jjg5653iud_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "cm2ks2vzn000308jjh4ze1w7q", + "modelName": "claude-3.5-sonnet-latest", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-5-sonnet-latest)$", + "createdAt": "2024-10-22T18:48:01.676Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm2ks2vzn000308jjh4ze1w7q_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": 
"cm34aq60d000207ml0j1h31ar", + "modelName": "claude-3-5-haiku-20241022", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-5-haiku-20241022|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-haiku-20241022-v1:0|claude-3-5-haiku-V1@20241022)$", + "createdAt": "2024-11-05T10:30:50.566Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm34aq60d000207ml0j1h31ar_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 8e-7, + "input_tokens": 8e-7, + "output": 0.000004, + "output_tokens": 0.000004, + "cache_creation_input_tokens": 0.000001, + "input_cache_creation": 0.000001, + "input_cache_creation_5m": 0.000001, + "input_cache_creation_1h": 0.0000016, + "cache_read_input_tokens": 8e-8, + "input_cache_read": 8e-8 + } + } + ] + }, + { + "id": "cm34aqb9h000307ml6nypd618", + "modelName": "claude-3.5-haiku-latest", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-5-haiku-latest)$", + "createdAt": "2024-11-05T10:30:50.566Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm34aqb9h000307ml6nypd618_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 8e-7, + "input_tokens": 8e-7, + "output": 0.000004, + "output_tokens": 0.000004, + "cache_creation_input_tokens": 0.000001, + "input_cache_creation": 0.000001, + "input_cache_creation_5m": 0.000001, + "input_cache_creation_1h": 0.0000016, + "cache_read_input_tokens": 8e-8, + "input_cache_read": 8e-8 + } + } + ] + }, + { + "id": "cm3x0p8ev000008kyd96800c8", + "modelName": "chatgpt-4o-latest", + "matchPattern": "(?i)^(chatgpt-4o-latest)$", + "createdAt": "2024-11-25T12:47:17.504Z", + "updatedAt": "2024-11-25T12:47:17.504Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": 
"cm3x0p8ev000008kyd96800c8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000005, + "output": 0.000015 + } + } + ] + }, + { + "id": "cm48akqgo000008ldbia24qg0", + "modelName": "gpt-4o-2024-11-20", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-2024-11-20)$", + "createdAt": "2024-12-03T10:06:12.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4o", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm48akqgo000008ldbia24qg0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + { + "id": "cm48b2ksh000008l0hn3u0hl3", + "modelName": "gpt-4o-audio-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-audio-preview)$", + "createdAt": "2024-12-03T10:19:56.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48b2ksh000008l0hn3u0hl3_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.0000025, + "output_text_tokens": 0.00001, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "id": "cm48bbm0k000008l69nsdakwf", + "modelName": "gpt-4o-audio-preview-2024-10-01", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-audio-preview-2024-10-01)$", + "createdAt": "2024-12-03T10:19:56.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48bbm0k000008l69nsdakwf_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.0000025, + "output_text_tokens": 0.00001, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + 
"output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "id": "cm48c2qh4000008mhgy4mg2qc", + "modelName": "gpt-4o-realtime-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-realtime-preview)$", + "createdAt": "2024-12-03T10:19:56.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48c2qh4000008mhgy4mg2qc_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.000005, + "input_cached_text_tokens": 0.0000025, + "output_text_tokens": 0.00002, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "input_cached_audio_tokens": 0.00002, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "id": "cm48cjxtc000008jrcsso3avv", + "modelName": "gpt-4o-realtime-preview-2024-10-01", + "matchPattern": "(?i)^(openai\/)?(gpt-4o-realtime-preview-2024-10-01)$", + "createdAt": "2024-12-03T10:19:56.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48cjxtc000008jrcsso3avv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.000005, + "input_cached_text_tokens": 0.0000025, + "output_text_tokens": 0.00002, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "input_cached_audio_tokens": 0.00002, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "id": "cm48cjxtc000108jrcsso3avv", + "modelName": "o1", + "matchPattern": "(?i)^(openai\/)?(o1)$", + "createdAt": "2025-01-17T00:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48cjxtc000108jrcsso3avv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + 
} + ] + }, + { + "id": "cm48cjxtc000208jrcsso3avv", + "modelName": "o1-2024-12-17", + "matchPattern": "(?i)^(openai\/)?(o1-2024-12-17)$", + "createdAt": "2025-01-17T00:01:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm48cjxtc000208jrcsso3avv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "id": "cm6l8j7vs0000tymz9vk7ew8t", + "modelName": "o3-mini", + "matchPattern": "(?i)^(openai\/)?(o3-mini)$", + "createdAt": "2025-01-31T20:41:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm6l8j7vs0000tymz9vk7ew8t_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm6l8jan90000tymz52sh0ql8", + "modelName": "o3-mini-2025-01-31", + "matchPattern": "(?i)^(openai\/)?(o3-mini-2025-01-31)$", + "createdAt": "2025-01-31T20:41:35.373Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm6l8jan90000tymz52sh0ql8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm6l8jdef0000tymz52sh0ql0", + "modelName": "gemini-2.0-flash-001", + "matchPattern": "(?i)^(google\/)?(gemini-2.0-flash-001)(@[a-zA-Z0-9]+)?$", + "createdAt": "2025-02-06T11:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + 
"pricingTiers": [ + { + "id": "cm6l8jdef0000tymz52sh0ql0_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "output": 4e-7 + } + } + ] + }, + { + "id": "cm6l8jfgh0000tymz52sh0ql1", + "modelName": "gemini-2.0-flash-lite-preview-02-05", + "matchPattern": "(?i)^(google\/)?(gemini-2.0-flash-lite-preview-02-05)(@[a-zA-Z0-9]+)?$", + "createdAt": "2025-02-06T11:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm6l8jfgh0000tymz52sh0ql1_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 7.5e-8, + "output": 3e-7 + } + } + ] + }, + { + "id": "cm7ka7561000108js3t9tb3at", + "modelName": "claude-3.7-sonnet-20250219", + "matchPattern": "(?i)^(anthropic\/)?(claude-3.7-sonnet-20250219|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3.7-sonnet-20250219-v1:0|claude-3-7-sonnet-V1@20250219)$", + "createdAt": "2025-02-25T09:35:39.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm7ka7561000108js3t9tb3at_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "cm7ka7zob000208jsfs9h5ajj", + "modelName": "claude-3.7-sonnet-latest", + "matchPattern": "(?i)^(anthropic\/)?(claude-3-7-sonnet-latest)$", + "createdAt": "2025-02-25T09:35:39.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cm7ka7zob000208jsfs9h5ajj_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + 
"conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "cm7nusjvk0000tvmz71o85jwg", + "modelName": "gpt-4.5-preview", + "matchPattern": "(?i)^(openai\/)?(gpt-4.5-preview)$", + "createdAt": "2025-02-27T21:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7nusjvk0000tvmz71o85jwg_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000075, + "input_cached_tokens": 0.0000375, + "input_cached_text_tokens": 0.0000375, + "input_cache_read": 0.0000375, + "output": 0.00015 + } + } + ] + }, + { + "id": "cm7nusn640000tvmzf10z2x65", + "modelName": "gpt-4.5-preview-2025-02-27", + "matchPattern": "(?i)^(openai\/)?(gpt-4.5-preview-2025-02-27)$", + "createdAt": "2025-02-27T21:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7nusn640000tvmzf10z2x65_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000075, + "input_cached_tokens": 0.0000375, + "input_cached_text_tokens": 0.0000375, + "input_cache_read": 0.0000375, + "output": 0.00015 + } + } + ] + }, + { + "id": "cm7nusn643377tvmzh27m33kl", + "modelName": "gpt-4.1", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1)$", + "createdAt": "2025-04-15T10:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7nusn643377tvmzh27m33kl_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": 
{ + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cached_text_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008 + } + } + ] + }, + { + "id": "cm7qahw732891bpmzy45r3x70", + "modelName": "gpt-4.1-2025-04-14", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1-2025-04-14)$", + "createdAt": "2025-04-15T10:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7qahw732891bpmzy45r3x70_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cached_text_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008 + } + } + ] + }, + { + "id": "cm7sglt825463kxnza72p6v81", + "modelName": "gpt-4.1-mini-2025-04-14", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1-mini-2025-04-14)$", + "createdAt": "2025-04-15T10:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7sglt825463kxnza72p6v81_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "input_cached_tokens": 1e-7, + "input_cached_text_tokens": 1e-7, + "input_cache_read": 1e-7, + "output": 0.0000016 + } + } + ] + }, + { + "id": "cm7vxpz967124dhjtb95w8f92", + "modelName": "gpt-4.1-nano-2025-04-14", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1-nano-2025-04-14)$", + "createdAt": "2025-04-15T10:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7vxpz967124dhjtb95w8f92_tier_default", + "name": "Standard", + "isDefault": true, + 
"priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_cached_tokens": 2.5e-8, + "input_cached_text_tokens": 2.5e-8, + "input_cache_read": 2.5e-8, + "output": 4e-7 + } + } + ] + }, + { + "id": "cm7wmny967124dhjtb95w8f81", + "modelName": "o3", + "matchPattern": "(?i)^(openai\/)?(o3)$", + "createdAt": "2025-04-16T23:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7wmny967124dhjtb95w8f81_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008, + "output_reasoning_tokens": 0.000008, + "output_reasoning": 0.000008 + } + } + ] + }, + { + "id": "cm7wopq3327124dhjtb95w8f81", + "modelName": "o3-2025-04-16", + "matchPattern": "(?i)^(openai\/)?(o3-2025-04-16)$", + "createdAt": "2025-04-16T23:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7wopq3327124dhjtb95w8f81_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008, + "output_reasoning_tokens": 0.000008, + "output_reasoning": 0.000008 + } + } + ] + }, + { + "id": "cm7wqrs1327124dhjtb95w8f81", + "modelName": "o4-mini", + "matchPattern": "(?i)^(o4-mini)$", + "createdAt": "2025-04-16T23:26:54.132Z", + "updatedAt": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "id": "cm7wqrs1327124dhjtb95w8f81_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 2.75e-7, + "input_cache_read": 2.75e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm7zqrs1327124dhjtb95w8f82", + "modelName": "o4-mini-2025-04-16", + "matchPattern": 
"(?i)^(o4-mini-2025-04-16)$", + "createdAt": "2025-04-16T23:26:54.132Z", + "updatedAt": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "id": "cm7zqrs1327124dhjtb95w8f82_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 2.75e-7, + "input_cache_read": 2.75e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "id": "cm7zsrs1327124dhjtb95w8f74", + "modelName": "gemini-2.0-flash", + "matchPattern": "(?i)^(google\/)?(gemini-2.0-flash)(@[a-zA-Z0-9]+)?$", + "createdAt": "2025-04-22T10:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7zsrs1327124dhjtb95w8f74_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "output": 4e-7 + } + } + ] + }, + { + "id": "cm7ztrs1327124dhjtb95w8f19", + "modelName": "gemini-2.0-flash-lite-preview", + "matchPattern": "(?i)^(google\/)?(gemini-2.0-flash-lite-preview)(@[a-zA-Z0-9]+)?$", + "createdAt": "2025-04-22T10:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cm7ztrs1327124dhjtb95w8f19_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 7.5e-8, + "output": 3e-7 + } + } + ] + }, + { + "id": "cm7zxrs1327124dhjtb95w8f45", + "modelName": "gpt-4.1-nano", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1-nano)$", + "createdAt": "2025-04-22T10:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7zxrs1327124dhjtb95w8f45_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_cached_tokens": 2.5e-8, + 
"input_cached_text_tokens": 2.5e-8, + "input_cache_read": 2.5e-8, + "output": 4e-7 + } + } + ] + }, + { + "id": "cm7zzrs1327124dhjtb95w8p96", + "modelName": "gpt-4.1-mini", + "matchPattern": "(?i)^(openai\/)?(gpt-4.1-mini)$", + "createdAt": "2025-04-22T10:11:35.241Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cm7zzrs1327124dhjtb95w8p96_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "input_cached_tokens": 1e-7, + "input_cached_text_tokens": 1e-7, + "input_cache_read": 1e-7, + "output": 0.0000016 + } + } + ] + }, + { + "id": "c5qmrqolku82tra3vgdixmys", + "modelName": "claude-sonnet-4-5-20250929", + "matchPattern": "(?i)^(anthropic\/)?(claude-sonnet-4-5(-20250929)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4-5(-20250929)?-v1(:0)?|claude-sonnet-4-5-V1(@20250929)?|claude-sonnet-4-5(@20250929)?)$", + "createdAt": "2025-09-29T00:00:00.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "c5qmrqolku82tra3vgdixmys_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + }, + { + "id": "00b65240-047b-4722-9590-808edbc2067f", + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "input", + "operator": "gt", + "value": 200000, + "caseSensitive": false + } + ], + "prices": { + "input": 0.000006, + "input_tokens": 0.000006, + "output": 
0.0000225, + "output_tokens": 0.0000225, + "cache_creation_input_tokens": 0.0000075, + "input_cache_creation": 0.0000075, + "input_cache_creation_5m": 0.0000075, + "input_cache_creation_1h": 0.000012, + "cache_read_input_tokens": 6e-7, + "input_cache_read": 6e-7 + } + } + ] + }, + { + "id": "cmazmkzlm00000djp1e1qe4k4", + "modelName": "claude-sonnet-4-20250514", + "matchPattern": "(?i)^(anthropic\/)?(claude-sonnet-4(-20250514)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4(-20250514)?-v1(:0)?|claude-sonnet-4-V1(@20250514)?|claude-sonnet-4(@20250514)?)$", + "createdAt": "2025-05-22T17:09:02.131Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmazmkzlm00000djp1e1qe4k4_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": "cmazmlbnv00010djpazed91va", + "modelName": "claude-sonnet-4-latest", + "matchPattern": "(?i)^(anthropic\/)?(claude-sonnet-4-latest)$", + "createdAt": "2025-05-22T17:09:02.131Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmazmlbnv00010djpazed91va_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "id": 
"cmazmlm2p00020djpa9s64jw5", + "modelName": "claude-opus-4-20250514", + "matchPattern": "(?i)^(anthropic\/)?(claude-opus-4(-20250514)?|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-opus-4(-20250514)?-v1(:0)?|claude-opus-4(@20250514)?)$", + "createdAt": "2025-05-22T17:09:02.131Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmazmlm2p00020djpa9s64jw5_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_tokens": 0.000015, + "output": 0.000075, + "output_tokens": 0.000075, + "cache_creation_input_tokens": 0.00001875, + "input_cache_creation": 0.00001875, + "input_cache_creation_5m": 0.00001875, + "input_cache_creation_1h": 0.00003, + "cache_read_input_tokens": 0.0000015, + "input_cache_read": 0.0000015 + } + } + ] + }, + { + "id": "cmz9x72kq55721pqrs83y4n2bx", + "modelName": "o3-pro", + "matchPattern": "(?i)^(openai\/)?(o3-pro)$", + "createdAt": "2025-06-10T22:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cmz9x72kq55721pqrs83y4n2bx_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00002, + "output": 0.00008, + "output_reasoning_tokens": 0.00008, + "output_reasoning": 0.00008 + } + } + ] + }, + { + "id": "cmz9x72kq55721pqrs83y4n2by", + "modelName": "o3-pro-2025-06-10", + "matchPattern": "(?i)^(openai\/)?(o3-pro-2025-06-10)$", + "createdAt": "2025-06-10T22:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cmz9x72kq55721pqrs83y4n2by_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00002, + "output": 0.00008, + "output_reasoning_tokens": 0.00008, + "output_reasoning": 0.00008 + } + } + ] + }, + { + "id": "cmbrold5b000107lbftb9fdoo", + "modelName": "o1-pro", + "matchPattern": "(?i)^(openai\/)?(o1-pro)$", + 
"createdAt": "2025-06-10T22:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cmbrold5b000107lbftb9fdoo_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00015, + "output": 0.0006, + "output_reasoning_tokens": 0.0006, + "output_reasoning": 0.0006 + } + } + ] + }, + { + "id": "cmbrolpax000207lb3xkedysz", + "modelName": "o1-pro-2025-03-19", + "matchPattern": "(?i)^(openai\/)?(o1-pro-2025-03-19)$", + "createdAt": "2025-06-10T22:26:54.132Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cmbrolpax000207lb3xkedysz_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00015, + "output": 0.0006, + "output_reasoning_tokens": 0.0006, + "output_reasoning": 0.0006 + } + } + ] + }, + { + "id": "cmcnjkfwn000107l43bf5e8ax", + "modelName": "gemini-2.5-flash", + "matchPattern": "(?i)^(google\/)?(gemini-2.5-flash)$", + "createdAt": "2025-07-03T13:44:06.964Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "pricingTiers": [ + { + "id": "cmcnjkfwn000107l43bf5e8ax_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 3e-7, + "input_text": 3e-7, + "input_modality_1": 3e-7, + "prompt_token_count": 3e-7, + "promptTokenCount": 3e-7, + "input_cached_tokens": 3e-8, + "cached_content_token_count": 3e-8, + "output": 0.0000025, + "output_modality_1": 0.0000025, + "candidates_token_count": 0.0000025, + "candidatesTokenCount": 0.0000025, + "thoughtsTokenCount": 0.0000025, + "thoughts_token_count": 0.0000025, + "output_reasoning": 0.0000025, + "input_audio_tokens": 0.000001 + } + } + ] + }, + { + "id": "cmcnjkrfa000207l4fpnh5mnv", + "modelName": "gemini-2.5-flash-lite", + "matchPattern": "(?i)^(google\/)?(gemini-2.5-flash-lite)$", + "createdAt": "2025-07-03T13:44:06.964Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + 
"pricingTiers": [ + { + "id": "cmcnjkrfa000207l4fpnh5mnv_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_text": 1e-7, + "input_modality_1": 1e-7, + "prompt_token_count": 1e-7, + "promptTokenCount": 1e-7, + "input_cached_tokens": 2.5e-8, + "cached_content_token_count": 2.5e-8, + "output": 4e-7, + "output_modality_1": 4e-7, + "candidates_token_count": 4e-7, + "candidatesTokenCount": 4e-7, + "thoughtsTokenCount": 4e-7, + "thoughts_token_count": 4e-7, + "output_reasoning": 4e-7, + "input_audio_tokens": 5e-7 + } + } + ] + }, + { + "id": "cmdysde5w0000rkmzbc1g5au3", + "modelName": "claude-opus-4-1-20250805", + "matchPattern": "(?i)^(anthropic\/)?(claude-opus-4-1(-20250805)?|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-opus-4-1(-20250805)?-v1(:0)?|claude-opus-4-1(@20250805)?)$", + "createdAt": "2025-08-05T15:00:00.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmdysde5w0000rkmzbc1g5au3_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_tokens": 0.000015, + "output": 0.000075, + "output_tokens": 0.000075, + "cache_creation_input_tokens": 0.00001875, + "input_cache_creation": 0.00001875, + "input_cache_creation_5m": 0.00001875, + "input_cache_creation_1h": 0.00003, + "cache_read_input_tokens": 0.0000015, + "input_cache_read": 0.0000015 + } + } + ] + }, + { + "id": "38c3822a-09a3-457b-b200-2c6f17f7cf2f", + "modelName": "gpt-5", + "matchPattern": "(?i)^(openai\/)?(gpt-5)$", + "createdAt": "2025-08-07T16:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "38c3822a-09a3-457b-b200-2c6f17f7cf2f_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": 
[], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "id": "12543803-2d5f-4189-addc-821ad71c8b55", + "modelName": "gpt-5-2025-08-07", + "matchPattern": "(?i)^(openai\/)?(gpt-5-2025-08-07)$", + "createdAt": "2025-08-11T08:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "12543803-2d5f-4189-addc-821ad71c8b55_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "id": "3d6a975a-a42d-4ea2-a3ec-4ae567d5a364", + "modelName": "gpt-5-mini", + "matchPattern": "(?i)^(openai\/)?(gpt-5-mini)$", + "createdAt": "2025-08-07T16:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "3d6a975a-a42d-4ea2-a3ec-4ae567d5a364_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "input_cached_tokens": 2.5e-8, + "output": 0.000002, + "input_cache_read": 2.5e-8, + "output_reasoning_tokens": 0.000002, + "output_reasoning": 0.000002 + } + } + ] + }, + { + "id": "03b83894-7172-4e1e-8e8b-37d792484efd", + "modelName": "gpt-5-mini-2025-08-07", + "matchPattern": "(?i)^(openai\/)?(gpt-5-mini-2025-08-07)$", + "createdAt": "2025-08-11T08:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 
3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "03b83894-7172-4e1e-8e8b-37d792484efd_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "input_cached_tokens": 2.5e-8, + "output": 0.000002, + "input_cache_read": 2.5e-8, + "output_reasoning_tokens": 0.000002, + "output_reasoning": 0.000002 + } + } + ] + }, + { + "id": "f0b40234-b694-4c40-9494-7b0efd860fb9", + "modelName": "gpt-5-nano", + "matchPattern": "(?i)^(openai\/)?(gpt-5-nano)$", + "createdAt": "2025-08-07T16:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "f0b40234-b694-4c40-9494-7b0efd860fb9_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-8, + "input_cached_tokens": 5e-9, + "output": 4e-7, + "input_cache_read": 5e-9, + "output_reasoning_tokens": 4e-7, + "output_reasoning": 4e-7 + } + } + ] + }, + { + "id": "4489fde4-a594-4011-948b-526989300cd3", + "modelName": "gpt-5-nano-2025-08-07", + "matchPattern": "(?i)^(openai\/)?(gpt-5-nano-2025-08-07)$", + "createdAt": "2025-08-11T08:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "4489fde4-a594-4011-948b-526989300cd3_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-8, + "input_cached_tokens": 5e-9, + "output": 4e-7, + "input_cache_read": 5e-9, + "output_reasoning_tokens": 4e-7, + "output_reasoning": 4e-7 + } + } + ] + }, + { + "id": "8ba72ee3-ebe8-4110-a614-bf81094447e5", + "modelName": "gpt-5-chat-latest", + "matchPattern": "(?i)^(openai\/)?(gpt-5-chat-latest)$", + "createdAt": 
"2025-08-07T16:00:00.000Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "8ba72ee3-ebe8-4110-a614-bf81094447e5_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "id": "cmgg9zco3000004l258um9xk8", + "modelName": "gpt-5-pro", + "matchPattern": "(?i)^(openai\/)?(gpt-5-pro)$", + "createdAt": "2025-10-07T08:03:54.727Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmgg9zco3000004l258um9xk8_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.00012, + "output_reasoning_tokens": 0.00012, + "output_reasoning": 0.00012 + } + } + ] + }, + { + "id": "cmgga0vh9000104l22qe4fes4", + "modelName": "gpt-5-pro-2025-10-06", + "matchPattern": "(?i)^(openai\/)?(gpt-5-pro-2025-10-06)$", + "createdAt": "2025-10-07T08:03:54.727Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmgga0vh9000104l22qe4fes4_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.00012, + "output_reasoning_tokens": 0.00012, + "output_reasoning": 0.00012 + } + } + ] + }, + { + "id": "cmgt5gnkv000104jx171tbq4e", + "modelName": "claude-haiku-4-5-20251001", + "matchPattern": 
"(?i)^(anthropic\/)?(claude-haiku-4-5-20251001|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-haiku-4-5-20251001-v1:0|claude-4-5-haiku@20251001)$", + "createdAt": "2025-10-16T08:20:44.558Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmgt5gnkv000104jx171tbq4e_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000001, + "input_tokens": 0.000001, + "output": 0.000005, + "output_tokens": 0.000005, + "cache_creation_input_tokens": 0.00000125, + "input_cache_creation": 0.00000125, + "input_cache_creation_5m": 0.00000125, + "input_cache_creation_1h": 0.000002, + "cache_read_input_tokens": 1e-7, + "input_cache_read": 1e-7 + } + } + ] + }, + { + "id": "cmhymgpym000d04ih34rndvhr", + "modelName": "gpt-5.1", + "matchPattern": "(?i)^(openai\/)?(gpt-5.1)$", + "createdAt": "2025-11-14T08:57:23.481Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmhymgpym000d04ih34rndvhr_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "id": "cmhymgxiw000e04ihh9pw12ef", + "modelName": "gpt-5.1-2025-11-13", + "matchPattern": "(?i)^(openai\/)?(gpt-5.1-2025-11-13)$", + "createdAt": "2025-11-14T08:57:23.481Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmhymgxiw000e04ihh9pw12ef_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 
0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "id": "cmieupdva000004l541kwae70", + "modelName": "claude-opus-4-5-20251101", + "matchPattern": "(?i)^(anthropic\/)?(claude-opus-4-5(-20251101)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-opus-4-5(-20251101)?-v1(:0)?|claude-opus-4-5(@20251101)?)$", + "createdAt": "2025-11-24T20:53:27.571Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerConfig": null, + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "cmieupdva000004l541kwae70_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-6, + "input_tokens": 5e-6, + "output": 25e-6, + "output_tokens": 25e-6, + "cache_creation_input_tokens": 6.25e-6, + "input_cache_creation": 6.25e-6, + "input_cache_creation_5m": 6.25e-6, + "input_cache_creation_1h": 10e-6, + "cache_read_input_tokens": 0.5e-6, + "input_cache_read": 0.5e-6 + } + } + ] + }, + { + "id": "90ec5ec3-1a48-4ff0-919c-70cdb8f632ed", + "modelName": "claude-sonnet-4-6", + "matchPattern": "(?i)^(anthropic\\/)?(claude-sonnet-4-6|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4-6(-v1(:0)?)?|claude-sonnet-4-6)$", + "createdAt": "2026-02-18T00:00:00.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerConfig": null, + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "90ec5ec3-1a48-4ff0-919c-70cdb8f632ed_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 3e-6, + "input_tokens": 3e-6, + "output": 15e-6, + "output_tokens": 15e-6, + "cache_creation_input_tokens": 3.75e-6, + "input_cache_creation": 3.75e-6, + "input_cache_creation_5m": 3.75e-6, + "input_cache_creation_1h": 6e-6, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + }, + { + "id": "7830bfc2-c464-4ffe-b9a2-6e741f6c5486", + 
"name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "input", + "operator": "gt", + "value": 200000, + "caseSensitive": false + } + ], + "prices": { + "input": 6e-6, + "input_tokens": 6e-6, + "output": 22.5e-6, + "output_tokens": 22.5e-6, + "cache_creation_input_tokens": 7.5e-6, + "input_cache_creation": 7.5e-6, + "input_cache_creation_5m": 7.5e-6, + "input_cache_creation_1h": 12e-6, + "cache_read_input_tokens": 6e-7, + "input_cache_read": 6e-7 + } + } + ] + }, + { + "id": "13458bc0-1c20-44c2-8753-172f54b67647", + "modelName": "claude-opus-4-6", + "matchPattern": "(?i)^(anthropic\/)?(claude-opus-4-6|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-opus-4-6-v1(:0)?|claude-opus-4-6)$", + "createdAt": "2026-02-09T00:00:00.000Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "tokenizerConfig": null, + "tokenizerId": "claude", + "pricingTiers": [ + { + "id": "13458bc0-1c20-44c2-8753-172f54b67647_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-6, + "input_tokens": 5e-6, + "output": 25e-6, + "output_tokens": 25e-6, + "cache_creation_input_tokens": 6.25e-6, + "input_cache_creation": 6.25e-6, + "input_cache_creation_5m": 6.25e-6, + "input_cache_creation_1h": 10e-6, + "cache_read_input_tokens": 0.5e-6, + "input_cache_read": 0.5e-6 + } + } + ] + }, + { + "id": "cmig1hb7i000104l72qrzgc6h", + "modelName": "gemini-2.5-pro", + "matchPattern": "(?i)^(google\/)?(gemini-2.5-pro)$", + "createdAt": "2025-11-26T13:27:53.545Z", + "updatedAt": "2026-03-04T00:00:00.000Z", + "pricingTiers": [ + { + "id": "cmig1hb7i000104l72qrzgc6h_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-6, + "input_text": 1.25e-6, + "input_modality_1": 1.25e-6, + "prompt_token_count": 1.25e-6, + "promptTokenCount": 1.25e-6, + "input_cached_tokens": 0.125e-6, + "cached_content_token_count": 0.125e-6, + 
"output": 10e-6, + "output_modality_1": 10e-6, + "candidates_token_count": 10e-6, + "candidatesTokenCount": 10e-6, + "thoughtsTokenCount": 10e-6, + "thoughts_token_count": 10e-6, + "output_reasoning": 10e-6 + } + }, + { + "id": "bcf39e8f-9969-455f-be9a-541a00256092", + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000, + "caseSensitive": false + } + ], + "prices": { + "input": 2.5e-6, + "input_text": 2.5e-6, + "input_modality_1": 2.5e-6, + "prompt_token_count": 2.5e-6, + "promptTokenCount": 2.5e-6, + "input_cached_tokens": 0.25e-6, + "cached_content_token_count": 0.25e-6, + "output": 15e-6, + "output_modality_1": 15e-6, + "candidates_token_count": 15e-6, + "candidatesTokenCount": 15e-6, + "thoughtsTokenCount": 15e-6, + "thoughts_token_count": 15e-6, + "output_reasoning": 15e-6 + } + } + ] + }, + { + "id": "cmig1wmep000404l7fh6q5uog", + "modelName": "gemini-3-pro-preview", + "matchPattern": "(?i)^(google\/)?(gemini-3-pro-preview)$", + "createdAt": "2025-11-26T13:27:53.545Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "pricingTiers": [ + { + "id": "cmig1wmep000404l7fh6q5uog_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2e-6, + "input_modality_1": 2e-6, + "prompt_token_count": 2e-6, + "promptTokenCount": 2e-6, + "input_cached_tokens": 0.2e-6, + "cached_content_token_count": 0.2e-6, + "output": 12e-6, + "output_modality_1": 12e-6, + "candidates_token_count": 12e-6, + "candidatesTokenCount": 12e-6, + "thoughtsTokenCount": 12e-6, + "thoughts_token_count": 12e-6, + "output_reasoning": 12e-6 + } + }, + { + "id": "4da930c8-7146-4e27-b66c-b62f2c2ec357", + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000, + "caseSensitive": false + } + ], + "prices": { + 
"input": 4e-6, + "input_modality_1": 4e-6, + "prompt_token_count": 4e-6, + "promptTokenCount": 4e-6, + "input_cached_tokens": 0.4e-6, + "cached_content_token_count": 0.4e-6, + "output": 18e-6, + "output_modality_1": 18e-6, + "candidates_token_count": 18e-6, + "candidatesTokenCount": 18e-6, + "thoughtsTokenCount": 18e-6, + "thoughts_token_count": 18e-6, + "output_reasoning": 18e-6 + } + } + ] + }, + { + "id": "55106bba-a5dd-441b-bc0d-5652582b349d", + "modelName": "gemini-3.1-pro-preview", + "matchPattern": "(?i)^(google\/)?(gemini-3.1-pro-preview(-customtools)?)$", + "createdAt": "2026-02-19T00:00:00.000Z", + "updatedAt": "2026-02-19T00:00:00.000Z", + "pricingTiers": [ + { + "id": "55106bba-a5dd-441b-bc0d-5652582b349d_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2e-6, + "input_modality_1": 2e-6, + "prompt_token_count": 2e-6, + "promptTokenCount": 2e-6, + "input_cached_tokens": 0.2e-6, + "cached_content_token_count": 0.2e-6, + "output": 12e-6, + "output_modality_1": 12e-6, + "candidates_token_count": 12e-6, + "candidatesTokenCount": 12e-6, + "thoughtsTokenCount": 12e-6, + "thoughts_token_count": 12e-6, + "output_reasoning": 12e-6 + } + }, + { + "id": "ada11e9f-fe0d-465a-92af-ce334d0eedeb", + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000, + "caseSensitive": false + } + ], + "prices": { + "input": 4e-6, + "input_modality_1": 4e-6, + "prompt_token_count": 4e-6, + "promptTokenCount": 4e-6, + "input_cached_tokens": 0.4e-6, + "cached_content_token_count": 0.4e-6, + "output": 18e-6, + "output_modality_1": 18e-6, + "candidates_token_count": 18e-6, + "candidatesTokenCount": 18e-6, + "thoughtsTokenCount": 18e-6, + "thoughts_token_count": 18e-6, + "output_reasoning": 18e-6 + } + } + ] + }, + { + "id": "cmj2n4f2a000304kz49g4c43u", + "modelName": "gpt-5.2", + "matchPattern": 
"(?i)^(openai\/)?(gpt-5.2)$", + "createdAt": "2025-12-12T09:00:06.513Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmj2n4f2a000304kz49g4c43u_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.75e-6, + "input_cached_tokens": 0.175e-6, + "input_cache_read": 0.175e-6, + "output": 14e-6, + "output_reasoning_tokens": 14e-6, + "output_reasoning": 14e-6 + } + } + ] + }, + { + "id": "cmj2muxg6000104kzd2tc8953", + "modelName": "gpt-5.2-2025-12-11", + "matchPattern": "(?i)^(openai\/)?(gpt-5.2-2025-12-11)$", + "createdAt": "2025-12-12T09:00:06.513Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmj2muxg6000104kzd2tc8953_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.75e-6, + "input_cached_tokens": 0.175e-6, + "input_cache_read": 0.175e-6, + "output": 14e-6, + "output_reasoning_tokens": 14e-6, + "output_reasoning": 14e-6 + } + } + ] + }, + { + "id": "cmj2n6pkq000404kz2s0b6if7", + "modelName": "gpt-5.2-pro", + "matchPattern": "(?i)^(openai\/)?(gpt-5.2-pro)$", + "createdAt": "2025-12-12T09:00:06.513Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmj2n6pkq000404kz2s0b6if7_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 21e-6, + "output": 168e-6, + "output_reasoning_tokens": 168e-6, + "output_reasoning": 168e-6 + } + } + ] + }, + { + "id": "cmj2n70oe000504kz21b76mes", + "modelName": 
"gpt-5.2-pro-2025-12-11", + "matchPattern": "(?i)^(openai\/)?(gpt-5.2-pro-2025-12-11)$", + "createdAt": "2025-12-12T09:00:06.513Z", + "updatedAt": "2025-12-12T15:00:06.513Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "cmj2n70oe000504kz21b76mes_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 21e-6, + "output": 168e-6, + "output_reasoning_tokens": 168e-6, + "output_reasoning": 168e-6 + } + } + ] + }, + { + "id": "bee3c111-fe6f-4641-8775-73ea33b29fca", + "modelName": "gpt-5.4", + "matchPattern": "(?i)^(openai\/)?(gpt-5.4)$", + "createdAt": "2026-03-05T00:00:00.000Z", + "updatedAt": "2026-03-05T00:00:00.000Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "bee3c111-fe6f-4641-8775-73ea33b29fca_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-6, + "input_cached_tokens": 0.25e-6, + "input_cache_read": 0.25e-6, + "output": 15e-6, + "output_reasoning_tokens": 15e-6, + "output_reasoning": 15e-6 + } + } + ] + }, + { + "id": "68d32054-8748-4d25-9f64-d78d483601bd", + "modelName": "gpt-5.4-pro", + "matchPattern": "(?i)^(openai\/)?(gpt-5.4-pro)$", + "createdAt": "2026-03-05T00:00:00.000Z", + "updatedAt": "2026-03-05T00:00:00.000Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "68d32054-8748-4d25-9f64-d78d483601bd_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 30e-6, + "output": 180e-6, + "output_reasoning_tokens": 180e-6, + "output_reasoning": 180e-6 + } + } + ] + }, + { + "id": 
"22dfc7e1-1fe1-4286-b1af-928635e7ecb9", + "modelName": "gpt-5.4-2026-03-05", + "matchPattern": "(?i)^(openai\/)?(gpt-5.4-2026-03-05)$", + "createdAt": "2026-03-05T00:00:00.000Z", + "updatedAt": "2026-03-05T00:00:00.000Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "22dfc7e1-1fe1-4286-b1af-928635e7ecb9_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-6, + "input_cached_tokens": 0.25e-6, + "input_cache_read": 0.25e-6, + "output": 15e-6, + "output_reasoning_tokens": 15e-6, + "output_reasoning": 15e-6 + } + } + ] + }, + { + "id": "d8873413-05ab-4374-8223-e8c9005c4a0e", + "modelName": "gpt-5.4-pro-2026-03-05", + "matchPattern": "(?i)^(openai\/)?(gpt-5.4-pro-2026-03-05)$", + "createdAt": "2026-03-05T00:00:00.000Z", + "updatedAt": "2026-03-05T00:00:00.000Z", + "tokenizerConfig": { + "tokensPerName": 1, + "tokenizerModel": "gpt-4", + "tokensPerMessage": 3 + }, + "tokenizerId": "openai", + "pricingTiers": [ + { + "id": "d8873413-05ab-4374-8223-e8c9005c4a0e_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 30e-6, + "output": 180e-6, + "output_reasoning_tokens": 180e-6, + "output_reasoning": 180e-6 + } + } + ] + }, + { + "id": "cmjfoeykl000004l8ffzra8c7", + "modelName": "gemini-3-flash-preview", + "matchPattern": "(?i)^(google\/)?(gemini-3-flash-preview)$", + "createdAt": "2025-12-21T12:01:42.282Z", + "updatedAt": "2025-12-21T12:01:42.282Z", + "pricingTiers": [ + { + "id": "cmjfoeykl000004l8ffzra8c7_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.5e-6, + "input_modality_1": 0.5e-6, + "prompt_token_count": 0.5e-6, + "promptTokenCount": 0.5e-6, + "input_cached_tokens": 0.05e-6, + "cached_content_token_count": 0.05e-6, + "output": 3e-6, + 
"output_modality_1": 3e-6, + "candidates_token_count": 3e-6, + "candidatesTokenCount": 3e-6, + "thoughtsTokenCount": 3e-6, + "thoughts_token_count": 3e-6, + "output_reasoning": 3e-6 + } + } + ] + }, + { + "id": "0707bef8-10c8-46e2-a871-0436f05f0b92", + "modelName": "gemini-3.1-flash-lite-preview", + "matchPattern": "(?i)^(google\/)?(gemini-3.1-flash-lite-preview)$", + "createdAt": "2026-03-03T00:00:00.000Z", + "updatedAt": "2026-03-03T00:00:00.000Z", + "pricingTiers": [ + { + "id": "0707bef8-10c8-46e2-a871-0436f05f0b92_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.25e-6, + "input_modality_1": 0.25e-6, + "prompt_token_count": 0.25e-6, + "promptTokenCount": 0.25e-6, + "input_cached_tokens": 0.025e-6, + "cached_content_token_count": 0.025e-6, + "output": 1.5e-6, + "output_modality_1": 1.5e-6, + "candidates_token_count": 1.5e-6, + "candidatesTokenCount": 1.5e-6, + "thoughtsTokenCount": 1.5e-6, + "thoughts_token_count": 1.5e-6, + "output_reasoning": 1.5e-6, + "input_audio_tokens": 0.5e-6 + } + } + ] + }, + { + "id": "029e6695-ff24-47f0-b37b-7285fb2e5785", + "modelName": "gemini-live-2.5-flash-native-audio", + "matchPattern": "(?i)^(google\/)?(gemini-live-2.5-flash-native-audio)$", + "createdAt": "2026-03-16T00:00:00.000Z", + "updatedAt": "2026-03-16T00:00:00.000Z", + "tokenizerConfig": null, + "tokenizerId": null, + "pricingTiers": [ + { + "id": "029e6695-ff24-47f0-b37b-7285fb2e5785_tier_default", + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text": 0.5e-6, + "input_audio": 3e-6, + "input_image": 3e-6, + "output_text": 2e-6, + "output_audio": 12e-6 + } + } + ] + } +] diff --git a/internal-packages/llm-pricing/src/defaultPrices.ts b/internal-packages/llm-pricing/src/defaultPrices.ts new file mode 100644 index 00000000000..87013e55337 --- /dev/null +++ b/internal-packages/llm-pricing/src/defaultPrices.ts @@ -0,0 +1,3004 @@ +import type { 
DefaultModelDefinition } from "./types.js"; + +// Auto-generated from Langfuse default-model-prices.json — do not edit manually. +// Run `pnpm run sync-prices` to update from upstream. +// Source: https://github.com/langfuse/langfuse + +export const defaultModelPrices: DefaultModelDefinition[] = [ + { + "modelName": "gpt-4o", + "matchPattern": "(?i)^(openai/)?(gpt-4o)$", + "startDate": "2024-05-13T23:15:07.670Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + { + "modelName": "gpt-4o-2024-05-13", + "matchPattern": "(?i)^(openai/)?(gpt-4o-2024-05-13)$", + "startDate": "2024-05-13T23:15:07.670Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000005, + "output": 0.000015 + } + } + ] + }, + { + "modelName": "gpt-4-1106-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4-1106-preview)$", + "startDate": "2024-04-23T10:37:17.092Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "gpt-4-turbo-vision", + "matchPattern": "(?i)^(openai/)?(gpt-4(-\\d{4})?-vision-preview)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "gpt-4-32k", + "matchPattern": "(?i)^(openai/)?(gpt-4-32k)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "modelName": "gpt-4-32k-0613", + "matchPattern": 
"(?i)^(openai/)?(gpt-4-32k-0613)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-1106", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-1106)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000001, + "output": 0.000002 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-0613", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-0613)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000015, + "output": 0.000002 + } + } + ] + }, + { + "modelName": "gpt-4-0613", + "matchPattern": "(?i)^(openai/)?(gpt-4-0613)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-instruct", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-instruct)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000015, + "output": 0.000002 + } + } + ] + }, + { + "modelName": "text-ada-001", + "matchPattern": "(?i)^(text-ada-001)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.000004 + } + } + ] + }, + { + "modelName": "text-babbage-001", + "matchPattern": "(?i)^(text-babbage-001)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + 
"isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 5e-7 + } + } + ] + }, + { + "modelName": "text-curie-001", + "matchPattern": "(?i)^(text-curie-001)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "modelName": "text-davinci-001", + "matchPattern": "(?i)^(text-davinci-001)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "modelName": "text-davinci-002", + "matchPattern": "(?i)^(text-davinci-002)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "modelName": "text-davinci-003", + "matchPattern": "(?i)^(text-davinci-003)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 0.00002 + } + } + ] + }, + { + "modelName": "text-embedding-ada-002-v2", + "matchPattern": "(?i)^(text-embedding-ada-002-v2)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "modelName": "text-embedding-ada-002", + "matchPattern": "(?i)^(text-embedding-ada-002)$", + "startDate": "2024-01-24T18:18:50.861Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-16k-0613", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-16k-0613)$", + "startDate": "2024-02-03T17:29:57.350Z", + "pricingTiers": [ + { + 
"name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "output": 0.000004 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-0301", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-0301)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "output": 0.000002 + } + } + ] + }, + { + "modelName": "gpt-4-32k-0314", + "matchPattern": "(?i)^(openai/)?(gpt-4-32k-0314)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00006, + "output": 0.00012 + } + } + ] + }, + { + "modelName": "gpt-4-0314", + "matchPattern": "(?i)^(openai/)?(gpt-4-0314)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "modelName": "gpt-4", + "matchPattern": "(?i)^(openai/)?(gpt-4)$", + "startDate": "2024-01-24T10:19:21.693Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00006 + } + } + ] + }, + { + "modelName": "claude-instant-1.2", + "matchPattern": "(?i)^(anthropic/)?(claude-instant-1.2)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000163, + "output": 0.00000551 + } + } + ] + }, + { + "modelName": "claude-2.0", + "matchPattern": "(?i)^(anthropic/)?(claude-2.0)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + 
} + ] + }, + { + "modelName": "claude-2.1", + "matchPattern": "(?i)^(anthropic/)?(claude-2.1)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "modelName": "claude-1.3", + "matchPattern": "(?i)^(anthropic/)?(claude-1.3)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "modelName": "claude-1.2", + "matchPattern": "(?i)^(anthropic/)?(claude-1.2)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "modelName": "claude-1.1", + "matchPattern": "(?i)^(anthropic/)?(claude-1.1)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000008, + "output": 0.000024 + } + } + ] + }, + { + "modelName": "claude-instant-1", + "matchPattern": "(?i)^(anthropic/)?(claude-instant-1)$", + "startDate": "2024-01-30T15:44:13.447Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000163, + "output": 0.00000551 + } + } + ] + }, + { + "modelName": "babbage-002", + "matchPattern": "(?i)^(babbage-002)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "output": 0.0000016 + } + } + ] + }, + { + "modelName": "davinci-002", + "matchPattern": "(?i)^(davinci-002)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + 
"name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000006, + "output": 0.000012 + } + } + ] + }, + { + "modelName": "text-embedding-3-small", + "matchPattern": "(?i)^(text-embedding-3-small)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 2e-8 + } + } + ] + }, + { + "modelName": "text-embedding-3-large", + "matchPattern": "(?i)^(text-embedding-3-large)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1.3e-7 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-0125", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-0125)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo)$", + "startDate": "2024-02-13T12:00:37.424Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "modelName": "gpt-4-0125-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4-0125-preview)$", + "startDate": "2024-01-26T17:35:21.129Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "ft:gpt-3.5-turbo-1106", + "matchPattern": "(?i)^(ft:)(gpt-3.5-turbo-1106:)(.+)(:)(.*)(:)(.+)$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "output": 
0.000006 + } + } + ] + }, + { + "modelName": "ft:gpt-3.5-turbo-0613", + "matchPattern": "(?i)^(ft:)(gpt-3.5-turbo-0613:)(.+)(:)(.*)(:)(.+)$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000012, + "output": 0.000016 + } + } + ] + }, + { + "modelName": "ft:davinci-002", + "matchPattern": "(?i)^(ft:)(davinci-002:)(.+)(:)(.*)(:)(.+)$$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000012, + "output": 0.000012 + } + } + ] + }, + { + "modelName": "ft:babbage-002", + "matchPattern": "(?i)^(ft:)(babbage-002:)(.+)(:)(.*)(:)(.+)$$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000016, + "output": 0.0000016 + } + } + ] + }, + { + "modelName": "chat-bison", + "matchPattern": "(?i)^(chat-bison)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "codechat-bison-32k", + "matchPattern": "(?i)^(codechat-bison-32k)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "codechat-bison", + "matchPattern": "(?i)^(codechat-bison)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "text-bison-32k", + "matchPattern": 
"(?i)^(text-bison-32k)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "chat-bison-32k", + "matchPattern": "(?i)^(chat-bison-32k)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "text-unicorn", + "matchPattern": "(?i)^(text-unicorn)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "output": 0.0000075 + } + } + ] + }, + { + "modelName": "text-bison", + "matchPattern": "(?i)^(text-bison)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "textembedding-gecko", + "matchPattern": "(?i)^(textembedding-gecko)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "modelName": "textembedding-gecko-multilingual", + "matchPattern": "(?i)^(textembedding-gecko-multilingual)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "total": 1e-7 + } + } + ] + }, + { + "modelName": "code-gecko", + "matchPattern": "(?i)^(code-gecko)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + 
"isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "code-bison", + "matchPattern": "(?i)^(code-bison)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "code-bison-32k", + "matchPattern": "(?i)^(code-bison-32k)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-01-31T13:25:02.141Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "gpt-3.5-turbo-16k", + "matchPattern": "(?i)^(openai/)?(gpt-)(35|3.5)(-turbo-16k)$", + "startDate": "2024-02-13T12:00:37.424Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "output": 0.0000015 + } + } + ] + }, + { + "modelName": "gpt-4-turbo-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4-turbo-preview)$", + "startDate": "2024-02-15T21:21:50.947Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "claude-3-opus-20240229", + "matchPattern": "(?i)^(anthropic/)?(claude-3-opus-20240229|anthropic\\.claude-3-opus-20240229-v1:0|claude-3-opus@20240229)$", + "startDate": "2024-03-07T17:55:38.139Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.000075 + } + } + ] + }, + { + "modelName": "claude-3-sonnet-20240229", + "matchPattern": "(?i)^(anthropic/)?(claude-3-sonnet-20240229|anthropic\\.claude-3-sonnet-20240229-v1:0|claude-3-sonnet@20240229)$", + "startDate": "2024-03-07T17:55:38.139Z", + 
"pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-3-haiku-20240307", + "matchPattern": "(?i)^(anthropic/)?(claude-3-haiku-20240307|anthropic\\.claude-3-haiku-20240307-v1:0|claude-3-haiku@20240307)$", + "startDate": "2024-03-14T09:41:18.736Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 0.00000125 + } + } + ] + }, + { + "modelName": "gemini-1.0-pro-latest", + "matchPattern": "(?i)^(google/)?(gemini-1.0-pro-latest)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-04-11T10:27:46.517Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "output": 5e-7 + } + } + ] + }, + { + "modelName": "gemini-1.0-pro", + "matchPattern": "(?i)^(google/)?(gemini-1.0-pro)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-04-11T10:27:46.517Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "modelName": "gemini-1.0-pro-001", + "matchPattern": "(?i)^(google/)?(gemini-1.0-pro-001)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-04-11T10:27:46.517Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "modelName": "gemini-pro", + "matchPattern": "(?i)^(google/)?(gemini-pro)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-04-11T10:27:46.517Z", + 
"pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.25e-7, + "output": 3.75e-7 + } + } + ] + }, + { + "modelName": "gemini-1.5-pro-latest", + "matchPattern": "(?i)^(google/)?(gemini-1.5-pro-latest)(@[a-zA-Z0-9]+)?$", + "startDate": "2024-04-11T10:27:46.517Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "output": 0.0000075 + } + } + ] + }, + { + "modelName": "gpt-4-turbo-2024-04-09", + "matchPattern": "(?i)^(openai/)?(gpt-4-turbo-2024-04-09)$", + "startDate": "2024-04-23T10:37:17.092Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "gpt-4-turbo", + "matchPattern": "(?i)^(openai/)?(gpt-4-turbo)$", + "startDate": "2024-04-11T21:13:44.989Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "gpt-4-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4-preview)$", + "startDate": "2024-04-23T10:37:17.092Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00001, + "output": 0.00003 + } + } + ] + }, + { + "modelName": "claude-3-5-sonnet-20240620", + "matchPattern": "(?i)^(anthropic/)?(claude-3-5-sonnet-20240620|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-sonnet-20240620-v1:0|claude-3-5-sonnet@20240620)$", + "startDate": "2024-06-25T11:47:24.475Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 
0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "gpt-4o-mini", + "matchPattern": "(?i)^(openai/)?(gpt-4o-mini)$", + "startDate": "2024-07-18T17:56:09.591Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.5e-7, + "output": 6e-7, + "input_cached_tokens": 7.5e-8, + "input_cache_read": 7.5e-8 + } + } + ] + }, + { + "modelName": "gpt-4o-mini-2024-07-18", + "matchPattern": "(?i)^(openai/)?(gpt-4o-mini-2024-07-18)$", + "startDate": "2024-07-18T17:56:09.591Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1.5e-7, + "input_cached_tokens": 7.5e-8, + "input_cache_read": 7.5e-8, + "output": 6e-7 + } + } + ] + }, + { + "modelName": "gpt-4o-2024-08-06", + "matchPattern": "(?i)^(openai/)?(gpt-4o-2024-08-06)$", + "startDate": "2024-08-07T11:54:31.298Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + { + "modelName": "o1-preview", + "matchPattern": "(?i)^(openai/)?(o1-preview)$", + "startDate": "2024-09-13T10:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "modelName": "o1-preview-2024-09-12", + "matchPattern": "(?i)^(openai/)?(o1-preview-2024-09-12)$", + "startDate": "2024-09-13T10:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + 
"prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "modelName": "o1-mini", + "matchPattern": "(?i)^(openai/)?(o1-mini)$", + "startDate": "2024-09-13T10:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "o1-mini-2024-09-12", + "matchPattern": "(?i)^(openai/)?(o1-mini-2024-09-12)$", + "startDate": "2024-09-13T10:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "claude-3.5-sonnet-20241022", + "matchPattern": "(?i)^(anthropic/)?(claude-3-5-sonnet-20241022|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-sonnet-20241022-v2:0|claude-3-5-sonnet-V2@20241022)$", + "startDate": "2024-10-22T18:48:01.676Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-3.5-sonnet-latest", + "matchPattern": "(?i)^(anthropic/)?(claude-3-5-sonnet-latest)$", + "startDate": "2024-10-22T18:48:01.676Z", + "pricingTiers": [ + { + 
"name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-3-5-haiku-20241022", + "matchPattern": "(?i)^(anthropic/)?(claude-3-5-haiku-20241022|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3-5-haiku-20241022-v1:0|claude-3-5-haiku-V1@20241022)$", + "startDate": "2024-11-05T10:30:50.566Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 8e-7, + "input_tokens": 8e-7, + "output": 0.000004, + "output_tokens": 0.000004, + "cache_creation_input_tokens": 0.000001, + "input_cache_creation": 0.000001, + "input_cache_creation_5m": 0.000001, + "input_cache_creation_1h": 0.0000016, + "cache_read_input_tokens": 8e-8, + "input_cache_read": 8e-8 + } + } + ] + }, + { + "modelName": "claude-3.5-haiku-latest", + "matchPattern": "(?i)^(anthropic/)?(claude-3-5-haiku-latest)$", + "startDate": "2024-11-05T10:30:50.566Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 8e-7, + "input_tokens": 8e-7, + "output": 0.000004, + "output_tokens": 0.000004, + "cache_creation_input_tokens": 0.000001, + "input_cache_creation": 0.000001, + "input_cache_creation_5m": 0.000001, + "input_cache_creation_1h": 0.0000016, + "cache_read_input_tokens": 8e-8, + "input_cache_read": 8e-8 + } + } + ] + }, + { + "modelName": "chatgpt-4o-latest", + "matchPattern": "(?i)^(chatgpt-4o-latest)$", + "startDate": "2024-11-25T12:47:17.504Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 
0.000005, + "output": 0.000015 + } + } + ] + }, + { + "modelName": "gpt-4o-2024-11-20", + "matchPattern": "(?i)^(openai/)?(gpt-4o-2024-11-20)$", + "startDate": "2024-12-03T10:06:12.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 0.00000125, + "input_cache_read": 0.00000125, + "output": 0.00001 + } + } + ] + }, + { + "modelName": "gpt-4o-audio-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4o-audio-preview)$", + "startDate": "2024-12-03T10:19:56.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.0000025, + "output_text_tokens": 0.00001, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "modelName": "gpt-4o-audio-preview-2024-10-01", + "matchPattern": "(?i)^(openai/)?(gpt-4o-audio-preview-2024-10-01)$", + "startDate": "2024-12-03T10:19:56.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.0000025, + "output_text_tokens": 0.00001, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "modelName": "gpt-4o-realtime-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4o-realtime-preview)$", + "startDate": "2024-12-03T10:19:56.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.000005, + "input_cached_text_tokens": 0.0000025, + "output_text_tokens": 0.00002, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "input_cached_audio_tokens": 0.00002, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "modelName": "gpt-4o-realtime-preview-2024-10-01", + 
"matchPattern": "(?i)^(openai/)?(gpt-4o-realtime-preview-2024-10-01)$", + "startDate": "2024-12-03T10:19:56.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text_tokens": 0.000005, + "input_cached_text_tokens": 0.0000025, + "output_text_tokens": 0.00002, + "input_audio_tokens": 0.0001, + "input_audio": 0.0001, + "input_cached_audio_tokens": 0.00002, + "output_audio_tokens": 0.0002, + "output_audio": 0.0002 + } + } + ] + }, + { + "modelName": "o1", + "matchPattern": "(?i)^(openai/)?(o1)$", + "startDate": "2025-01-17T00:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "modelName": "o1-2024-12-17", + "matchPattern": "(?i)^(openai/)?(o1-2024-12-17)$", + "startDate": "2025-01-17T00:01:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_cached_tokens": 0.0000075, + "input_cache_read": 0.0000075, + "output": 0.00006, + "output_reasoning_tokens": 0.00006, + "output_reasoning": 0.00006 + } + } + ] + }, + { + "modelName": "o3-mini", + "matchPattern": "(?i)^(openai/)?(o3-mini)$", + "startDate": "2025-01-31T20:41:35.373Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "o3-mini-2025-01-31", + "matchPattern": "(?i)^(openai/)?(o3-mini-2025-01-31)$", + "startDate": "2025-01-31T20:41:35.373Z", + "pricingTiers": [ + { + "name": 
"Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 5.5e-7, + "input_cache_read": 5.5e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "gemini-2.0-flash-001", + "matchPattern": "(?i)^(google/)?(gemini-2.0-flash-001)(@[a-zA-Z0-9]+)?$", + "startDate": "2025-02-06T11:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "output": 4e-7 + } + } + ] + }, + { + "modelName": "gemini-2.0-flash-lite-preview-02-05", + "matchPattern": "(?i)^(google/)?(gemini-2.0-flash-lite-preview-02-05)(@[a-zA-Z0-9]+)?$", + "startDate": "2025-02-06T11:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 7.5e-8, + "output": 3e-7 + } + } + ] + }, + { + "modelName": "claude-3.7-sonnet-20250219", + "matchPattern": "(?i)^(anthropic/)?(claude-3.7-sonnet-20250219|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-3.7-sonnet-20250219-v1:0|claude-3-7-sonnet-V1@20250219)$", + "startDate": "2025-02-25T09:35:39.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-3.7-sonnet-latest", + "matchPattern": "(?i)^(anthropic/)?(claude-3-7-sonnet-latest)$", + "startDate": "2025-02-25T09:35:39.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + 
"input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "gpt-4.5-preview", + "matchPattern": "(?i)^(openai/)?(gpt-4.5-preview)$", + "startDate": "2025-02-27T21:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000075, + "input_cached_tokens": 0.0000375, + "input_cached_text_tokens": 0.0000375, + "input_cache_read": 0.0000375, + "output": 0.00015 + } + } + ] + }, + { + "modelName": "gpt-4.5-preview-2025-02-27", + "matchPattern": "(?i)^(openai/)?(gpt-4.5-preview-2025-02-27)$", + "startDate": "2025-02-27T21:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000075, + "input_cached_tokens": 0.0000375, + "input_cached_text_tokens": 0.0000375, + "input_cache_read": 0.0000375, + "output": 0.00015 + } + } + ] + }, + { + "modelName": "gpt-4.1", + "matchPattern": "(?i)^(openai/)?(gpt-4.1)$", + "startDate": "2025-04-15T10:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cached_text_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008 + } + } + ] + }, + { + "modelName": "gpt-4.1-2025-04-14", + "matchPattern": "(?i)^(openai/)?(gpt-4.1-2025-04-14)$", + "startDate": "2025-04-15T10:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cached_text_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008 + } + } + ] + }, + { + 
"modelName": "gpt-4.1-mini-2025-04-14", + "matchPattern": "(?i)^(openai/)?(gpt-4.1-mini-2025-04-14)$", + "startDate": "2025-04-15T10:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "input_cached_tokens": 1e-7, + "input_cached_text_tokens": 1e-7, + "input_cache_read": 1e-7, + "output": 0.0000016 + } + } + ] + }, + { + "modelName": "gpt-4.1-nano-2025-04-14", + "matchPattern": "(?i)^(openai/)?(gpt-4.1-nano-2025-04-14)$", + "startDate": "2025-04-15T10:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_cached_tokens": 2.5e-8, + "input_cached_text_tokens": 2.5e-8, + "input_cache_read": 2.5e-8, + "output": 4e-7 + } + } + ] + }, + { + "modelName": "o3", + "matchPattern": "(?i)^(openai/)?(o3)$", + "startDate": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008, + "output_reasoning_tokens": 0.000008, + "output_reasoning": 0.000008 + } + } + ] + }, + { + "modelName": "o3-2025-04-16", + "matchPattern": "(?i)^(openai/)?(o3-2025-04-16)$", + "startDate": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_cached_tokens": 5e-7, + "input_cache_read": 5e-7, + "output": 0.000008, + "output_reasoning_tokens": 0.000008, + "output_reasoning": 0.000008 + } + } + ] + }, + { + "modelName": "o4-mini", + "matchPattern": "(?i)^(o4-mini)$", + "startDate": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 2.75e-7, + "input_cache_read": 
2.75e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "o4-mini-2025-04-16", + "matchPattern": "(?i)^(o4-mini-2025-04-16)$", + "startDate": "2025-04-16T23:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000011, + "input_cached_tokens": 2.75e-7, + "input_cache_read": 2.75e-7, + "output": 0.0000044, + "output_reasoning_tokens": 0.0000044, + "output_reasoning": 0.0000044 + } + } + ] + }, + { + "modelName": "gemini-2.0-flash", + "matchPattern": "(?i)^(google/)?(gemini-2.0-flash)(@[a-zA-Z0-9]+)?$", + "startDate": "2025-04-22T10:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "output": 4e-7 + } + } + ] + }, + { + "modelName": "gemini-2.0-flash-lite-preview", + "matchPattern": "(?i)^(google/)?(gemini-2.0-flash-lite-preview)(@[a-zA-Z0-9]+)?$", + "startDate": "2025-04-22T10:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 7.5e-8, + "output": 3e-7 + } + } + ] + }, + { + "modelName": "gpt-4.1-nano", + "matchPattern": "(?i)^(openai/)?(gpt-4.1-nano)$", + "startDate": "2025-04-22T10:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_cached_tokens": 2.5e-8, + "input_cached_text_tokens": 2.5e-8, + "input_cache_read": 2.5e-8, + "output": 4e-7 + } + } + ] + }, + { + "modelName": "gpt-4.1-mini", + "matchPattern": "(?i)^(openai/)?(gpt-4.1-mini)$", + "startDate": "2025-04-22T10:11:35.241Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 4e-7, + "input_cached_tokens": 1e-7, + "input_cached_text_tokens": 1e-7, + "input_cache_read": 
1e-7, + "output": 0.0000016 + } + } + ] + }, + { + "modelName": "claude-sonnet-4-5-20250929", + "matchPattern": "(?i)^(anthropic/)?(claude-sonnet-4-5(-20250929)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4-5(-20250929)?-v1(:0)?|claude-sonnet-4-5-V1(@20250929)?|claude-sonnet-4-5(@20250929)?)$", + "startDate": "2025-09-29T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + }, + { + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "input", + "operator": "gt", + "value": 200000 + } + ], + "prices": { + "input": 0.000006, + "input_tokens": 0.000006, + "output": 0.0000225, + "output_tokens": 0.0000225, + "cache_creation_input_tokens": 0.0000075, + "input_cache_creation": 0.0000075, + "input_cache_creation_5m": 0.0000075, + "input_cache_creation_1h": 0.000012, + "cache_read_input_tokens": 6e-7, + "input_cache_read": 6e-7 + } + } + ] + }, + { + "modelName": "claude-sonnet-4-20250514", + "matchPattern": "(?i)^(anthropic/)?(claude-sonnet-4(-20250514)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4(-20250514)?-v1(:0)?|claude-sonnet-4-V1(@20250514)?|claude-sonnet-4(@20250514)?)$", + "startDate": "2025-05-22T17:09:02.131Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + 
"input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-sonnet-4-latest", + "matchPattern": "(?i)^(anthropic/)?(claude-sonnet-4-latest)$", + "startDate": "2025-05-22T17:09:02.131Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + } + ] + }, + { + "modelName": "claude-opus-4-20250514", + "matchPattern": "(?i)^(anthropic/)?(claude-opus-4(-20250514)?|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-opus-4(-20250514)?-v1(:0)?|claude-opus-4(@20250514)?)$", + "startDate": "2025-05-22T17:09:02.131Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_tokens": 0.000015, + "output": 0.000075, + "output_tokens": 0.000075, + "cache_creation_input_tokens": 0.00001875, + "input_cache_creation": 0.00001875, + "input_cache_creation_5m": 0.00001875, + "input_cache_creation_1h": 0.00003, + "cache_read_input_tokens": 0.0000015, + "input_cache_read": 0.0000015 + } + } + ] + }, + { + "modelName": "o3-pro", + "matchPattern": "(?i)^(openai/)?(o3-pro)$", + "startDate": "2025-06-10T22:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00002, + "output": 0.00008, + "output_reasoning_tokens": 0.00008, + "output_reasoning": 0.00008 + } + } + ] + }, + { + "modelName": "o3-pro-2025-06-10", + "matchPattern": "(?i)^(openai/)?(o3-pro-2025-06-10)$", + "startDate": "2025-06-10T22:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + 
"isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00002, + "output": 0.00008, + "output_reasoning_tokens": 0.00008, + "output_reasoning": 0.00008 + } + } + ] + }, + { + "modelName": "o1-pro", + "matchPattern": "(?i)^(openai/)?(o1-pro)$", + "startDate": "2025-06-10T22:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00015, + "output": 0.0006, + "output_reasoning_tokens": 0.0006, + "output_reasoning": 0.0006 + } + } + ] + }, + { + "modelName": "o1-pro-2025-03-19", + "matchPattern": "(?i)^(openai/)?(o1-pro-2025-03-19)$", + "startDate": "2025-06-10T22:26:54.132Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00015, + "output": 0.0006, + "output_reasoning_tokens": 0.0006, + "output_reasoning": 0.0006 + } + } + ] + }, + { + "modelName": "gemini-2.5-flash", + "matchPattern": "(?i)^(google/)?(gemini-2.5-flash)$", + "startDate": "2025-07-03T13:44:06.964Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 3e-7, + "input_text": 3e-7, + "input_modality_1": 3e-7, + "prompt_token_count": 3e-7, + "promptTokenCount": 3e-7, + "input_cached_tokens": 3e-8, + "cached_content_token_count": 3e-8, + "output": 0.0000025, + "output_modality_1": 0.0000025, + "candidates_token_count": 0.0000025, + "candidatesTokenCount": 0.0000025, + "thoughtsTokenCount": 0.0000025, + "thoughts_token_count": 0.0000025, + "output_reasoning": 0.0000025, + "input_audio_tokens": 0.000001 + } + } + ] + }, + { + "modelName": "gemini-2.5-flash-lite", + "matchPattern": "(?i)^(google/)?(gemini-2.5-flash-lite)$", + "startDate": "2025-07-03T13:44:06.964Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 1e-7, + "input_text": 1e-7, + 
"input_modality_1": 1e-7, + "prompt_token_count": 1e-7, + "promptTokenCount": 1e-7, + "input_cached_tokens": 2.5e-8, + "cached_content_token_count": 2.5e-8, + "output": 4e-7, + "output_modality_1": 4e-7, + "candidates_token_count": 4e-7, + "candidatesTokenCount": 4e-7, + "thoughtsTokenCount": 4e-7, + "thoughts_token_count": 4e-7, + "output_reasoning": 4e-7, + "input_audio_tokens": 5e-7 + } + } + ] + }, + { + "modelName": "claude-opus-4-1-20250805", + "matchPattern": "(?i)^(anthropic/)?(claude-opus-4-1(-20250805)?|(eu\\.|us\\.|apac\\.)?anthropic\\.claude-opus-4-1(-20250805)?-v1(:0)?|claude-opus-4-1(@20250805)?)$", + "startDate": "2025-08-05T15:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "input_tokens": 0.000015, + "output": 0.000075, + "output_tokens": 0.000075, + "cache_creation_input_tokens": 0.00001875, + "input_cache_creation": 0.00001875, + "input_cache_creation_5m": 0.00001875, + "input_cache_creation_1h": 0.00003, + "cache_read_input_tokens": 0.0000015, + "input_cache_read": 0.0000015 + } + } + ] + }, + { + "modelName": "gpt-5", + "matchPattern": "(?i)^(openai/)?(gpt-5)$", + "startDate": "2025-08-07T16:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "modelName": "gpt-5-2025-08-07", + "matchPattern": "(?i)^(openai/)?(gpt-5-2025-08-07)$", + "startDate": "2025-08-11T08:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + 
} + ] + }, + { + "modelName": "gpt-5-mini", + "matchPattern": "(?i)^(openai/)?(gpt-5-mini)$", + "startDate": "2025-08-07T16:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "input_cached_tokens": 2.5e-8, + "output": 0.000002, + "input_cache_read": 2.5e-8, + "output_reasoning_tokens": 0.000002, + "output_reasoning": 0.000002 + } + } + ] + }, + { + "modelName": "gpt-5-mini-2025-08-07", + "matchPattern": "(?i)^(openai/)?(gpt-5-mini-2025-08-07)$", + "startDate": "2025-08-11T08:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "input_cached_tokens": 2.5e-8, + "output": 0.000002, + "input_cache_read": 2.5e-8, + "output_reasoning_tokens": 0.000002, + "output_reasoning": 0.000002 + } + } + ] + }, + { + "modelName": "gpt-5-nano", + "matchPattern": "(?i)^(openai/)?(gpt-5-nano)$", + "startDate": "2025-08-07T16:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-8, + "input_cached_tokens": 5e-9, + "output": 4e-7, + "input_cache_read": 5e-9, + "output_reasoning_tokens": 4e-7, + "output_reasoning": 4e-7 + } + } + ] + }, + { + "modelName": "gpt-5-nano-2025-08-07", + "matchPattern": "(?i)^(openai/)?(gpt-5-nano-2025-08-07)$", + "startDate": "2025-08-11T08:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-8, + "input_cached_tokens": 5e-9, + "output": 4e-7, + "input_cache_read": 5e-9, + "output_reasoning_tokens": 4e-7, + "output_reasoning": 4e-7 + } + } + ] + }, + { + "modelName": "gpt-5-chat-latest", + "matchPattern": "(?i)^(openai/)?(gpt-5-chat-latest)$", + "startDate": "2025-08-07T16:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": 
[], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "modelName": "gpt-5-pro", + "matchPattern": "(?i)^(openai/)?(gpt-5-pro)$", + "startDate": "2025-10-07T08:03:54.727Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.00012, + "output_reasoning_tokens": 0.00012, + "output_reasoning": 0.00012 + } + } + ] + }, + { + "modelName": "gpt-5-pro-2025-10-06", + "matchPattern": "(?i)^(openai/)?(gpt-5-pro-2025-10-06)$", + "startDate": "2025-10-07T08:03:54.727Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000015, + "output": 0.00012, + "output_reasoning_tokens": 0.00012, + "output_reasoning": 0.00012 + } + } + ] + }, + { + "modelName": "claude-haiku-4-5-20251001", + "matchPattern": "(?i)^(anthropic/)?(claude-haiku-4-5-20251001|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-haiku-4-5-20251001-v1:0|claude-4-5-haiku@20251001)$", + "startDate": "2025-10-16T08:20:44.558Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000001, + "input_tokens": 0.000001, + "output": 0.000005, + "output_tokens": 0.000005, + "cache_creation_input_tokens": 0.00000125, + "input_cache_creation": 0.00000125, + "input_cache_creation_5m": 0.00000125, + "input_cache_creation_1h": 0.000002, + "cache_read_input_tokens": 1e-7, + "input_cache_read": 1e-7 + } + } + ] + }, + { + "modelName": "gpt-5.1", + "matchPattern": "(?i)^(openai/)?(gpt-5.1)$", + "startDate": "2025-11-14T08:57:23.481Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 
0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "modelName": "gpt-5.1-2025-11-13", + "matchPattern": "(?i)^(openai/)?(gpt-5.1-2025-11-13)$", + "startDate": "2025-11-14T08:57:23.481Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_cached_tokens": 1.25e-7, + "output": 0.00001, + "input_cache_read": 1.25e-7, + "output_reasoning_tokens": 0.00001, + "output_reasoning": 0.00001 + } + } + ] + }, + { + "modelName": "claude-opus-4-5-20251101", + "matchPattern": "(?i)^(anthropic/)?(claude-opus-4-5(-20251101)?|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-opus-4-5(-20251101)?-v1(:0)?|claude-opus-4-5(@20251101)?)$", + "startDate": "2025-11-24T20:53:27.571Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000005, + "input_tokens": 0.000005, + "output": 0.000025, + "output_tokens": 0.000025, + "cache_creation_input_tokens": 0.00000625, + "input_cache_creation": 0.00000625, + "input_cache_creation_5m": 0.00000625, + "input_cache_creation_1h": 0.00001, + "cache_read_input_tokens": 5e-7, + "input_cache_read": 5e-7 + } + } + ] + }, + { + "modelName": "claude-sonnet-4-6", + "matchPattern": "(?i)^(anthropic\\/)?(claude-sonnet-4-6|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-sonnet-4-6(-v1(:0)?)?|claude-sonnet-4-6)$", + "startDate": "2026-02-18T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000003, + "input_tokens": 0.000003, + "output": 0.000015, + "output_tokens": 0.000015, + "cache_creation_input_tokens": 0.00000375, + "input_cache_creation": 0.00000375, + "input_cache_creation_5m": 0.00000375, + "input_cache_creation_1h": 0.000006, + "cache_read_input_tokens": 3e-7, + "input_cache_read": 3e-7 + } + }, + { + 
"name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "input", + "operator": "gt", + "value": 200000 + } + ], + "prices": { + "input": 0.000006, + "input_tokens": 0.000006, + "output": 0.0000225, + "output_tokens": 0.0000225, + "cache_creation_input_tokens": 0.0000075, + "input_cache_creation": 0.0000075, + "input_cache_creation_5m": 0.0000075, + "input_cache_creation_1h": 0.000012, + "cache_read_input_tokens": 6e-7, + "input_cache_read": 6e-7 + } + } + ] + }, + { + "modelName": "claude-opus-4-6", + "matchPattern": "(?i)^(anthropic/)?(claude-opus-4-6|(eu\\.|us\\.|apac\\.|global\\.)?anthropic\\.claude-opus-4-6-v1(:0)?|claude-opus-4-6)$", + "startDate": "2026-02-09T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000005, + "input_tokens": 0.000005, + "output": 0.000025, + "output_tokens": 0.000025, + "cache_creation_input_tokens": 0.00000625, + "input_cache_creation": 0.00000625, + "input_cache_creation_5m": 0.00000625, + "input_cache_creation_1h": 0.00001, + "cache_read_input_tokens": 5e-7, + "input_cache_read": 5e-7 + } + } + ] + }, + { + "modelName": "gemini-2.5-pro", + "matchPattern": "(?i)^(google/)?(gemini-2.5-pro)$", + "startDate": "2025-11-26T13:27:53.545Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000125, + "input_text": 0.00000125, + "input_modality_1": 0.00000125, + "prompt_token_count": 0.00000125, + "promptTokenCount": 0.00000125, + "input_cached_tokens": 1.25e-7, + "cached_content_token_count": 1.25e-7, + "output": 0.00001, + "output_modality_1": 0.00001, + "candidates_token_count": 0.00001, + "candidatesTokenCount": 0.00001, + "thoughtsTokenCount": 0.00001, + "thoughts_token_count": 0.00001, + "output_reasoning": 0.00001 + } + }, + { + "name": "Large Context", + "isDefault": false, + "priority": 1, + 
"conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000 + } + ], + "prices": { + "input": 0.0000025, + "input_text": 0.0000025, + "input_modality_1": 0.0000025, + "prompt_token_count": 0.0000025, + "promptTokenCount": 0.0000025, + "input_cached_tokens": 2.5e-7, + "cached_content_token_count": 2.5e-7, + "output": 0.000015, + "output_modality_1": 0.000015, + "candidates_token_count": 0.000015, + "candidatesTokenCount": 0.000015, + "thoughtsTokenCount": 0.000015, + "thoughts_token_count": 0.000015, + "output_reasoning": 0.000015 + } + } + ] + }, + { + "modelName": "gemini-3-pro-preview", + "matchPattern": "(?i)^(google/)?(gemini-3-pro-preview)$", + "startDate": "2025-11-26T13:27:53.545Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_modality_1": 0.000002, + "prompt_token_count": 0.000002, + "promptTokenCount": 0.000002, + "input_cached_tokens": 2e-7, + "cached_content_token_count": 2e-7, + "output": 0.000012, + "output_modality_1": 0.000012, + "candidates_token_count": 0.000012, + "candidatesTokenCount": 0.000012, + "thoughtsTokenCount": 0.000012, + "thoughts_token_count": 0.000012, + "output_reasoning": 0.000012 + } + }, + { + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000 + } + ], + "prices": { + "input": 0.000004, + "input_modality_1": 0.000004, + "prompt_token_count": 0.000004, + "promptTokenCount": 0.000004, + "input_cached_tokens": 4e-7, + "cached_content_token_count": 4e-7, + "output": 0.000018, + "output_modality_1": 0.000018, + "candidates_token_count": 0.000018, + "candidatesTokenCount": 0.000018, + "thoughtsTokenCount": 0.000018, + "thoughts_token_count": 0.000018, + "output_reasoning": 0.000018 + } + } + ] + }, + { + "modelName": "gemini-3.1-pro-preview", + "matchPattern": 
"(?i)^(google/)?(gemini-3.1-pro-preview(-customtools)?)$", + "startDate": "2026-02-19T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000002, + "input_modality_1": 0.000002, + "prompt_token_count": 0.000002, + "promptTokenCount": 0.000002, + "input_cached_tokens": 2e-7, + "cached_content_token_count": 2e-7, + "output": 0.000012, + "output_modality_1": 0.000012, + "candidates_token_count": 0.000012, + "candidatesTokenCount": 0.000012, + "thoughtsTokenCount": 0.000012, + "thoughts_token_count": 0.000012, + "output_reasoning": 0.000012 + } + }, + { + "name": "Large Context", + "isDefault": false, + "priority": 1, + "conditions": [ + { + "usageDetailPattern": "(input|prompt|cached)", + "operator": "gt", + "value": 200000 + } + ], + "prices": { + "input": 0.000004, + "input_modality_1": 0.000004, + "prompt_token_count": 0.000004, + "promptTokenCount": 0.000004, + "input_cached_tokens": 4e-7, + "cached_content_token_count": 4e-7, + "output": 0.000018, + "output_modality_1": 0.000018, + "candidates_token_count": 0.000018, + "candidatesTokenCount": 0.000018, + "thoughtsTokenCount": 0.000018, + "thoughts_token_count": 0.000018, + "output_reasoning": 0.000018 + } + } + ] + }, + { + "modelName": "gpt-5.2", + "matchPattern": "(?i)^(openai/)?(gpt-5.2)$", + "startDate": "2025-12-12T09:00:06.513Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00000175, + "input_cached_tokens": 1.75e-7, + "input_cache_read": 1.75e-7, + "output": 0.000014, + "output_reasoning_tokens": 0.000014, + "output_reasoning": 0.000014 + } + } + ] + }, + { + "modelName": "gpt-5.2-2025-12-11", + "matchPattern": "(?i)^(openai/)?(gpt-5.2-2025-12-11)$", + "startDate": "2025-12-12T09:00:06.513Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 
0.00000175, + "input_cached_tokens": 1.75e-7, + "input_cache_read": 1.75e-7, + "output": 0.000014, + "output_reasoning_tokens": 0.000014, + "output_reasoning": 0.000014 + } + } + ] + }, + { + "modelName": "gpt-5.2-pro", + "matchPattern": "(?i)^(openai/)?(gpt-5.2-pro)$", + "startDate": "2025-12-12T09:00:06.513Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000021, + "output": 0.000168, + "output_reasoning_tokens": 0.000168, + "output_reasoning": 0.000168 + } + } + ] + }, + { + "modelName": "gpt-5.2-pro-2025-12-11", + "matchPattern": "(?i)^(openai/)?(gpt-5.2-pro-2025-12-11)$", + "startDate": "2025-12-12T09:00:06.513Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.000021, + "output": 0.000168, + "output_reasoning_tokens": 0.000168, + "output_reasoning": 0.000168 + } + } + ] + }, + { + "modelName": "gpt-5.4", + "matchPattern": "(?i)^(openai/)?(gpt-5.4)$", + "startDate": "2026-03-05T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 2.5e-7, + "input_cache_read": 2.5e-7, + "output": 0.000015, + "output_reasoning_tokens": 0.000015, + "output_reasoning": 0.000015 + } + } + ] + }, + { + "modelName": "gpt-5.4-pro", + "matchPattern": "(?i)^(openai/)?(gpt-5.4-pro)$", + "startDate": "2026-03-05T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00018, + "output_reasoning_tokens": 0.00018, + "output_reasoning": 0.00018 + } + } + ] + }, + { + "modelName": "gpt-5.4-2026-03-05", + "matchPattern": "(?i)^(openai/)?(gpt-5.4-2026-03-05)$", + "startDate": "2026-03-05T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + 
"conditions": [], + "prices": { + "input": 0.0000025, + "input_cached_tokens": 2.5e-7, + "input_cache_read": 2.5e-7, + "output": 0.000015, + "output_reasoning_tokens": 0.000015, + "output_reasoning": 0.000015 + } + } + ] + }, + { + "modelName": "gpt-5.4-pro-2026-03-05", + "matchPattern": "(?i)^(openai/)?(gpt-5.4-pro-2026-03-05)$", + "startDate": "2026-03-05T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 0.00003, + "output": 0.00018, + "output_reasoning_tokens": 0.00018, + "output_reasoning": 0.00018 + } + } + ] + }, + { + "modelName": "gemini-3-flash-preview", + "matchPattern": "(?i)^(google/)?(gemini-3-flash-preview)$", + "startDate": "2025-12-21T12:01:42.282Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 5e-7, + "input_modality_1": 5e-7, + "prompt_token_count": 5e-7, + "promptTokenCount": 5e-7, + "input_cached_tokens": 5e-8, + "cached_content_token_count": 5e-8, + "output": 0.000003, + "output_modality_1": 0.000003, + "candidates_token_count": 0.000003, + "candidatesTokenCount": 0.000003, + "thoughtsTokenCount": 0.000003, + "thoughts_token_count": 0.000003, + "output_reasoning": 0.000003 + } + } + ] + }, + { + "modelName": "gemini-3.1-flash-lite-preview", + "matchPattern": "(?i)^(google/)?(gemini-3.1-flash-lite-preview)$", + "startDate": "2026-03-03T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input": 2.5e-7, + "input_modality_1": 2.5e-7, + "prompt_token_count": 2.5e-7, + "promptTokenCount": 2.5e-7, + "input_cached_tokens": 2.5e-8, + "cached_content_token_count": 2.5e-8, + "output": 0.0000015, + "output_modality_1": 0.0000015, + "candidates_token_count": 0.0000015, + "candidatesTokenCount": 0.0000015, + "thoughtsTokenCount": 0.0000015, + "thoughts_token_count": 0.0000015, + "output_reasoning": 
0.0000015, + "input_audio_tokens": 5e-7 + } + } + ] + }, + { + "modelName": "gemini-live-2.5-flash-native-audio", + "matchPattern": "(?i)^(google/)?(gemini-live-2.5-flash-native-audio)$", + "startDate": "2026-03-16T00:00:00.000Z", + "pricingTiers": [ + { + "name": "Standard", + "isDefault": true, + "priority": 0, + "conditions": [], + "prices": { + "input_text": 5e-7, + "input_audio": 0.000003, + "input_image": 0.000003, + "output_text": 0.000002, + "output_audio": 0.000012 + } + } + ] + } +]; diff --git a/internal-packages/llm-pricing/src/index.ts b/internal-packages/llm-pricing/src/index.ts new file mode 100644 index 00000000000..3632434c137 --- /dev/null +++ b/internal-packages/llm-pricing/src/index.ts @@ -0,0 +1,11 @@ +export { ModelPricingRegistry } from "./registry.js"; +export { seedLlmPricing } from "./seed.js"; +export { defaultModelPrices } from "./defaultPrices.js"; +export type { + LlmModelWithPricing, + LlmCostResult, + LlmPricingTierWithPrices, + LlmPriceEntry, + PricingCondition, + DefaultModelDefinition, +} from "./types.js"; diff --git a/internal-packages/llm-pricing/src/registry.test.ts b/internal-packages/llm-pricing/src/registry.test.ts new file mode 100644 index 00000000000..679c8c4cfcf --- /dev/null +++ b/internal-packages/llm-pricing/src/registry.test.ts @@ -0,0 +1,396 @@ +import { describe, it, expect, beforeEach } from "vitest"; +import { ModelPricingRegistry } from "./registry.js"; +import { defaultModelPrices } from "./defaultPrices.js"; +import type { LlmModelWithPricing } from "./types.js"; + +// Convert POSIX-style (?i) inline flag to JS RegExp 'i' flag +function compilePattern(pattern: string): RegExp { + if (pattern.startsWith("(?i)")) { + return new RegExp(pattern.slice(4), "i"); + } + return new RegExp(pattern); +} + +// Create a mock registry that we can load with test data without Prisma +class TestableRegistry extends ModelPricingRegistry { + loadPatterns(models: LlmModelWithPricing[]) { + // Access private fields via any cast 
for testing + const self = this as any; + self._patterns = models.map((model) => ({ + regex: compilePattern(model.matchPattern), + model, + })); + self._exactMatchCache = new Map(); + self._loaded = true; + } +} + +const gpt4o: LlmModelWithPricing = { + id: "model-gpt4o", + friendlyId: "llm_model_gpt4o", + modelName: "gpt-4o", + matchPattern: "^gpt-4o(-\\d{4}-\\d{2}-\\d{2})?$", + startDate: null, + pricingTiers: [ + { + id: "tier-gpt4o-standard", + name: "Standard", + isDefault: true, + priority: 0, + conditions: [], + prices: [ + { usageType: "input", price: 0.0000025 }, + { usageType: "output", price: 0.00001 }, + { usageType: "input_cached_tokens", price: 0.00000125 }, + ], + }, + ], +}; + +const claudeSonnet: LlmModelWithPricing = { + id: "model-claude-sonnet", + friendlyId: "llm_model_claude_sonnet", + modelName: "claude-sonnet-4-0", + matchPattern: "^claude-sonnet-4-0(-\\d{8})?$", + startDate: null, + pricingTiers: [ + { + id: "tier-claude-sonnet-standard", + name: "Standard", + isDefault: true, + priority: 0, + conditions: [], + prices: [ + { usageType: "input", price: 0.000003 }, + { usageType: "output", price: 0.000015 }, + { usageType: "input_cached_tokens", price: 0.0000015 }, + ], + }, + ], +}; + +describe("ModelPricingRegistry", () => { + let registry: TestableRegistry; + + beforeEach(() => { + registry = new TestableRegistry(null as any); + registry.loadPatterns([gpt4o, claudeSonnet]); + }); + + describe("match", () => { + it("should match exact model name", () => { + const result = registry.match("gpt-4o"); + expect(result).not.toBeNull(); + expect(result!.modelName).toBe("gpt-4o"); + }); + + it("should match model with date suffix", () => { + const result = registry.match("gpt-4o-2024-08-06"); + expect(result).not.toBeNull(); + expect(result!.modelName).toBe("gpt-4o"); + }); + + it("should match claude model", () => { + const result = registry.match("claude-sonnet-4-0-20250514"); + expect(result).not.toBeNull(); + 
expect(result!.modelName).toBe("claude-sonnet-4-0"); + }); + + it("should return null for unknown model", () => { + const result = registry.match("unknown-model-xyz"); + expect(result).toBeNull(); + }); + + it("should cache exact matches", () => { + registry.match("gpt-4o"); + registry.match("gpt-4o"); + // Second call should use cache - no way to verify without mocking, but it shouldn't error + expect(registry.match("gpt-4o")!.modelName).toBe("gpt-4o"); + }); + + it("should cache misses", () => { + expect(registry.match("unknown")).toBeNull(); + expect(registry.match("unknown")).toBeNull(); + }); + }); + + describe("calculateCost", () => { + it("should calculate cost for input and output tokens", () => { + const result = registry.calculateCost("gpt-4o", { + input: 1000, + output: 100, + }); + + expect(result).not.toBeNull(); + expect(result!.matchedModelName).toBe("gpt-4o"); + expect(result!.pricingTierName).toBe("Standard"); + expect(result!.inputCost).toBeCloseTo(0.0025); // 1000 * 0.0000025 + expect(result!.outputCost).toBeCloseTo(0.001); // 100 * 0.00001 + expect(result!.totalCost).toBeCloseTo(0.0035); + }); + + it("should include cached token costs", () => { + const result = registry.calculateCost("gpt-4o", { + input: 500, + output: 50, + input_cached_tokens: 200, + }); + + expect(result).not.toBeNull(); + expect(result!.costDetails["input"]).toBeCloseTo(0.00125); // 500 * 0.0000025 + expect(result!.costDetails["output"]).toBeCloseTo(0.0005); // 50 * 0.00001 + expect(result!.costDetails["input_cached_tokens"]).toBeCloseTo(0.00025); // 200 * 0.00000125 + expect(result!.totalCost).toBeCloseTo(0.002); + }); + + it("should return null for unknown model", () => { + const result = registry.calculateCost("unknown-model", { input: 100, output: 50 }); + expect(result).toBeNull(); + }); + + it("should handle zero tokens", () => { + const result = registry.calculateCost("gpt-4o", { input: 0, output: 0 }); + expect(result).not.toBeNull(); + 
expect(result!.totalCost).toBe(0); + }); + + it("should handle missing usage types gracefully", () => { + const result = registry.calculateCost("gpt-4o", { input: 100 }); + expect(result).not.toBeNull(); + expect(result!.inputCost).toBeCloseTo(0.00025); + expect(result!.outputCost).toBe(0); // No output tokens + expect(result!.totalCost).toBeCloseTo(0.00025); + }); + }); + + describe("isLoaded", () => { + it("should return false before loading", () => { + const freshRegistry = new TestableRegistry(null as any); + expect(freshRegistry.isLoaded).toBe(false); + }); + + it("should return true after loading", () => { + expect(registry.isLoaded).toBe(true); + }); + }); + + describe("prefix stripping", () => { + it("should match gateway-prefixed model names", () => { + const result = registry.match("openai/gpt-4o"); + expect(result).not.toBeNull(); + expect(result!.modelName).toBe("gpt-4o"); + }); + + it("should match openrouter-prefixed model names with date suffix", () => { + const result = registry.match("openai/gpt-4o-2024-08-06"); + expect(result).not.toBeNull(); + expect(result!.modelName).toBe("gpt-4o"); + }); + + it("should return null for prefixed unknown model", () => { + const result = registry.match("xai/unknown-model"); + expect(result).toBeNull(); + }); + }); + + describe("tier matching", () => { + const multiTierModel: LlmModelWithPricing = { + id: "model-gemini-pro", + friendlyId: "llm_model_gemini_pro", + modelName: "gemini-2.5-pro", + matchPattern: "^gemini-2\\.5-pro$", + startDate: null, + pricingTiers: [ + { + id: "tier-large-context", + name: "Large Context", + isDefault: false, + priority: 0, + conditions: [ + { usageDetailPattern: "input", operator: "gt" as const, value: 200000 }, + ], + prices: [ + { usageType: "input", price: 0.0000025 }, + { usageType: "output", price: 0.00001 }, + ], + }, + { + id: "tier-standard", + name: "Standard", + isDefault: true, + priority: 1, + conditions: [], + prices: [ + { usageType: "input", price: 0.00000125 }, + { 
usageType: "output", price: 0.000005 }, + ], + }, + ], + }; + + it("should use conditional tier when conditions match", () => { + const tieredRegistry = new TestableRegistry(null as any); + tieredRegistry.loadPatterns([multiTierModel]); + + const result = tieredRegistry.calculateCost("gemini-2.5-pro", { + input: 250000, + output: 1000, + }); + + expect(result).not.toBeNull(); + expect(result!.pricingTierName).toBe("Large Context"); + expect(result!.inputCost).toBeCloseTo(0.625); // 250000 * 0.0000025 + }); + + it("should fall back to default tier when conditions do not match", () => { + const tieredRegistry = new TestableRegistry(null as any); + tieredRegistry.loadPatterns([multiTierModel]); + + const result = tieredRegistry.calculateCost("gemini-2.5-pro", { + input: 1000, + output: 100, + }); + + expect(result).not.toBeNull(); + expect(result!.pricingTierName).toBe("Standard"); + expect(result!.inputCost).toBeCloseTo(0.00125); // 1000 * 0.00000125 + }); + + it("should not let unconditional tier win over conditional match", () => { + // Model where unconditional tier has lower priority than conditional + const model: LlmModelWithPricing = { + ...multiTierModel, + pricingTiers: [ + { + id: "tier-unconditional", + name: "Unconditional", + isDefault: false, + priority: 0, + conditions: [], + prices: [{ usageType: "input", price: 0.001 }], + }, + { + id: "tier-conditional", + name: "Conditional", + isDefault: false, + priority: 1, + conditions: [ + { usageDetailPattern: "input", operator: "gt" as const, value: 100 }, + ], + prices: [{ usageType: "input", price: 0.0001 }], + }, + { + id: "tier-default", + name: "Default", + isDefault: true, + priority: 2, + conditions: [], + prices: [{ usageType: "input", price: 0.01 }], + }, + ], + }; + + const tieredRegistry = new TestableRegistry(null as any); + tieredRegistry.loadPatterns([model]); + + // Condition matches — conditional tier should win, not the unconditional one + const result = 
tieredRegistry.calculateCost("gemini-2.5-pro", { input: 500 }); + expect(result).not.toBeNull(); + expect(result!.pricingTierName).toBe("Conditional"); + }); + + it("should fall back to isDefault tier when no conditions match", () => { + const model: LlmModelWithPricing = { + ...multiTierModel, + pricingTiers: [ + { + id: "tier-conditional", + name: "Conditional", + isDefault: false, + priority: 0, + conditions: [ + { usageDetailPattern: "input", operator: "gt" as const, value: 999999 }, + ], + prices: [{ usageType: "input", price: 0.001 }], + }, + { + id: "tier-default", + name: "Default", + isDefault: true, + priority: 1, + conditions: [], + prices: [{ usageType: "input", price: 0.0001 }], + }, + ], + }; + + const tieredRegistry = new TestableRegistry(null as any); + tieredRegistry.loadPatterns([model]); + + const result = tieredRegistry.calculateCost("gemini-2.5-pro", { input: 100 }); + expect(result).not.toBeNull(); + expect(result!.pricingTierName).toBe("Default"); + }); + }); + + describe("defaultModelPrices (Langfuse JSON)", () => { + it("should load all models from the JSON file", () => { + expect(defaultModelPrices.length).toBeGreaterThan(100); + }); + + it("should compile all match patterns without errors", () => { + const langfuseRegistry = new TestableRegistry(null as any); + const models: LlmModelWithPricing[] = defaultModelPrices.map((def, i) => ({ + id: `test-${i}`, + friendlyId: `llm_model_test${i}`, + modelName: def.modelName, + matchPattern: def.matchPattern, + startDate: def.startDate ? 
new Date(def.startDate) : null, + pricingTiers: def.pricingTiers.map((tier, j) => ({ + id: `tier-${i}-${j}`, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: Object.entries(tier.prices).map(([usageType, price]) => ({ + usageType, + price, + })), + })), + })); + + // This should not throw — all 141 patterns should compile + expect(() => langfuseRegistry.loadPatterns(models)).not.toThrow(); + expect(langfuseRegistry.isLoaded).toBe(true); + }); + + it("should match real-world model names from Langfuse patterns", () => { + const langfuseRegistry = new TestableRegistry(null as any); + const models: LlmModelWithPricing[] = defaultModelPrices.map((def, i) => ({ + id: `test-${i}`, + friendlyId: `llm_model_test${i}`, + modelName: def.modelName, + matchPattern: def.matchPattern, + startDate: null, + pricingTiers: def.pricingTiers.map((tier, j) => ({ + id: `tier-${i}-${j}`, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: Object.entries(tier.prices).map(([usageType, price]) => ({ + usageType, + price, + })), + })), + })); + langfuseRegistry.loadPatterns(models); + + // Test real model strings that SDKs send + expect(langfuseRegistry.match("gpt-4o")).not.toBeNull(); + expect(langfuseRegistry.match("gpt-4o-mini")).not.toBeNull(); + expect(langfuseRegistry.match("claude-sonnet-4-5-20250929")).not.toBeNull(); + expect(langfuseRegistry.match("claude-sonnet-4-20250514")).not.toBeNull(); + }); + }); +}); diff --git a/internal-packages/llm-pricing/src/registry.ts b/internal-packages/llm-pricing/src/registry.ts new file mode 100644 index 00000000000..80da40ba980 --- /dev/null +++ b/internal-packages/llm-pricing/src/registry.ts @@ -0,0 +1,223 @@ +import type { PrismaClient, PrismaReplicaClient } from "@trigger.dev/database"; +import type { + LlmModelWithPricing, + LlmCostResult, + LlmPricingTierWithPrices, + PricingCondition, +} from "./types.js"; + 
+type CompiledPattern = { + regex: RegExp; + model: LlmModelWithPricing; +}; + +// Convert POSIX-style (?i) inline flag to JS RegExp 'i' flag +function compilePattern(pattern: string): RegExp { + if (pattern.startsWith("(?i)")) { + return new RegExp(pattern.slice(4), "i"); + } + return new RegExp(pattern); +} + +export class ModelPricingRegistry { + private _prisma: PrismaClient | PrismaReplicaClient; + private _patterns: CompiledPattern[] = []; + // TODO: When we add project-based models (users adding their own), this cache grows unbounded + // between reloads. Fine-tuned model IDs (e.g. "ft:gpt-3.5-turbo:org:name:id") create unique + // entries per model string. Consider adding an LRU cap or size limit at that point. + private _exactMatchCache: Map = new Map(); + private _loaded = false; + private _readyResolve!: () => void; + + /** Resolves once the initial `loadFromDatabase()` completes successfully. */ + readonly isReady: Promise; + + constructor(prisma: PrismaClient | PrismaReplicaClient) { + this._prisma = prisma; + this.isReady = new Promise((resolve) => { + this._readyResolve = resolve; + }); + } + + get isLoaded(): boolean { + return this._loaded; + } + + async loadFromDatabase(): Promise { + const models = await this._prisma.llmModel.findMany({ + where: { projectId: null }, + include: { + pricingTiers: { + include: { prices: true }, + orderBy: { priority: "asc" }, + }, + }, + orderBy: [{ startDate: "desc" }], + }); + + const compiled: CompiledPattern[] = []; + + for (const model of models) { + try { + const regex = compilePattern(model.matchPattern); + const tiers: LlmPricingTierWithPrices[] = model.pricingTiers.map((tier) => ({ + id: tier.id, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: (tier.conditions as PricingCondition[]) ?? 
[], + prices: tier.prices.map((p) => ({ + usageType: p.usageType, + price: Number(p.price), + })), + })); + + compiled.push({ + regex, + model: { + id: model.id, + friendlyId: model.friendlyId, + modelName: model.modelName, + matchPattern: model.matchPattern, + startDate: model.startDate, + pricingTiers: tiers, + }, + }); + } catch { + // Skip models with invalid regex patterns + console.warn(`Invalid regex pattern for model ${model.modelName}: ${model.matchPattern}`); + } + } + + this._patterns = compiled; + this._exactMatchCache.clear(); + + if (!this._loaded) { + this._loaded = true; + this._readyResolve(); + } + } + + async reload(): Promise { + await this.loadFromDatabase(); + } + + match(responseModel: string): LlmModelWithPricing | null { + if (!this._loaded) return null; + + // Check exact match cache + const cached = this._exactMatchCache.get(responseModel); + if (cached !== undefined) return cached; + + // Iterate compiled regex patterns + for (const { regex, model } of this._patterns) { + if (regex.test(responseModel)) { + this._exactMatchCache.set(responseModel, model); + return model; + } + } + + // Fallback: strip provider prefix (e.g. "mistral/mistral-large-3" → "mistral-large-3") + // Gateway and OpenRouter prepend the provider to the model name. 
+ if (responseModel.includes("/")) { + const stripped = responseModel.split("/").slice(1).join("/"); + for (const { regex, model } of this._patterns) { + if (regex.test(stripped)) { + this._exactMatchCache.set(responseModel, model); + return model; + } + } + } + + // Cache miss + this._exactMatchCache.set(responseModel, null); + return null; + } + + calculateCost( + responseModel: string, + usageDetails: Record + ): LlmCostResult | null { + const model = this.match(responseModel); + if (!model) return null; + + const tier = this._matchPricingTier(model.pricingTiers, usageDetails); + if (!tier) return null; + + const costDetails: Record = {}; + let totalCost = 0; + + for (const priceEntry of tier.prices) { + const tokenCount = usageDetails[priceEntry.usageType] ?? 0; + if (tokenCount === 0) continue; + const cost = tokenCount * priceEntry.price; + costDetails[priceEntry.usageType] = cost; + totalCost += cost; + } + + const inputCost = costDetails["input"] ?? 0; + const outputCost = costDetails["output"] ?? 0; + + return { + matchedModelId: model.friendlyId, + matchedModelName: model.modelName, + pricingTierId: tier.id, + pricingTierName: tier.name, + inputCost, + outputCost, + totalCost, + costDetails, + }; + } + + private _matchPricingTier( + tiers: LlmPricingTierWithPrices[], + usageDetails: Record + ): LlmPricingTierWithPrices | null { + if (tiers.length === 0) return null; + + // Tiers are sorted by priority ascending (lowest first). + // First pass: evaluate tiers that have conditions — first match wins. + for (const tier of tiers) { + if (tier.conditions.length > 0 && this._evaluateConditions(tier.conditions, usageDetails)) { + return tier; + } + } + + // Second pass: fall back to the default tier, or first tier with no conditions + const defaultTier = tiers.find((t) => t.isDefault); + if (defaultTier) return defaultTier; + + const unconditional = tiers.find((t) => t.conditions.length === 0); + return unconditional ?? tiers[0] ?? 
null; + } + + private _evaluateConditions( + conditions: PricingCondition[], + usageDetails: Record + ): boolean { + return conditions.every((condition) => { + // Find matching usage detail key + const regex = new RegExp(condition.usageDetailPattern); + const matchingValue = Object.entries(usageDetails).find(([key]) => regex.test(key)); + const value = matchingValue?.[1] ?? 0; + + switch (condition.operator) { + case "gt": + return value > condition.value; + case "gte": + return value >= condition.value; + case "lt": + return value < condition.value; + case "lte": + return value <= condition.value; + case "eq": + return value === condition.value; + case "neq": + return value !== condition.value; + default: + return false; + } + }); + } +} diff --git a/internal-packages/llm-pricing/src/seed.ts b/internal-packages/llm-pricing/src/seed.ts new file mode 100644 index 00000000000..d068c62a66d --- /dev/null +++ b/internal-packages/llm-pricing/src/seed.ts @@ -0,0 +1,62 @@ +import type { PrismaClient } from "@trigger.dev/database"; +import { generateFriendlyId } from "@trigger.dev/core/v3/isomorphic"; +import { defaultModelPrices } from "./defaultPrices.js"; + +export async function seedLlmPricing(prisma: PrismaClient): Promise<{ + modelsCreated: number; + modelsSkipped: number; +}> { + let modelsCreated = 0; + let modelsSkipped = 0; + + for (const modelDef of defaultModelPrices) { + // Check if this model already exists (don't overwrite admin changes) + const existing = await prisma.llmModel.findFirst({ + where: { + projectId: null, + modelName: modelDef.modelName, + }, + }); + + if (existing) { + modelsSkipped++; + continue; + } + + // Create model + tiers atomically so partial models can't be left behind + await prisma.$transaction(async (tx) => { + const model = await tx.llmModel.create({ + data: { + friendlyId: generateFriendlyId("llm_model"), + modelName: modelDef.modelName.trim(), + matchPattern: modelDef.matchPattern, + startDate: modelDef.startDate ? 
new Date(modelDef.startDate) : null, + source: "default", + }, + }); + + for (const tier of modelDef.pricingTiers) { + await tx.llmPricingTier.create({ + data: { + modelId: model.id, + name: tier.name, + isDefault: tier.isDefault, + priority: tier.priority, + conditions: tier.conditions, + prices: { + create: Object.entries(tier.prices).map(([usageType, price]) => ({ + modelId: model.id, + usageType, + price, + })), + }, + }, + }); + } + }); + + modelsCreated++; + } + + return { modelsCreated, modelsSkipped }; +} diff --git a/internal-packages/llm-pricing/src/types.ts b/internal-packages/llm-pricing/src/types.ts new file mode 100644 index 00000000000..2deec6246ed --- /dev/null +++ b/internal-packages/llm-pricing/src/types.ts @@ -0,0 +1,54 @@ +import type { Decimal } from "@trigger.dev/database"; + +export type PricingCondition = { + usageDetailPattern: string; + operator: "gt" | "gte" | "lt" | "lte" | "eq" | "neq"; + value: number; +}; + +export type LlmPriceEntry = { + usageType: string; + price: number; +}; + +export type LlmPricingTierWithPrices = { + id: string; + name: string; + isDefault: boolean; + priority: number; + conditions: PricingCondition[]; + prices: LlmPriceEntry[]; +}; + +export type LlmModelWithPricing = { + id: string; + friendlyId: string; + modelName: string; + matchPattern: string; + startDate: Date | null; + pricingTiers: LlmPricingTierWithPrices[]; +}; + +export type LlmCostResult = { + matchedModelId: string; + matchedModelName: string; + pricingTierId: string; + pricingTierName: string; + inputCost: number; + outputCost: number; + totalCost: number; + costDetails: Record; +}; + +export type DefaultModelDefinition = { + modelName: string; + matchPattern: string; + startDate?: string; + pricingTiers: Array<{ + name: string; + isDefault: boolean; + priority: number; + conditions: PricingCondition[]; + prices: Record; + }>; +}; diff --git a/internal-packages/llm-pricing/tsconfig.json b/internal-packages/llm-pricing/tsconfig.json new file mode 
100644 index 00000000000..c64cf33133b --- /dev/null +++ b/internal-packages/llm-pricing/tsconfig.json @@ -0,0 +1,19 @@ +{ + "compilerOptions": { + "target": "ES2019", + "lib": ["ES2019", "DOM", "DOM.Iterable", "DOM.AsyncIterable"], + "module": "Node16", + "moduleResolution": "Node16", + "moduleDetection": "force", + "verbatimModuleSyntax": false, + "esModuleInterop": true, + "forceConsistentCasingInFileNames": true, + "isolatedModules": true, + "preserveWatchOutput": true, + "skipLibCheck": true, + "noEmit": true, + "strict": true, + "resolveJsonModule": true + }, + "exclude": ["node_modules"] +} diff --git a/internal-packages/tsql/src/query/printer.ts b/internal-packages/tsql/src/query/printer.ts index b6e9547db06..d45002f6715 100644 --- a/internal-packages/tsql/src/query/printer.ts +++ b/internal-packages/tsql/src/query/printer.ts @@ -2370,6 +2370,21 @@ export class ClickHousePrinter { // Try to resolve column names through table context const resolvedChain = this.resolveFieldChain(chainWithPrefix); + // For Map columns, convert dot-notation to bracket syntax: + // metadata.user -> metadata['user'] + if (resolvedChain.length > 1) { + const rootColumnSchema = this.resolveFieldToColumnSchema([node.chain[0]]); + if (rootColumnSchema?.type.startsWith("Map(")) { + const rootCol = this.printIdentifierOrIndex(resolvedChain[0]); + const mapKeys = resolvedChain.slice(1); + let result = rootCol; + for (const key of mapKeys) { + result = `${result}[${this.context.addValue(String(key))}]`; + } + return result; + } + } + // Print each chain element let result = resolvedChain.map((part) => this.printIdentifierOrIndex(part)).join("."); diff --git a/internal-packages/tsql/src/query/schema.ts b/internal-packages/tsql/src/query/schema.ts index 2ea81091aad..00a28382de5 100644 --- a/internal-packages/tsql/src/query/schema.ts +++ b/internal-packages/tsql/src/query/schema.ts @@ -23,6 +23,9 @@ export type ClickHouseType = | "Date32" | "DateTime" | "DateTime64" + | "DateTime64(3)" + | 
"DateTime64(9)" + | "Decimal64(12)" | "UUID" | "Bool" | "JSON" @@ -281,6 +284,7 @@ export type ColumnFormatType = | "runId" | "runStatus" | "duration" + | "durationNs" | "durationSeconds" | "costInDollars" | "cost" diff --git a/packages/cli-v3/src/mcp/config.ts b/packages/cli-v3/src/mcp/config.ts index c4532b27f5e..c3615420ad5 100644 --- a/packages/cli-v3/src/mcp/config.ts +++ b/packages/cli-v3/src/mcp/config.ts @@ -116,7 +116,7 @@ export const toolsMetadata = { name: "get_query_schema", title: "Get Query Schema", description: - "Get the column schema for a specific TRQL table. Available tables: 'runs' (task execution data), 'metrics' (CPU, memory, custom metrics). Returns columns, types, descriptions, and allowed values for the specified table.", + "Get the column schema for a specific TRQL table. Available tables: 'runs' (task execution data), 'metrics' (CPU, memory, custom metrics), 'llm_metrics' (LLM token usage, costs, latency). Returns columns, types, descriptions, and allowed values for the specified table.", }, list_dashboards: { name: "list_dashboards", diff --git a/packages/core/src/v3/schemas/style.ts b/packages/core/src/v3/schemas/style.ts index eab62c5b41b..2f833b800ac 100644 --- a/packages/core/src/v3/schemas/style.ts +++ b/packages/core/src/v3/schemas/style.ts @@ -11,11 +11,12 @@ const AccessoryItem = z.object({ text: z.string(), variant: z.string().optional(), url: z.string().optional(), + icon: z.string().optional(), }); const Accessory = z.object({ items: z.array(AccessoryItem), - style: z.enum(["codepath"]).optional(), + style: z.enum(["codepath", "pills"]).optional(), }); export type Accessory = z.infer; diff --git a/packages/core/src/v3/taskContext/otelProcessors.ts b/packages/core/src/v3/taskContext/otelProcessors.ts index 096f7c0ce76..1c0958d655d 100644 --- a/packages/core/src/v3/taskContext/otelProcessors.ts +++ b/packages/core/src/v3/taskContext/otelProcessors.ts @@ -30,6 +30,12 @@ export class TaskContextSpanProcessor implements 
SpanProcessor { span.setAttributes( flattenAttributes(taskContext.attributes, SemanticInternalAttributes.METADATA) ); + + // Set run tags as a proper array attribute (not flattened) so it arrives + // as an OTEL ArrayValue and can be extracted on the server side. + if (!taskContext.isRunDisabled && taskContext.ctx.run.tags?.length) { + span.setAttribute(SemanticInternalAttributes.RUN_TAGS, taskContext.ctx.run.tags); + } } if (!isPartialSpan(span) && !skipPartialSpan(span)) { diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml index 88ac6ad5421..854d4215447 100644 --- a/pnpm-lock.yaml +++ b/pnpm-lock.yaml @@ -302,6 +302,9 @@ importers: '@internal/cache': specifier: workspace:* version: link:../../internal-packages/cache + '@internal/llm-pricing': + specifier: workspace:* + version: link:../../internal-packages/llm-pricing '@internal/redis': specifier: workspace:* version: link:../../internal-packages/redis @@ -1125,6 +1128,15 @@ importers: specifier: 18.2.69 version: 18.2.69 + internal-packages/llm-pricing: + dependencies: + '@trigger.dev/core': + specifier: workspace:* + version: link:../../packages/core + '@trigger.dev/database': + specifier: workspace:* + version: link:../database + internal-packages/otlp-importer: dependencies: long: