Overhaul rack system with split FLOPS, VRAM, cooling, interconnect, and multi-vendor SKUs

Expand from 10 to 18 rack SKUs across NVIDIA, AMD, and custom ASIC vendors, each with distinct training vs inference FLOPS, VRAM capacity, cooling requirements, and interconnect technology. Adds cooling hierarchy (air/liquid/immersion) that gates rack deployment, VRAM requirements that gate model training by generation, interconnect multipliers for distributed training scaling, and PUE-based energy cost reduction for advanced cooling. Includes save migration from v4 to v5, 6 new research nodes, and UI updates showing split compute stats. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-04-25 02:27:03 -04:00
parent 54220fca70
commit fc1f371c8c
12 changed files with 749 additions and 100 deletions
@@ -3,19 +3,44 @@ import { FLOPS_TO_TOKENS_MULTIPLIER } from '@ai-tycoon/shared';

 export interface CapacityResult {
  totalFlops: number;
+  totalTrainingFlops: number;
+  totalInferenceFlops: number;
+  totalVramGB: number;
  trainingAllocation: number;
  inferenceAllocation: number;
+  effectiveTrainingFlops: number;
+  effectiveInferenceFlops: number;
  tokensPerSecondCapacity: number;
 }

 export function computeCapacity(state: GameState, infrastructure: InfrastructureState): CapacityResult {
-  const totalFlops = infrastructure.totalFlops;
+  const { totalTrainingFlops, totalInferenceFlops, totalVramGB } = infrastructure;
  const trainingAllocation = state.compute.trainingAllocation;
  const inferenceAllocation = 1 - trainingAllocation;
-  const inferenceFlops = totalFlops * inferenceAllocation;
-  const tokensPerSecondCapacity = inferenceFlops * FLOPS_TO_TOKENS_MULTIPLIER;

-  return { totalFlops, trainingAllocation, inferenceAllocation, tokensPerSecondCapacity };
+  // Training hardware can do inference at ~50% efficiency
+  // Inference hardware can do training at ~30% efficiency (no NVLink, poor scaling)
+  const effectiveTrainingFlops =
+    totalTrainingFlops * trainingAllocation +
+    totalInferenceFlops * trainingAllocation * 0.3;
+
+  const effectiveInferenceFlops =
+    totalInferenceFlops * inferenceAllocation +
+    totalTrainingFlops * inferenceAllocation * 0.5;
+
+  const tokensPerSecondCapacity = effectiveInferenceFlops * FLOPS_TO_TOKENS_MULTIPLIER;
+
+  return {
+    totalFlops: totalTrainingFlops + totalInferenceFlops,
+    totalTrainingFlops,
+    totalInferenceFlops,
+    totalVramGB,
+    trainingAllocation,
+    inferenceAllocation,
+    effectiveTrainingFlops,
+    effectiveInferenceFlops,
+    tokensPerSecondCapacity,
+  };
 }

 export function finalizeCompute(capacity: CapacityResult, totalTokenDemand: number): ComputeState {