[ { "name": "Baseline: all expert CPU", "avg_tps": 8.72, "best_tps": 8.74, "vram_gpu0": 620, "vram_gpu1": 6493, "vram_total": 7113, "status": "OK" }, { "name": "n-cpu-moe=60 (4 layers expert GPU)", "avg_tps": 8.72, "best_tps": 8.77, "vram_gpu0": 638, "vram_gpu1": 6493, "vram_total": 7131, "status": "OK" }, { "name": "n-cpu-moe=56 (8 layers expert GPU)", "avg_tps": 8.72, "best_tps": 8.8, "vram_gpu0": 624, "vram_gpu1": 6493, "vram_total": 7117, "status": "OK" }, { "name": "n-cpu-moe=52 (12 layers expert GPU)", "avg_tps": 8.76, "best_tps": 8.79, "vram_gpu0": 634, "vram_gpu1": 6493, "vram_total": 7127, "status": "OK" }, { "name": "n-cpu-moe=48 (16 layers expert GPU)", "avg_tps": 8.81, "best_tps": 8.95, "vram_gpu0": 632, "vram_gpu1": 6493, "vram_total": 7125, "status": "OK" } ]