[ { "ngl": 999, "cpu_moe": true, "t": 6, "tb": 6, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.169961832638464, "best_tps": 26.533887071573073, "vram_used": 4994, "vram_total": 12288, "label": "cpu_moe=True" }, { "ngl": 999, "cpu_moe": false, "t": 6, "tb": 6, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 11.065030380022206, "best_tps": 11.083028272674314, "vram_used": 11949, "vram_total": 12288, "label": "cpu_moe=False" }, { "ngl": 999, "cpu_moe": true, "t": 2, "tb": 2, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 21.473286428302767, "best_tps": 21.746637577851104, "vram_used": 4994, "vram_total": 12288, "label": "t=2 | tb=2" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.552358479030676, "best_tps": 27.314237654089343, "vram_used": 4991, "vram_total": 12288, "label": "t=4 | tb=4" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 6, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.347068485327956, "best_tps": 26.87924726131441, "vram_used": 4993, "vram_total": 12288, "label": "t=4 | tb=6" }, { "ngl": 999, "cpu_moe": true, "t": 6, "tb": 6, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.331286039513458, "best_tps": 26.81427299445741, "vram_used": 5001, "vram_total": 12288, "label": "t=6 | tb=6" }, { "ngl": 999, "cpu_moe": true, "t": 6, "tb": 8, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.391160513711274, "best_tps": 26.735573238878736, "vram_used": 5001, "vram_total": 12288, "label": "t=6 | tb=8" }, { "ngl": 999, "cpu_moe": true, "t": 8, "tb": 8, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 25.32340666199144, "best_tps": 25.87949347494079, "vram_used": 4995, "vram_total": 12288, "label": "t=8 | tb=8" }, { "ngl": 999, "cpu_moe": true, "t": 10, "tb": 10, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 23.752277317850815, "best_tps": 24.98242898809555, "vram_used": 5011, "vram_total": 12288, "label": "t=10 | tb=10" }, { "ngl": 999, "cpu_moe": true, "t": 12, "tb": 12, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 21.75032196383532, "best_tps": 23.18963400077116, "vram_used": 5104, "vram_total": 12288, "label": "t=12 | tb=12" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 128, "b": 512, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 13.27593572827031, "best_tps": 13.337407402920235, "vram_used": 4391, "vram_total": 12288, "label": "ub=128 | b=512" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 256, "b": 1024, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.638687188233188, "best_tps": 27.361082444434413, "vram_used": 4495, "vram_total": 12288, "label": "ub=256 | b=1024" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 256, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.29069503392877, "best_tps": 26.63368832924803, "vram_used": 4490, "vram_total": 12288, "label": "ub=256 | b=2048" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 1024, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.518331831441134, "best_tps": 26.972021321271527, "vram_used": 4984, "vram_total": 12288, "label": "ub=512 | b=1024" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.401541912276873, "best_tps": 26.46530849236633, "vram_used": 4990, "vram_total": 12288, "label": "ub=512 | b=2048" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 26.892711500590455, "best_tps": 26.892711500590455, "vram_used": 5006, "vram_total": 12288, "label": "ub=512 | b=4096" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 1024, "b": 2048, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 12.600209659679201, "best_tps": 12.759356030807627, "vram_used": 12020, "vram_total": 12288, "label": "ub=1024 | b=2048" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 1024, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 6.023959262370547, "best_tps": 8.284882268188156, "vram_used": 11931, "vram_total": 12288, "label": "ub=1024 | b=4096" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 12.96992950856374, "best_tps": 12.96992950856374, "vram_used": 12022, "vram_total": 12288, "label": "ctk=q4_0 | ctv=q4_0" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q8_0", "ctv": "q8_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 11.420078920350697, "best_tps": 13.524778595767653, "vram_used": 12030, "vram_total": 12288, "label": "ctk=q8_0 | ctv=q8_0" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "f16", "ctv": "f16", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 11.978106511464183, "best_tps": 13.729190013094977, "vram_used": 11518, "vram_total": 12288, "label": "ctk=f16 | ctv=f16" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 50, "avg_tps": 16.164278220452957, "best_tps": 22.645890325274323, "vram_used": 11623, "vram_total": 12288, "label": "mmap=True | poll=50 | prio=2" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": false, "prio": 2, "poll": 50, "avg_tps": 16.555542780023114, "best_tps": 23.333815015033892, "vram_used": 9062, "vram_total": 12288, "label": "mmap=False | poll=50 | prio=2" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 0, "avg_tps": 13.003619379106329, "best_tps": 13.031594557134142, "vram_used": 11994, "vram_total": 12288, "label": "mmap=True | poll=0 | prio=2" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 2, "poll": 100, "avg_tps": 5.7762452690702935, "best_tps": 5.795560155803046, "vram_used": 11953, "vram_total": 12288, "label": "mmap=True | poll=100 | prio=2" }, { "ngl": 999, "cpu_moe": true, "t": 4, "tb": 4, "ub": 512, "b": 4096, "ctk": "q4_0", "ctv": "q4_0", "fa": "on", "mlock": true, "mmap": true, "prio": 3, "poll": 50, "avg_tps": 12.59406799687573, "best_tps": 14.966737641114795, "vram_used": 11996, "vram_total": 12288, "label": "mmap=True | poll=50 | prio=3" } ]