Better output from the same model. Fused computation, adaptive precision, surgical expert loading. 305 KB, 19 backends, zero dependencies. https://inference-x.com
21 lines
994 B
Bash
Executable File
21 lines
994 B
Bash
Executable File
#!/bin/bash
# ═══════════════════════════════════════════════════════════════════════════════
# INFERENCE-X — Benchmark Script
# Copyright (C) 2025-2026 Salka Elmadani. All rights reserved.
# Licensed under the Business Source License 1.1 (BSL-1.1)
# See LICENSE file for full terms.
# ═══════════════════════════════════════════════════════════════════════════════
#
# Usage: run from the directory that contains the ./inference-x binary:
#   <this-script> [MODEL] [TOKENS]
#
#   MODEL   path handed to ./inference-x as its first argument
#           (default: ./model.gguf)
#   TOKENS  integer handed to ./inference-x via -n (default: 10)
#
# Prints a one-line hardware summary, then wraps a single ./inference-x
# invocation in the shell's `time` keyword. The script's exit status is the
# exit status of ./inference-x.

set -euo pipefail

readonly BENCH_BIN="./inference-x"
readonly BENCH_PROMPT="Count from 1 to 100."

# Print an error message to stderr and abort with status 1.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Print the number of online CPU cores, or "?" when it cannot be determined.
# nproc is GNU coreutils only, so fall back to getconf on other systems.
cpu_count() {
  if command -v nproc >/dev/null 2>&1; then
    nproc
  elif command -v getconf >/dev/null 2>&1; then
    getconf _NPROCESSORS_ONLN 2>/dev/null || printf '?\n'
  else
    printf '?\n'
  fi
}

# Print total RAM as reported by `free -h`, or "unknown" when `free` is
# missing or its output has no "Mem:" row.
total_ram() {
  local ram=""
  if command -v free >/dev/null 2>&1; then
    # LC_ALL=C keeps the "Mem:" row label untranslated so the awk match holds.
    ram=$(LC_ALL=C free -h 2>/dev/null | awk '/Mem:/{print $2}') || ram=""
  fi
  printf '%s\n' "${ram:-unknown}"
}

main() {
  local model=${1:-"./model.gguf"}
  local tokens=${2:-10}

  # Reject non-numeric token counts up front instead of letting the binary
  # interpret them. A leading minus is tolerated because this script cannot
  # know whether the binary gives negative values a meaning.
  [[ "$tokens" =~ ^-?[0-9]+$ ]] \
    || die "TOKENS must be an integer, got: $tokens"

  # The binary path is relative, so the script only works from the build dir.
  [[ -x "$BENCH_BIN" ]] \
    || die "$BENCH_BIN not found or not executable in $PWD"

  # Only warn: the binary is the authority on what counts as a valid model.
  if [[ ! -e "$model" ]]; then
    printf 'warning: model path does not exist: %s\n' "$model" >&2
  fi

  printf 'Benchmarking %s tokens on: %s\n' "$tokens" "$model"
  printf 'Hardware: %s, %s cores, %s RAM\n' \
    "$(uname -m)" "$(cpu_count)" "$(total_ram)"
  printf '%s\n' "---"

  # -t 0.0 is presumably the sampling temperature (TODO confirm against the
  # inference-x CLI); the flag set is passed through exactly as before.
  time "$BENCH_BIN" "$model" \
    -p "$BENCH_PROMPT" \
    -n "$tokens" \
    -t 0.0 \
    --bench
}

main "$@"