# Configuration file for auto_aiperf.sh (bash syntax; relies on bash-only
# features such as BASH_SOURCE and arrays).

# --- Base environment ---
# Namespace and release name.
# NOTE(review): presumably the Kubernetes namespace / Helm release — confirm
# against auto_aiperf.sh.
NAMESPACE="ai-inference"
RELEASE_NAME="infernex"
# Chart directory. An existing non-empty CHART_DIR from the environment wins;
# the fallback looks like a placeholder path and should be overridden or edited.
CHART_DIR="${CHART_DIR:-/path/to/InferNex/charts/infernex}"
# Project root: an existing non-empty PROJECT_DIR wins, otherwise it is the
# directory two levels above this file, resolved to an absolute path.
# CDPATH is cleared for the cd because, when a relative path resolves through
# CDPATH, cd prints the directory to stdout and the captured value would
# contain the path twice. `--` protects against paths starting with '-'.
PROJECT_DIR="${PROJECT_DIR:-$(CDPATH= cd -- "$(dirname -- "${BASH_SOURCE[0]}")/../.." && pwd)}"
# Artifacts directory under the project root.
ARTIFACTS_DIR="${PROJECT_DIR}/artifacts"
# Base name of the result directory.
# NOTE(review): presumably must match the directory name aiperf derives from
# the model / endpoint type used in AIPERF_CMD — confirm.
BASE_RESULT_DIR_NAME="Qwen_Qwen3-8B-openai-chat-fixed_schedule"

# --- Polling and waiting ---
# Per the variable names, every value in this section is in seconds.
# Timeout for pods to become ready.
PODS_READY_TIMEOUT_SECONDS='900'
# Wait applied after an uninstall.
POST_UNINSTALL_WAIT_SECONDS='20'
# Interval between polls.
POLL_INTERVAL_SECONDS='5'
# Interval between loop iterations.
LOOP_INTERVAL_SECONDS='10'

# --- Process matching and gateway ---
# Name and port of the gateway service (the port is kept as a string).
GATEWAY_SERVICE_NAME='inference-gateway-istio'
GATEWAY_SERVICE_PORT='80'
# Pattern used to match the aiperf process; it equals the first two words of
# AIPERF_CMD.
AIPERF_PROCESS_PATTERN='aiperf profile'

# --- Decode metrics collector script ---
# Idle timeout for decode-cost collection.
# NOTE(review): unit is not stated here (presumably seconds) — confirm.
DECODE_COST_IDLE_TIMEOUT='10'
# Collector script path, located under PROJECT_DIR (which must already be set).
DECODE_COLLECTOR_SCRIPT="${PROJECT_DIR}"'/scripts/perf/collect_kv_transfer_metrics.py'
# Python interpreter name.
PYTHON_BIN='python3'

# --- aiperf command (bash array) ---
# Stored as an array so each argument stays a separate word; expand it with
# "${AIPERF_CMD[@]}". Built up one option (and its value) at a time.
AIPERF_CMD=('aiperf' 'profile')
# The input file path is relative, so it depends on the working directory in
# effect when the command runs.
AIPERF_CMD+=('--input-file' 'traces/toolagent_trace.jsonl')
AIPERF_CMD+=('--custom-dataset-type' 'mooncake_trace')
AIPERF_CMD+=('--model' 'Qwen/Qwen3-8B')
AIPERF_CMD+=('--endpoint-type' 'chat')
AIPERF_CMD+=('--synthesis-max-isl' '15000')
AIPERF_CMD+=('--extra-inputs' 'ignore_eos:true')
AIPERF_CMD+=('--isl-block-size' '512')
AIPERF_CMD+=('--streaming')