# Optimizing inference

# Flat mapping of string keys to string values, one entry per line.
# NOTE(review): presumably each key is an old page path and each value is
# the path it now resolves to -- confirm against the tool that reads this
# file.
perf_infer_gpu_many: perf_infer_gpu_one
transformers_agents: agents
# The value here contains a `/`, unlike the single-segment values above.
quantization: quantization/overview