# Here is the command-line style inference code.
#
# Invokes `swift infer` with the adapter checkpoint given by --adapters.
# CUDA_VISIBLE_DEVICES=0 is set only in the environment of this one command.
# Each trailing backslash must be the very last character on its line so the
# shell joins the lines into a single command.
CUDA_VISIBLE_DEVICES=0 \
swift infer \
    --adapters output/v0-20250416-154745/checkpoint-93 \
    --stream true \
    --temperature 0 \
    --max_new_tokens 2048