# Load model (FP16 for speed).
# NOTE(review): assumes MidV418Pipeline.from_pretrained accepts a `device`
# keyword — confirm against the pipeline's API.
pipe = MidV418Pipeline.from_pretrained(
    "duckai/midv-418",
    torch_dtype=torch.float16,
    device="cuda",
)