update
This commit is contained in:
5
demo.py
5
demo.py
@@ -254,7 +254,7 @@ def main():
|
|||||||
default=1,
|
default=1,
|
||||||
help="Streaming only. Every N-th frame after scale frames is kept as a keyframe. 1 = every frame.",
|
help="Streaming only. Every N-th frame after scale frames is kept as a keyframe. 1 = every frame.",
|
||||||
)
|
)
|
||||||
parser.add_argument("--kv_cache_sliding_window", type=int, default=64)
|
parser.add_argument("--kv_cache_sliding_window", type=int, default=16)
|
||||||
parser.add_argument("--kv_cache_scale_frames", type=int, default=8)
|
parser.add_argument("--kv_cache_scale_frames", type=int, default=8)
|
||||||
parser.add_argument("--use_sdpa", action="store_true", default=False,
|
parser.add_argument("--use_sdpa", action="store_true", default=False,
|
||||||
help="Use SDPA backend (no flashinfer needed). Default: FlashInfer")
|
help="Use SDPA backend (no flashinfer needed). Default: FlashInfer")
|
||||||
@@ -340,8 +340,7 @@ def main():
|
|||||||
num_scale_frames=args.num_scale_frames,
|
num_scale_frames=args.num_scale_frames,
|
||||||
)
|
)
|
||||||
|
|
||||||
t_infer = time.time() - t0
|
print(f"Inference done in {time.time() - t0:.1f}s")
|
||||||
print(f"Inference done: {t_infer:.1f}s ({num_frames / t_infer:.1f} FPS)")
|
|
||||||
|
|
||||||
# ── Post-process ─────────────────────────────────────────────────────────
|
# ── Post-process ─────────────────────────────────────────────────────────
|
||||||
predictions, images_cpu = postprocess(predictions, images)
|
predictions, images_cpu = postprocess(predictions, images)
|
||||||
|
|||||||
Reference in New Issue
Block a user