From 3edbd7c8f73804e4549891746ba770e103c45e80 Mon Sep 17 00:00:00 2001 From: Asmita Goswami Date: Thu, 19 Dec 2024 09:44:37 +0000 Subject: [PATCH] Migrating HL compile and export to infer APIs Signed-off-by: Asmita Goswami --- QEfficient/cloud/infer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/QEfficient/cloud/infer.py b/QEfficient/cloud/infer.py index ba086015..fd7e431d 100644 --- a/QEfficient/cloud/infer.py +++ b/QEfficient/cloud/infer.py @@ -102,7 +102,7 @@ def main( batch_size=batch_size, mos=mos, mxint8_kv_cache=mxint8, - num_devices=(0 if device_group is None else len(device_group)), + num_devices = (0 if device_group is None else len(device_group)), full_batch_size=full_batch_size, allow_mxint8_mdp_io=allow_mxint8_mdp_io, enable_qnn=enable_qnn,