@@ -49,6 +49,8 @@ def get_env_device():
         return "gcu"
     elif "intel_hpu" in paddle.device.get_all_custom_device_type():
         return "intel_hpu"
+    elif "iluvatar_gpu" in paddle.device.get_all_custom_device_type():
+        return "iluvatar_gpu"
     elif paddle.is_compiled_with_rocm():
         return "rocm"
     elif paddle.is_compiled_with_xpu():
@@ -61,7 +63,7 @@ def get_env_device():
 except ImportError:
     fused_rotary_position_embedding = None
 try:
-    if get_env_device() in ["npu", "mlu", "gcu"]:
+    if get_env_device() in ["npu", "mlu", "gcu", "iluvatar_gpu"]:
         from paddle.base import core
 
         for lib in os.listdir(os.getenv("CUSTOM_DEVICE_ROOT")):
@@ -84,7 +86,7 @@ def fusion_rope(
     rotary_emb,
     context_parallel_degree=-1,
 ):
-    if get_env_device() not in ["gcu", "intel_hpu"]:
+    if get_env_device() not in ["gcu", "intel_hpu", "iluvatar_gpu"]:
         assert past_key_value is None, "fuse rotary not support cache kv for now"
     batch_size, seq_length, num_heads, head_dim = query_states.shape
     _, kv_seq_len, num_key_value_heads, _ = key_states.shape
@@ -93,7 +95,7 @@ def fusion_rope(
             get_env_device() == "gpu"
         ), "context parallel only support cuda device for now"
         kv_seq_len *= context_parallel_degree
-    if get_env_device() not in ["gcu", "intel_hpu"]:
+    if get_env_device() not in ["gcu", "intel_hpu", "iluvatar_gpu"]:
         cos, sin = rotary_emb(value_states, seq_len=kv_seq_len)
     if get_env_device() == "npu":
         query_states = core.eager._run_custom_op("fused_rope", query_states, cos, sin)[
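
For reference, a minimal standalone sketch of the device-detection logic this change extends. It is not part of the diff: the surrounding branches are paraphrased from the file above, and whether "iluvatar_gpu" actually appears depends on the installed PaddleCustomDevice plugin.

```python
import paddle

def get_env_device_sketch():
    # Custom device plugins register their type names with Paddle; the PR adds
    # "iluvatar_gpu" to the recognized names so the fused rotary-embedding
    # paths above can branch on it like they already do for npu/mlu/gcu.
    custom_types = paddle.device.get_all_custom_device_type()
    if "iluvatar_gpu" in custom_types:
        return "iluvatar_gpu"
    if paddle.is_compiled_with_rocm():
        return "rocm"
    if paddle.is_compiled_with_xpu():
        return "xpu"
    return "gpu" if paddle.is_compiled_with_cuda() else "cpu"

print(get_env_device_sketch())  # e.g. "iluvatar_gpu" when the Iluvatar plugin is installed
```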