diff --git a/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_paddleocr_vl.py b/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_paddleocr_vl.py index ab5a9cd87e..f7f4cac5c0 100644 --- a/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_paddleocr_vl.py +++ b/paddlex/inference/models/doc_vlm/modeling/paddleocr_vl/_paddleocr_vl.py @@ -65,9 +65,6 @@ class PaddleOCRVLForConditionalGeneration(Ernie4_5PretrainedModel): _tied_weights_keys = ["lm_head.weight"] config_class = PaddleOCRVLConfig _no_split_modules = ["Ernie4_5DecoderLayer", "SiglipEncoderLayer"] - # Keep visual encoder in fp32 for ROCm stability (MIOpen bf16 conv has bugs) - # This also improves precision for vision processing - _keep_in_fp32_modules = ["visual", "mlp_AR"] base_model_prefix = "" def __init__(self, config): diff --git a/paddlex/inference/models/runners/paddle_static/runner.py b/paddlex/inference/models/runners/paddle_static/runner.py index 894feb3b12..9f84c4aac9 100644 --- a/paddlex/inference/models/runners/paddle_static/runner.py +++ b/paddlex/inference/models/runners/paddle_static/runner.py @@ -403,9 +403,6 @@ def _create(self): config.set_optimization_level(3) if self._model_name == "PP-DocLayoutV3": config.delete_pass("matmul_add_act_fuse_pass") - if paddle.is_compiled_with_rocm(): - config.delete_pass("conv2d_add_act_fuse_pass") - config.delete_pass("conv2d_add_fuse_pass") elif self._config["device_type"] == "npu": config.enable_custom_device("npu", self._config.get("device_id", 0)) if hasattr(config, "enable_new_ir"): @@ -459,9 +456,6 @@ def _create(self): config.disable_mkldnn() if hasattr(config, "enable_new_executor"): config.enable_new_executor() - if paddle.is_compiled_with_rocm(): - config.delete_pass("conv2d_add_act_fuse_pass") - config.delete_pass("conv2d_add_fuse_pass") elif self._config["device_type"] == "iluvatar_gpu": config.enable_custom_device( "iluvatar_gpu", int(self._config.get("device_id", 0)) @@ -493,18 +487,12 @@ def _create(self): if hasattr(config, "enable_new_executor"): config.enable_new_executor() config.set_optimization_level(3) - if paddle.is_compiled_with_rocm(): - config.delete_pass("conv2d_add_act_fuse_pass") - config.delete_pass("conv2d_add_fuse_pass") config.enable_memory_optim() for del_p in self._config.get("delete_pass", []): config.delete_pass(del_p) if not DEBUG: config.disable_glog_info() - if paddle.is_compiled_with_rocm(): - config.delete_pass("conv2d_add_act_fuse_pass") - config.delete_pass("conv2d_add_fuse_pass") predictor = paddle_inference.create_predictor(config)