7 changes: 2 additions & 5 deletions tools/who_what_benchmark/examples/openvino_batched_eval.py
@@ -16,17 +16,14 @@

from openvino_tokenizers import convert_tokenizer
from openvino import serialize
from transformers import AutoTokenizer
from transformers import AutoTokenizer, AutoConfig

model_id = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
MAX_NEW_TOKENS = 128
SEQS_PER_REQUEST = 5
MAX_SEQUENCES = 100


model = OVModelForCausalLM.from_pretrained(
model_id, export=True, trust_remote_code=True
)
model = OVModelForCausalLM.from_pretrained(model_id, export=True)
tokenizer = AutoTokenizer.from_pretrained(model_id)
model_path = PosixPath(tempfile.gettempdir()) / model_id
model.save_pretrained(model_path)
69 changes: 42 additions & 27 deletions tools/who_what_benchmark/whowhatbench/model_loaders.py
@@ -22,13 +22,16 @@ def __init__(self, model, model_dir, model_type):

if model_type == "text" or model_type == "visual-text":
try:
self.config = AutoConfig.from_pretrained(model_dir, trust_remote_code=True)
except Exception:
self.config = AutoConfig.from_pretrained(model_dir)
except Exception:
self.config = AutoConfig.from_pretrained(model_dir, trust_remote_code=True)
elif model_type == "text-to-image":
from diffusers import DiffusionPipeline
self.config = DiffusionPipeline.load_config(
model_dir, trust_remote_code=True)
try:
self.config = DiffusionPipeline.load_config(model_dir)
except Exception:
self.config = DiffusionPipeline.load_config(model_dir, trust_remote_code=True)


def __getattr__(self, attr):
if attr in self.__dict__:
@@ -89,7 +92,12 @@ def load_text_hf_pipeline(model_id, device):
model_kwargs = {}

if not torch.cuda.is_available() or device.lower() == "cpu":
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = False
try:
config = AutoConfig.from_pretrained(model_id)
except Exception:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = True
is_gptq = False
is_awq = False
if getattr(config, "quantization_config", None):
@@ -99,13 +107,19 @@
# infer in FP32
model_kwargs["torch_dtype"] = torch.float32
with mock_torch_cuda_is_available(is_gptq or is_awq):
model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True, device_map="cpu", **model_kwargs)
model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=trust_remote_code, device_map="cpu", **model_kwargs)
if is_awq:
model.is_awq = is_awq
else:
model = AutoModelForCausalLM.from_pretrained(
model_id, trust_remote_code=True, device_map=device.lower(), **model_kwargs
)
try:
model = AutoModelForCausalLM.from_pretrained(
model_id, trust_remote_code=False, device_map=device.lower(), **model_kwargs
)
except Exception:
model = AutoModelForCausalLM.from_pretrained(
model_id, trust_remote_code=True, device_map=device.lower(), **model_kwargs
)

model.eval()
return model

@@ -126,7 +140,7 @@ def load_text_model(
from optimum.intel.openvino import OVModelForCausalLM
try:
model = OVModelForCausalLM.from_pretrained(
model_id, trust_remote_code=True, device=device, ov_config=ov_config
model_id, device=device, ov_config=ov_config
)
except Exception:
try:
@@ -177,23 +191,22 @@ def load_text2image_model(
elif use_hf:
from diffusers import DiffusionPipeline
logger.info("Using HF Transformers API")
model = DiffusionPipeline.from_pretrained(
model_id, trust_remote_code=True)
try:
model = DiffusionPipeline.from_pretrained(model_id)
except Exception:
model = DiffusionPipeline.from_pretrained(model_id, trust_remote_code=True)
else:
logger.info("Using Optimum API")
from optimum.intel import OVPipelineForText2Image
TEXT2IMAGEPipeline = OVPipelineForText2Image

try:
model = TEXT2IMAGEPipeline.from_pretrained(
model_id, trust_remote_code=True, device=device, ov_config=ov_config, safety_checker=None,
model_id, device=device, ov_config=ov_config, safety_checker=None,
)
except ValueError:
config = AutoConfig.from_pretrained(
model_id, trust_remote_code=True)
model = TEXT2IMAGEPipeline.from_pretrained(
model_id,
config=config,
trust_remote_code=True,
use_cache=True,
device=device,
@@ -223,19 +236,25 @@
):
if use_hf:
logger.info("Using HF Transformers API")
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = False
try:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=False)
except Exception:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = True

try:
model = AutoModelForVision2Seq.from_pretrained(
model_id, trust_remote_code=True, device_map=device.lower()
model_id, trust_remote_code=trust_remote_code, device_map=device.lower()
)
except ValueError:
try:
model = AutoModel.from_pretrained(
model_id, trust_remote_code=True, device_map=device.lower()
model_id, trust_remote_code=trust_remote_code, device_map=device.lower()
)
except ValueError:
model = AutoModelForCausalLM.from_pretrained(
model_id, trust_remote_code=True, device_map=device.lower(), _attn_implementation="eager", use_flash_attention_2=False
model_id, trust_remote_code=trust_remote_code, device_map=device.lower(), _attn_implementation="eager", use_flash_attention_2=False
)
model.eval()
try:
@@ -255,7 +274,7 @@ def load_visual_text_model(
from optimum.intel.openvino import OVModelForVisualCausalLM
try:
model = OVModelForVisualCausalLM.from_pretrained(
model_id, trust_remote_code=True, device=device, ov_config=ov_config
model_id, device=device, ov_config=ov_config
)
except ValueError:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
@@ -301,13 +320,11 @@ def load_imagetext2image_model(
from optimum.intel.openvino import OVPipelineForImage2Image
try:
model = OVPipelineForImage2Image.from_pretrained(
model_id, trust_remote_code=True, device=device, ov_config=ov_config, safety_checker=None,
model_id, device=device, ov_config=ov_config, safety_checker=None,
)
except ValueError:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
Comment from the PR author:

@andreyanufr I do not know if this code branch can be reached at all for diffusers models, but loading the config this way does not work for diffusion models:

>>> from transformers import AutoConfig
>>> config = AutoConfig.from_pretrained("stable-diffusion-v1-5/stable-diffusion-v1-5", trust_remote_code=True)

transformers/models/auto/configuration_auto.py", line 1151, in from_pretrained
    raise ValueError(
ValueError: Unrecognized model in stable-diffusion-v1-5/stable-diffusion-v1-5. Should have a `model_type` key in its config.json

That is why I removed this line.
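
For reference, a minimal sketch of the diffusers-native way to read such a config (the same `DiffusionPipeline.load_config` call this PR now uses in model_loaders.py; the model id is only an example):

>>> from diffusers import DiffusionPipeline
>>> # load_config reads the pipeline-level model_index.json, which has no `model_type` key
>>> config = DiffusionPipeline.load_config("stable-diffusion-v1-5/stable-diffusion-v1-5")
>>> config["_class_name"]
'StableDiffusionPipeline'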

model = OVPipelineForImage2Image.from_pretrained(
model_id,
config=config,
trust_remote_code=True,
use_cache=True,
device=device,
@@ -348,14 +365,12 @@ def load_inpainting_model(
from optimum.intel.openvino import OVPipelineForInpainting
try:
model = OVPipelineForInpainting.from_pretrained(
model_id, trust_remote_code=True, device=device, ov_config=ov_config, safety_checker=None,
model_id, device=device, ov_config=ov_config, safety_checker=None,
)
except ValueError as e:
logger.error("Failed to load inpaiting pipeline. Details:\n", e)
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
model = OVPipelineForInpainting.from_pretrained(
model_id,
config=config,
trust_remote_code=True,
use_cache=True,
device=device,
10 changes: 8 additions & 2 deletions tools/who_what_benchmark/whowhatbench/whowhat_metrics.py
@@ -110,12 +110,18 @@ def evaluate_divergency(tokenizer, data_gold, data_prediction):

class TextSimilarity:
def __init__(self, model_id) -> None:
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = False
try:
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=False)
except Exception:
trust_remote_code = True
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)

if hasattr(tokenizer, "pad_token") and tokenizer.pad_token:
pad_token = tokenizer.pad_token
else:
pad_token = tokenizer.eos_token
self.model = SentenceTransformer(model_id, tokenizer_kwargs={"pad_token": pad_token}, trust_remote_code=True)
self.model = SentenceTransformer(model_id, tokenizer_kwargs={"pad_token": pad_token}, trust_remote_code=trust_remote_code)

def evaluate(self, gt, prediction):
return evaluate_similarity(self.model, gt, prediction)
43 changes: 33 additions & 10 deletions tools/who_what_benchmark/whowhatbench/wwb.py
@@ -212,17 +212,33 @@ def load_tokenizer(args):
from llama_cpp.llama_tokenizer import LlamaHFTokenizer
tokenizer = LlamaHFTokenizer.from_pretrained(args.tokenizer)
else:
try:
tokenizer = AutoTokenizer.from_pretrained(
args.tokenizer, trust_remote_code=False
)
except Exception:
tokenizer = AutoTokenizer.from_pretrained(
args.tokenizer, trust_remote_code=True
)
elif args.base_model is not None:
try:
tokenizer = AutoTokenizer.from_pretrained(
args.tokenizer, trust_remote_code=True
args.base_model, trust_remote_code=False
)
except Exception:
tokenizer = AutoTokenizer.from_pretrained(
args.base_model, trust_remote_code=True
)
elif args.base_model is not None:
tokenizer = AutoTokenizer.from_pretrained(
args.base_model, trust_remote_code=True
)
elif args.target_model is not None:
tokenizer = AutoTokenizer.from_pretrained(
args.target_model, trust_remote_code=True
)
try:
tokenizer = AutoTokenizer.from_pretrained(
args.target_model, trust_remote_code=False
)
except Exception:
tokenizer = AutoTokenizer.from_pretrained(
args.target_model, trust_remote_code=True
)


return tokenizer

@@ -232,13 +248,20 @@ def load_processor(args):
if model_id is None:
return None, None

config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = False
try:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=False)
except Exception:
config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)
trust_remote_code = True
if "llava-qwen" in config.model_type:
preprocessor_id = config.mm_vision_tower
else:
preprocessor_id = model_id

return AutoProcessor.from_pretrained(preprocessor_id, trust_remote_code=True), config
preprocessor = AutoProcessor.from_pretrained(preprocessor_id, trust_remote_code=trust_remote_code)

return preprocessor, config


def diff_strings(a: str, b: str, *, use_loguru_colors: bool = False) -> str: