Mirror of https://github.com/pese-git/llm-arch-research.git, synced 2026-01-23 21:10:54 +00:00
fix(hf-integration): handle logits as tuple in hf_adapter, convert torch.Tensor to list in hf_tokenizer.decode for decoding compatibility
@@ -99,7 +99,11 @@ class HFGPTAdapter(PreTrainedModel):
         return_dict = return_dict if return_dict is not None else self.config.use_return_dict
 
         # Main forward pass
-        logits = self.llm_model(input_ids)
+        outputs = self.llm_model(input_ids)
+        if isinstance(outputs, tuple):
+            logits = outputs[0]
+        else:
+            logits = outputs
 
         loss = None
         if labels is not None:
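This guard makes the adapter agnostic to whether the wrapped model's forward returns a bare logits tensor or a tuple such as (logits, cache). A minimal standalone sketch of the same pattern, with ToyModel standing in for self.llm_model (the toy class and the vocabulary size are illustrative, not from the repo):

import torch

class ToyModel:
    # Stand-in for self.llm_model: returns (logits, cache) as a tuple.
    def __call__(self, input_ids):
        batch, seq = input_ids.shape
        return torch.randn(batch, seq, 50257), None

model = ToyModel()
input_ids = torch.zeros(1, 4, dtype=torch.long)

outputs = model(input_ids)
# Unpack uniformly: take element 0 of a tuple, or the tensor itself.
logits = outputs[0] if isinstance(outputs, tuple) else outputs
print(logits.shape)  # torch.Size([1, 4, 50257])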
@@ -56,10 +56,24 @@ class HFTokenizerAdapter:
         add_special_tokens = kwargs.get('add_special_tokens', True)
 
         # Encode the text
-        input_ids = self.llm_tokenizer.encode(
-            text,
-            add_special_tokens=add_special_tokens
-        )
+        #input_ids = self.llm_tokenizer.encode(
+        #    text,
+        #    add_special_tokens=add_special_tokens
+        #)
+        if isinstance(text, str):
+            input_ids = self.llm_tokenizer.encode(
+                text,
+                add_special_tokens=add_special_tokens
+            )
+            input_ids = [input_ids]  # <-- wrap the single sequence in a batch
+        else:
+            # List of strings: batch mode!
+            input_ids = [
+                self.llm_tokenizer.encode(
+                    t,
+                    add_special_tokens=add_special_tokens
+                ) for t in text
+            ]
 
         # Apply truncation
         if truncation and max_length is not None and len(input_ids) > max_length:
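After this change input_ids is always a list of per-sequence id lists, so the unchanged truncation check above compares len(input_ids), which is now the batch size, against max_length rather than any sequence length. A sketch of the same str/list dispatch with truncation applied per sequence instead; the helper name encode_batch and its signature are illustrative, and the per-sequence truncation is a suggested follow-up, not part of this commit:

from typing import List, Optional, Union

def encode_batch(tokenizer, text: Union[str, List[str]],
                 add_special_tokens: bool = True,
                 truncation: bool = False,
                 max_length: Optional[int] = None) -> List[List[int]]:
    # Normalize input: a single string becomes a one-element batch.
    texts = [text] if isinstance(text, str) else text
    input_ids = [
        tokenizer.encode(t, add_special_tokens=add_special_tokens)
        for t in texts
    ]
    if truncation and max_length is not None:
        # Truncate each sequence, not the batch dimension.
        input_ids = [ids[:max_length] for ids in input_ids]
    return input_ids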
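The decode-side fix named in the commit message (converting torch.Tensor to list in hf_tokenizer.decode) is not shown in this excerpt. A minimal sketch of the idea, assuming decode may receive either a torch.Tensor of ids or a plain Python list; the helper name decode_ids is illustrative, not the repo's code:

import torch

def decode_ids(tokenizer, token_ids):
    # Underlying tokenizers often expect plain lists, not tensors.
    if isinstance(token_ids, torch.Tensor):
        token_ids = token_ids.tolist()
    return tokenizer.decode(token_ids)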