
Commit 16c984e

fix(langchain-classic): fix init_chat_model for HuggingFace models (#33943)
1 parent: 13dd115
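
This commit makes init_chat_model usable with HuggingFace models. In practice it targets calls like the following, adapted from the new unit test added below (before the fix, such a call could fail with a ValidationError about ChatHuggingFace's missing llm field):

    from langchain.chat_models.base import init_chat_model

    # Generation kwargs such as temperature and max_tokens are now routed into
    # HuggingFacePipeline's pipeline_kwargs (max_tokens becomes max_new_tokens),
    # and "text-generation" is used as the default task.
    llm = init_chat_model(
        model="microsoft/Phi-3-mini-4k-instruct",
        model_provider="huggingface",
        temperature=0,
        max_tokens=1024,
    )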

4 files changed: +163 −26 lines changed

libs/partners/huggingface/langchain_huggingface/chat_models/huggingface.py

Lines changed: 47 additions & 1 deletion
@@ -627,8 +627,54 @@ def from_model_id(
                 HuggingFacePipeline,
             )
 
+            task = task if task is not None else "text-generation"
+
+            # Separate pipeline-specific kwargs from ChatHuggingFace kwargs
+            # Parameters that should go to HuggingFacePipeline.from_model_id
+            pipeline_specific_kwargs = {}
+
+            # Extract pipeline-specific parameters
+            pipeline_keys = [
+                "backend",
+                "device",
+                "device_map",
+                "model_kwargs",
+                "pipeline_kwargs",
+                "batch_size",
+            ]
+            for key in pipeline_keys:
+                if key in kwargs:
+                    pipeline_specific_kwargs[key] = kwargs.pop(key)
+
+            # Remaining kwargs (temperature, max_tokens, etc.) should go to
+            # pipeline_kwargs for generation parameters, which ChatHuggingFace
+            # will inherit from the LLM
+            if "pipeline_kwargs" not in pipeline_specific_kwargs:
+                pipeline_specific_kwargs["pipeline_kwargs"] = {}
+
+            # Add generation parameters to pipeline_kwargs
+            # Map max_tokens to max_new_tokens for HuggingFace pipeline
+            generation_params = {}
+            for k, v in list(kwargs.items()):
+                if k == "max_tokens":
+                    generation_params["max_new_tokens"] = v
+                    kwargs.pop(k)
+                elif k in (
+                    "temperature",
+                    "max_new_tokens",
+                    "top_p",
+                    "top_k",
+                    "repetition_penalty",
+                    "do_sample",
+                ):
+                    generation_params[k] = v
+                    kwargs.pop(k)
+
+            pipeline_specific_kwargs["pipeline_kwargs"].update(generation_params)
+
+            # Create the HuggingFacePipeline
             llm = HuggingFacePipeline.from_model_id(
-                model_id=model_id, task=cast(str, task), **kwargs
+                model_id=model_id, task=task, **pipeline_specific_kwargs
             )
         elif backend == "endpoint":
             from langchain_huggingface.llms.huggingface_endpoint import (
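
For reference, here is a minimal standalone sketch of the kwargs split this hunk performs. The split_kwargs helper and the sample values are illustrative only, not part of langchain_huggingface; the kwargs left over after the split are presumably passed on to ChatHuggingFace itself.

    # Hypothetical helper mirroring the split performed inside from_model_id.
    def split_kwargs(kwargs: dict) -> tuple[dict, dict]:
        pipeline_keys = [
            "backend", "device", "device_map",
            "model_kwargs", "pipeline_kwargs", "batch_size",
        ]
        # Keys destined for HuggingFacePipeline.from_model_id
        pipeline_specific = {k: kwargs.pop(k) for k in pipeline_keys if k in kwargs}
        pipeline_specific.setdefault("pipeline_kwargs", {})

        # Generation parameters are folded into pipeline_kwargs;
        # max_tokens is renamed to the HF-native max_new_tokens.
        generation = {}
        if "max_tokens" in kwargs:
            generation["max_new_tokens"] = kwargs.pop("max_tokens")
        for k in ("temperature", "max_new_tokens", "top_p", "top_k",
                  "repetition_penalty", "do_sample"):
            if k in kwargs:
                generation[k] = kwargs.pop(k)
        pipeline_specific["pipeline_kwargs"].update(generation)
        return pipeline_specific, kwargs

    pipeline_specific, remaining = split_kwargs(
        {"device_map": "auto", "temperature": 0, "max_tokens": 1024, "verbose": True}
    )
    assert pipeline_specific == {
        "device_map": "auto",
        "pipeline_kwargs": {"max_new_tokens": 1024, "temperature": 0},
    }
    assert remaining == {"verbose": True}  # left in kwargs for ChatHuggingFace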

libs/partners/huggingface/pyproject.toml

Lines changed: 2 additions & 0 deletions
@@ -46,6 +46,7 @@ test = [
     "langchain-core",
     "langchain-tests",
     "langchain-community",
+    "langchain",
 ]
 lint = ["ruff>=0.13.1,<0.14.0"]
 dev = [
@@ -61,6 +62,7 @@ typing = [
 [tool.uv.sources]
 langchain-core = { path = "../../core", editable = true }
 langchain-tests = { path = "../../standard-tests", editable = true }
+langchain = { path = "../../langchain_v1", editable = true }
 
 [tool.mypy]
 disallow_untyped_defs = "True"
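
These two additions make the monorepo's local langchain package (langchain_v1) available to this package's test environment; the new unit test below imports init_chat_model from langchain.chat_models.base and would otherwise fail to resolve that dependency.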

libs/partners/huggingface/tests/unit_tests/test_chat_models.py

Lines changed: 52 additions & 0 deletions
@@ -337,3 +337,55 @@ def test_profile() -> None:
         llm=empty_llm,
     )
     assert model.profile
+
+
+def test_init_chat_model_huggingface() -> None:
+    """Test that init_chat_model works with HuggingFace models.
+
+    This test verifies that the fix for issue #28226 works correctly.
+    The issue was that init_chat_model didn't properly handle HuggingFace
+    model initialization, particularly the required 'task' parameter and
+    parameter separation between HuggingFacePipeline and ChatHuggingFace.
+    """
+    from langchain.chat_models.base import init_chat_model
+
+    # Test basic initialization with default task
+    # Note: This test may skip in CI if model download fails, but it verifies
+    # that the initialization code path works correctly
+    try:
+        llm = init_chat_model(
+            model="microsoft/Phi-3-mini-4k-instruct",
+            model_provider="huggingface",
+            temperature=0,
+            max_tokens=1024,
+        )
+
+        # Verify that ChatHuggingFace was created successfully
+        assert llm is not None
+        from langchain_huggingface import ChatHuggingFace
+
+        assert isinstance(llm, ChatHuggingFace)
+
+        # Verify that the llm attribute is set (this was the bug - it was missing)
+        assert hasattr(llm, "llm")
+        assert llm.llm is not None
+
+        # Test with explicit task parameter
+        llm2 = init_chat_model(
+            model="microsoft/Phi-3-mini-4k-instruct",
+            model_provider="huggingface",
+            task="text-generation",
+            temperature=0.5,
+        )
+        assert isinstance(llm2, ChatHuggingFace)
+        assert llm2.llm is not None
+    except (
+        ImportError,
+        OSError,
+        RuntimeError,
+        ValueError,
+    ) as e:
+        # If model download fails in CI, skip the test rather than failing
+        # The important part is that the code path doesn't raise ValidationError
+        # about missing 'llm' field, which was the original bug
+        pytest.skip(f"Skipping test due to model download/initialization error: {e}")

libs/partners/huggingface/uv.lock

Lines changed: 62 additions & 25 deletions
Some generated files are not rendered by default.
