From dee92a88b6c3d2d0d31fe7f9c7c105296fe65077 Mon Sep 17 00:00:00 2001
From: Jingyuan-zhu
Date: Tue, 10 Feb 2026 06:20:25 +0000
Subject: [PATCH 1/2] refactor: improve environment and dependency compatibility

- Restore Python 3.9 support by replacing PEP 604 union types with typing.Union
- Decouple the sglang dependency via lazy loading in AutoPipeline
- Fix ImportError by handling the removal of the telemetry API in transformers >=4.41
---
 src/lmflow/pipeline/auto_pipeline.py | 10 +++++++---
 src/lmflow/pipeline/finetuner.py | 11 +++++++----
 src/lmflow/utils/protocol.py | 22 +++++++++++-----------
 src/lmflow/utils/versioning.py | 4 ++--
 4 files changed, 27 insertions(+), 20 deletions(-)

diff --git a/src/lmflow/pipeline/auto_pipeline.py b/src/lmflow/pipeline/auto_pipeline.py
index e55e74102..a7ab2dd3e 100644
--- a/src/lmflow/pipeline/auto_pipeline.py
+++ b/src/lmflow/pipeline/auto_pipeline.py
@@ -4,21 +4,25 @@
 from lmflow.pipeline.evaluator import Evaluator
 from lmflow.pipeline.finetuner import Finetuner
 from lmflow.pipeline.inferencer import Inferencer
-from lmflow.pipeline.sglang_inferencer import SGLangInferencer
 from lmflow.pipeline.rm_inferencer import RewardModelInferencer
 from lmflow.pipeline.rm_tuner import RewardModelTuner
-from lmflow.utils.versioning import is_package_version_at_least, is_ray_available, is_trl_available, is_vllm_available
+from lmflow.utils.versioning import is_package_version_at_least, is_ray_available, is_sglang_available, is_trl_available, is_vllm_available
 
 PIPELINE_MAPPING = {
     "evaluator": Evaluator,
     "finetuner": Finetuner,
     "inferencer": Inferencer,
-    "sglang_inferencer": SGLangInferencer,
     "rm_inferencer": RewardModelInferencer,
     "rm_tuner": RewardModelTuner,
 }
 
 PIPELINE_NEEDS_EXTRAS = []
 
+if is_sglang_available():
+    from lmflow.pipeline.sglang_inferencer import SGLangInferencer
+    PIPELINE_MAPPING["sglang_inferencer"] = SGLangInferencer
+else:
+    PIPELINE_NEEDS_EXTRAS.append("sglang_inferencer")
+
 if not is_package_version_at_least("transformers", "4.35.0"):
     from lmflow.pipeline.raft_aligner import RaftAligner
 
diff --git a/src/lmflow/pipeline/finetuner.py b/src/lmflow/pipeline/finetuner.py
index 6be4611c1..a4ff2c25c 100644
--- a/src/lmflow/pipeline/finetuner.py
+++ b/src/lmflow/pipeline/finetuner.py
@@ -17,9 +17,11 @@
     set_seed,
 )
 from transformers.trainer_utils import get_last_checkpoint
-from transformers.utils import (
-    send_example_telemetry,
-)
+
+try:
+    from transformers.utils import send_example_telemetry
+except ImportError:
+    send_example_telemetry = None
 
 from lmflow.args import DatasetArguments, FinetunerArguments, ModelArguments
 from lmflow.datasets.dataset import Dataset
@@ -73,7 +75,8 @@ def __init__(
         # Sending telemetry. Tracking the example usage helps us better
         # allocate resources to maintain them. The information sent is the one
         # passed as arguments along with your Python/PyTorch versions.
-        send_example_telemetry("run_clm", model_args, data_args)
+        if send_example_telemetry is not None:
+            send_example_telemetry("run_clm", model_args, data_args)
 
         # Setup logging
         logging.basicConfig(
diff --git a/src/lmflow/utils/protocol.py b/src/lmflow/utils/protocol.py
index c8779df2d..41ed217a6 100644
--- a/src/lmflow/utils/protocol.py
+++ b/src/lmflow/utils/protocol.py
@@ -10,7 +10,7 @@
 import math
 import pickle
 from dataclasses import dataclass, field
-from typing import Any, Optional
+from typing import Any, Dict, List, Optional, Set, Union
 
 import numpy as np
 import tensordict
@@ -65,7 +65,7 @@ def union_tensor_dict(tensor_dict1: TensorDict, tensor_dict2: TensorDict) -> Ten
     return tensor_dict1
 
 
-def _array_equal(array1: np.ndarray, array2: np.ndarray, visited: set[int]) -> bool:
+def _array_equal(array1: np.ndarray, array2: np.ndarray, visited: Set[int]) -> bool:
     """
     Recursively compares two NumPy arrays for strict equality, with special
     handling for object-dtype arrays, NaN values, and circular references.
@@ -92,7 +92,7 @@ def _array_equal(array1: np.ndarray, array2: np.ndarray, visited: set[int]) -> b
     return all(_deep_equal(x, y, visited) for x, y in zip(array1.flat, array2.flat, strict=False))
 
 
-def _deep_equal(a: Any, b: Any, visited: set[int]) -> bool:
+def _deep_equal(a: Any, b: Any, visited: Set[int]) -> bool:
     """
     Recursively performs a deep comparison between two Python objects.
     - Handles NaN values correctly (NaN == NaN evaluates to True).
@@ -128,7 +128,7 @@ def _deep_equal(a: Any, b: Any, visited: set[int]) -> bool:
     return result
 
 
-def union_numpy_dict(tensor_dict1: dict[str, np.ndarray], tensor_dict2: dict[str, np.ndarray]) -> dict[str, np.ndarray]:
+def union_numpy_dict(tensor_dict1: Dict[str, np.ndarray], tensor_dict2: Dict[str, np.ndarray]) -> Dict[str, np.ndarray]:
     for key, val in tensor_dict2.items():
         if key in tensor_dict1:
             assert isinstance(tensor_dict2[key], np.ndarray)
@@ -142,7 +142,7 @@ def union_numpy_dict(tensor_dict1: dict[str, np.ndarray], tensor_dict2: dict[str
     return tensor_dict1
 
 
-def list_of_dict_to_dict_of_list(list_of_dict: list[dict]):
+def list_of_dict_to_dict_of_list(list_of_dict: List[dict]):
     if len(list_of_dict) == 0:
         return {}
     keys = list_of_dict[0].keys()
@@ -154,7 +154,7 @@ def list_of_dict_to_dict_of_list(list_of_dict: list[dict]):
     return output
 
 
-def collate_fn(x: list["DataProtoItem"]):
+def collate_fn(x: List["DataProtoItem"]):
     batch = []
     non_tensor_batch = []
     for data in x:
@@ -167,7 +167,7 @@ def collate_fn(x: list["DataProtoItem"]):
     return DataProto(batch=batch, non_tensor_batch=non_tensor_batch)
 
 
-def get_tensordict(tensor_dict: dict[str, torch.Tensor | list], non_tensor_dict: dict = None) -> TensorDict:
+def get_tensordict(tensor_dict: Dict[str, Union[torch.Tensor, list]], non_tensor_dict: dict = None) -> TensorDict:
     """Create a TensorDict from tensors and non-tensor data.
 
     Automatically handles nested structures in lists by converting them to NonTensorStack.
@@ -223,7 +223,7 @@ def get_tensordict(tensor_dict: dict[str, torch.Tensor | list], non_tensor_dict:
 
     # Convert to NonTensorStack to handle nested structures
     tensor_dict[key] = NonTensorStack.from_list([NonTensorData(item) for item in val])
 
-    assert isinstance(val, torch.Tensor | list)
+    assert isinstance(val, (torch.Tensor, list))
 
     if batch_size is None:
         batch_size = val.size(0) if isinstance(val, torch.Tensor) else len(val)
@@ -300,11 +300,11 @@ def __getitem__(self, item):
             return self.slice(item.start, item.stop, item.step)
 
         # Case 2: List, numpy array, or torch tensor - use sel_idxs
-        elif isinstance(item, list | np.ndarray | torch.Tensor):
+        elif isinstance(item, (list, np.ndarray, torch.Tensor)):
             return self.select_idxs(item)
 
         # Case 3: Single integer - return DataProtoItem for backward compatibility
-        elif isinstance(item, int | np.integer):
+        elif isinstance(item, (int, np.integer)):
             tensor_data = self.batch[item] if self.batch is not None else None
             non_tensor_data = {key: val[item] for key, val in self.non_tensor_batch.items()}
             return DataProtoItem(batch=tensor_data, non_tensor_batch=non_tensor_data, meta_info=self.meta_info)
@@ -387,7 +387,7 @@ def check_consistency(self):
         )
 
     @classmethod
-    def from_single_dict(cls, data: dict[str, torch.Tensor | np.ndarray], meta_info=None):
+    def from_single_dict(cls, data: Dict[str, Union[torch.Tensor, np.ndarray]], meta_info=None):
         """Create a DataProto from a dict of tensors and non_tensors"""
         tensors = {}
         non_tensors = {}
diff --git a/src/lmflow/utils/versioning.py b/src/lmflow/utils/versioning.py
index 0b52798fd..05d56bc96 100644
--- a/src/lmflow/utils/versioning.py
+++ b/src/lmflow/utils/versioning.py
@@ -2,7 +2,7 @@
 import logging
 import sys
 from pathlib import Path
-from typing import Union
+from typing import Union, List, Tuple
 
 import pkg_resources
 
@@ -29,7 +29,7 @@ def _is_package_available(package_name: str, skippable: bool = False):
     raise e
 
 
-def _is_packages_available(packages: Union[list[str], list[tuple[str, bool]]]):
+def _is_packages_available(packages: Union[List[str], List[Tuple[str, bool]]]):
     if isinstance(packages[0], str):
         return all([_is_package_available(package) for package in packages])
     elif isinstance(packages[0], tuple):

From 3194ac7e0cf7a5ae1889cbd1403a78f47e1731d7 Mon Sep 17 00:00:00 2001
From: Jingyuan-zhu
Date: Wed, 11 Feb 2026 03:31:13 +0000
Subject: [PATCH 2/2] refactor: improve environment and dependency compatibility

- Restore Python 3.9 support by replacing PEP 604 union types with typing.Union.
- Decouple the sglang dependency via lazy loading in AutoPipeline.
- Fix transformers telemetry API compatibility (>=4.41).
- Replace pkg_resources with importlib.metadata in version checks.
- Improve conversation template robustness:
  - Add tokenizer/hf_auto modes.
  - Make the tokenizer mode strict, with a clear error.
  - Give hf_auto a fallback path.
  - Handle assistant masks more safely for chat-template tokenization.
- Handle missing block_size safely in the tokenization flow.
- Add dependency constraints to reduce datasets/pyarrow and transformers drift.
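
Usage sketch for the new conversation_template modes (the entry point and
remaining arguments below are illustrative, not part of this change):

    # Strict: fail with a clear error if the tokenizer ships no chat_template.
    python examples/finetune.py --conversation_template tokenizer ...

    # Permissive: use tokenizer.chat_template when present, otherwise fall
    # back to the LMFlow default ("empty") template.
    python examples/finetune.py --conversation_template hf_auto ...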
---
 src/lmflow/args.py | 10 +++++-
 src/lmflow/models/hf_decoder_model.py | 34 ++++++++++++++++++---
 src/lmflow/tokenization/hf_decoder_model.py | 9 +++++-
 src/lmflow/utils/versioning.py | 9 +++---
 4 files changed, 52 insertions(+), 10 deletions(-)

diff --git a/src/lmflow/args.py b/src/lmflow/args.py
index 5b09c075a..b32d8866a 100644
--- a/src/lmflow/args.py
+++ b/src/lmflow/args.py
@@ -569,7 +569,15 @@ class DatasetArguments:
         default=False, metadata={"help": "Whether to train on prompt for conversation datasets such as ShareGPT."}
     )
     conversation_template: Optional[str] = field(
-        default=None, metadata={"help": "The template for conversation datasets."}
+        default=None,
+        metadata={
+            "help": (
+                "The template for conversation datasets. Supports LMFlow preset names "
+                "(e.g. llama3, qwen2_5, deepseek_v3) and special values "
+                "`tokenizer` / `hf_auto` to use tokenizer.chat_template "
+                "(`tokenizer` is strict; `hf_auto` falls back to LMFlow default when unavailable)."
+            )
+        },
     )
     dataset_cache_dir: Optional[str] = field(
         default=None,
diff --git a/src/lmflow/models/hf_decoder_model.py b/src/lmflow/models/hf_decoder_model.py
index bb899fd04..14b6b4753 100644
--- a/src/lmflow/models/hf_decoder_model.py
+++ b/src/lmflow/models/hf_decoder_model.py
@@ -107,7 +107,7 @@ def tokenize(self, dataset: Dataset, add_special_tokens=True, *args, **kwargs) -
         # Preprocessing the datasets.
         # First we tokenize all the texts.
         if dataset.get_backend() != "huggingface":
-            raise NotImplementedError("tokenization of datasets with non-huggingface backend arenot supported yet")
+            raise NotImplementedError("tokenization of datasets with non-huggingface backend is not supported yet")
         dataset_type = dataset.get_type()
 
         model_args = self.model_args
@@ -116,6 +116,12 @@ def tokenize(self, dataset: Dataset, add_special_tokens=True, *args, **kwargs) -
         column_names = list(hf_raw_datasets.features)
         data_args = raw_datasets.get_data_args()
 
+        if data_args.block_size is None:
+            data_args.block_size = self.tokenizer.model_max_length
+            logger.warning(
+                f"`block_size` is not provided. Using tokenizer.model_max_length={self.tokenizer.model_max_length}."
+            )
+
         # Requires three types of information for tokenizing different datasets
         # 1) Which fields require tokenization, e.g.
         #    "text2float": "text", but not "float"
@@ -137,15 +143,35 @@ def tokenize(self, dataset: Dataset, add_special_tokens=True, *args, **kwargs) -
             add_special_tokens = False
         elif dataset_type == "conversation":
             if data_args.conversation_template:
-                if data_args.conversation_template in PRESET_TEMPLATES.keys():
+                if data_args.conversation_template == "tokenizer":
+                    if getattr(self.tokenizer, "chat_template", None):
+                        conversation_template = self.tokenizer.chat_template
+                    else:
+                        raise NotImplementedError(
+                            "Requested tokenizer chat template, but tokenizer.chat_template is not available."
+                        )
+                elif data_args.conversation_template == "hf_auto":
+                    if getattr(self.tokenizer, "chat_template", None):
+                        conversation_template = self.tokenizer.chat_template
+                    else:
+                        logger.warning(
+                            "Requested `hf_auto`, but tokenizer.chat_template is unavailable. "
+                            "Falling back to LMFlow default template."
+                        )
+                        conversation_template = PRESET_TEMPLATES["empty"]
+                elif data_args.conversation_template in PRESET_TEMPLATES.keys():
                     conversation_template = PRESET_TEMPLATES[data_args.conversation_template]
                 else:
                     raise NotImplementedError(
                         f"Conversation template {data_args.conversation_template} is not supported yet."
                     )
             else:
-                logger.warning("No conversation template provided. Using default template.")
-                conversation_template = PRESET_TEMPLATES["empty"]
+                if getattr(self.tokenizer, "chat_template", None):
+                    logger.warning("No conversation template provided. Using tokenizer.chat_template.")
+                    conversation_template = self.tokenizer.chat_template
+                else:
+                    logger.warning("No conversation template provided. Using default template.")
+                    conversation_template = PRESET_TEMPLATES["empty"]
 
             logger.warning(f"Conversation template: {conversation_template}")
 
         else:
diff --git a/src/lmflow/tokenization/hf_decoder_model.py b/src/lmflow/tokenization/hf_decoder_model.py
index a7104621e..b33bb5cc3 100644
--- a/src/lmflow/tokenization/hf_decoder_model.py
+++ b/src/lmflow/tokenization/hf_decoder_model.py
@@ -142,9 +142,16 @@ def conversation_tokenize_function(
             if data_args.train_on_prompt:
                 labels = encoded_conversation["input_ids"]
             else:
+                assistant_masks = encoded_conversation.get("assistant_masks", None)
+                if assistant_masks is None:
+                    raise RuntimeError(
+                        "Tokenizer chat template path requires `assistant_masks` for label masking when "
+                        "`train_on_prompt=False`. Please upgrade transformers/tokenizer support, "
+                        "or use an LMFlow conversation template."
+                    )
                 labels = [
                     encoded_conversation["input_ids"][index] if mask == 1 else -100
-                    for index, mask in enumerate(encoded_conversation["assistant_masks"])
+                    for index, mask in enumerate(assistant_masks)
                 ]
 
             token_dict["input_ids"][i].extend(encoded_conversation["input_ids"])
diff --git a/src/lmflow/utils/versioning.py b/src/lmflow/utils/versioning.py
index 05d56bc96..c3a3f107d 100644
--- a/src/lmflow/utils/versioning.py
+++ b/src/lmflow/utils/versioning.py
@@ -1,10 +1,11 @@
 import importlib
 import logging
 import sys
+from importlib import metadata
 from pathlib import Path
 from typing import Union, List, Tuple
 
-import pkg_resources
+from packaging.version import Version, InvalidVersion
 
 logger = logging.getLogger(__name__)
 
@@ -40,10 +41,10 @@ def _is_packages_available(packages: Union[List[str], List[Tuple[str, bool]]]):
 
 def is_package_version_at_least(package_name, min_version):
     try:
-        package_version = pkg_resources.get_distribution(package_name).version
-        if pkg_resources.parse_version(package_version) < pkg_resources.parse_version(min_version):
+        package_version = metadata.version(package_name)
+        if Version(package_version) < Version(min_version):
             return False
-    except pkg_resources.DistributionNotFound:
+    except (metadata.PackageNotFoundError, InvalidVersion):
         return False
     return True