Specifically, if I upgrade transformers, I run into the following error:
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/transformers/models/auto/auto_factory.py", line 604, in from_pretrained
return model_class.from_pretrained(
^^^^^^^^^^^^^^^
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/transformers/modeling_utils.py", line 277, in _wrapper
return func(*args, **kwargs)
^^^^^^^^^^^^^^^
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/transformers/modeling_utils.py", line 4971, in from_pretrained
model = cls(config, *model_args, **model_kwargs)
^^^^^^^^^^^^^^^
TypeError: GptOssForCausalLM.__init__() got an unexpected keyword argument 'enable_prefix_caching'
And then, if I upgrade unsloth and torch, I run into the following error:
File "/home/hackathon/.local/share/uv/python/cpython-3.12.12-linux-x86_64-gnu/lib/python3.12/importlib/__init__.py", line 90, in import_module
return _bootstrap._gcd_import(name[level:], package, level)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/engine/arg_utils.py", line 24, in <module>
from vllm.config import (BlockSize, CacheConfig, CacheDType, CompilationConfig,
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/config.py", line 35, in <module>
from vllm.model_executor.layers.quantization import QuantizationMethods
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/model_executor/__init__.py", line 4, in <module>
from vllm.model_executor.parameter import (BasevLLMParameter,
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/model_executor/parameter.py", line 10, in <module>
from vllm.distributed import get_tensor_model_parallel_rank
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/distributed/__init__.py", line 4, in <module>
from .communication_op import *
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/distributed/communication_op.py", line 9, in <module>
from .parallel_state import get_tp_group
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/distributed/parallel_state.py", line 150, in <module>
from vllm.platforms import current_platform
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/platforms/__init__.py", line 267, in __getattr__
_current_platform = resolve_obj_by_qualname(
^^^^^^^^^^^^^^^^^^^^^^^^
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/utils/__init__.py", line 2539, in resolve_obj_by_qualname
module = importlib.import_module(module_name)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/home/hackathon/.local/share/uv/python/cpython-3.12.12-linux-x86_64-gnu/lib/python3.12/importlib/__init__.py", line 90, in import_module
return _bootstrap._gcd_import(name[level:], package, level)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/platforms/cuda.py", line 18, in <module>
import vllm._C # noqa
^^^^^^^^^^^^^^
ImportError: /home/hackathon/grpo-art-basic/.venv/lib/python3.12/site-packages/vllm/_C.abi3.so: undefined symbol: _ZNK3c106SymInt6sym_neERKS0_