- 
                Notifications
    You must be signed in to change notification settings 
- Fork 38
Open
Labels
questionFurther information is requestedFurther information is requested
Description
Question
Hi, I would like to use inseq to get the attribution from Llama3.1-8b-instruct model, but I got the following error when initialising the inseq model:
This is my code:
model = inseq.load_model("meta-llama/Llama-3.1-8B-Instruct", "attention")
out = model.attribute(
    "Hello ladies and",
    generation_args={"max_new_tokens": 128},
    n_steps=500,
    internal_batch_size=50
).show()
ValueError                                Traceback (most recent call last)
Cell In[4], [line 1](vscode-notebook-cell:?execution_count=4&line=1)
----> [1](vscode-notebook-cell:?execution_count=4&line=1) model = inseq.load_model("meta-llama/Llama-3.1-8B-Instruct", "attention")
      [2](vscode-notebook-cell:?execution_count=4&line=2) out = model.attribute(
      [3](vscode-notebook-cell:?execution_count=4&line=3)     "Hello ladies and",
      [4](vscode-notebook-cell:?execution_count=4&line=4)     generation_args={"max_new_tokens": 128},
      [5](vscode-notebook-cell:?execution_count=4&line=5)     n_steps=500,
      [6](vscode-notebook-cell:?execution_count=4&line=6)     internal_batch_size=50
      [7](vscode-notebook-cell:?execution_count=4&line=7) ).show()
File /mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/__init__.py:47, in load_model(model, attribution_method, framework, **kwargs)
     [45](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/__init__.py:45) load_msg = f"Loading {model_name} {method_desc}"
     [46](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/__init__.py:46) with optional(not isnotebook(), Status(load_msg), logger.info, msg=load_msg):
---> [47](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/__init__.py:47)     return FRAMEWORKS_MAP[framework].load(model, attribution_method, **kwargs)
File /mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:163, in HuggingfaceModel.load(model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs)
    [159](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:159)     return HuggingfaceEncoderDecoderModel(
    [160](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:160)         model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs
    [161](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:161)     )
    [162](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:162) else:
--> [163](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:163)     return HuggingfaceDecoderOnlyModel(
    [164](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:164)         model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs
    [165](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:165)     )
File /mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:494, in HuggingfaceDecoderOnlyModel.__init__(self, model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs)
    [484](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:484) def __init__(
    [485](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:485)     self,
    [486](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:486)     model: Union[str, PreTrainedModel],
   (...)
    [492](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:492)     **kwargs,
    [493](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:493) ) -> NoReturn:
--> [494](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:494)     super().__init__(model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs)
    [495](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:495)     self.tokenizer.padding_side = "left"
    [496](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:496)     self.tokenizer.truncation_side = "left"
File /mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:122, in HuggingfaceModel.__init__(self, model, attribution_method, tokenizer, device, model_kwargs, tokenizer_kwargs, **kwargs)
    [120](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:120) self.pad_token = self._convert_ids_to_tokens(pad_token_id, skip_special_tokens=False)
    [121](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:121) if self.tokenizer.pad_token is None:
--> [122](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:122)     self.tokenizer.pad_token = self.pad_token
    [123](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:123) if self.model.config.pad_token_id is None:
    [124](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/inseq/models/huggingface_model.py:124)     self.model.config.pad_token_id = pad_token_id
File /mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1081, in SpecialTokensMixin.__setattr__(self, key, value)
   [1078](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1078)         key = key_without_id
   [1080](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1080)     if key != "additional_special_tokens" and not isinstance(value, (str, AddedToken)) and value is not None:
-> [1081](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1081)         raise ValueError(f"Cannot set a non-string value as the {key}")
   [1082](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1082)     self._special_tokens_map[key] = value
   [1083](https://vscode-remote+tunnel-002bxiaotang-002dpod.vscode-resource.vscode-cdn.net/mnt/ceph_rbd/miniconda3/envs/inseq/lib/python3.10/site-packages/transformers/tokenization_utils_base.py:1083) else:
ValueError: Cannot set a non-string value as the pad_token
Metadata
Metadata
Assignees
Labels
questionFurther information is requestedFurther information is requested