-
Notifications
You must be signed in to change notification settings - Fork 16
Description
When I run the pretraining scripts,
I get the following error:
File "/data/lc/Multi-image/multi_token/multi_token/language_models/mistral.py", line 85, in forward
) = self.prepare_inputs_labels_for_multimodal(
File "/data/lc/Multi-image/multi_token/multi_token/language_models/base_model.py", line 69, in prepare_inputs_labels_for_multimodal
m_vals = m.forward(kwargs.get(m.name))
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
return func(*args, **kwargs)
File "/data/lc/Multi-image/multi_token/multi_token/modalities/vision_clip.py", line 177, in forward
image_features.append(self.module.forward(image_batch))
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
return func(*args, **kwargs)
File "/data/lc/Multi-image/multi_token/multi_token/modalities/vision_clip.py", line 40, in forward
image_forward_outs = self.image_model(
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/transformers/models/clip/modeling_clip.py", line 925, in forward
return self.vision_model(
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/transformers/models/clip/modeling_clip.py", line 849, in forward
hidden_states = self.embeddings(pixel_values)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/transformers/models/clip/modeling_clip.py", line 190, in forward
patch_embeds = self.patch_embedding(pixel_values.to(dtype=target_dtype)) # shape = [*, width, grid, grid]
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1511, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1520, in _call_impl
return forward_call(*args, **kwargs)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 460, in forward
return self._conv_forward(input, self.weight, self.bias)
File "/root/miniconda3/envs/multi-image/lib/python3.10/site-packages/torch/nn/modules/conv.py", line 456, in _conv_forward
return F.conv2d(input, weight, bias, self.stride,
RuntimeError: weight should have at least three dimension