unsloth
/

DeepSeek-OCR

Image-Text-to-Text

vision-language

Model card Files Files and versions

danielhanchen committed 17 days ago

Commit

af03e36

·

verified ·

1 Parent(s): 425319b

Update modeling_deepseekv2.py

Files changed (1) hide show

modeling_deepseekv2.py +8 -4

modeling_deepseekv2.py CHANGED Viewed

@@ -34,10 +34,14 @@ from torch.nn import BCEWithLogitsLoss, CrossEntropyLoss, MSELoss
 from transformers.activations import ACT2FN
 from transformers.cache_utils import Cache, DynamicCache
 from transformers.modeling_attn_mask_utils import _prepare_4d_causal_attention_mask
-from transformers.models.llama.modeling_llama import (
-    LlamaAttention,
-    LlamaFlashAttention2
-)
 from transformers.modeling_outputs import (
     BaseModelOutputWithPast,
     CausalLMOutputWithPast,

 from transformers.activations import ACT2FN
 from transformers.cache_utils import Cache, DynamicCache
 from transformers.modeling_attn_mask_utils import _prepare_4d_causal_attention_mask
+try:
+    from transformers.models.llama.modeling_llama import LlamaAttention
+except:
+    LlamaAttention = None
+try:
+    from transformers.models.llama.modeling_llama import LlamaFlashAttention2
+except:
+    LlamaFlashAttention2 = None
 from transformers.modeling_outputs import (
     BaseModelOutputWithPast,
     CausalLMOutputWithPast,