adilkh26 committed on
Commit
617855e
·
verified ·
1 Parent(s): ab47f68

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -1,6 +1,7 @@
1
  import gradio as gr
2
  import torch
3
  from transformers import AutoModel, AutoTokenizer
 
4
 
5
  # Model name
6
  model_name = "OpenGVLab/InternVideo2_5_Chat_8B"
@@ -13,7 +14,8 @@ model = AutoModel.from_pretrained(
13
  model_name,
14
  trust_remote_code=True,
15
  torch_dtype=torch.float16, # Use float16 for lower memory usage
16
- device_map="auto" # Automatically place model on available GPU
 
17
  )
18
 
19
  # Define inference function
 
1
  import gradio as gr
2
  import torch
3
  from transformers import AutoModel, AutoTokenizer
4
+ import deepspeed
5
 
6
  # Model name
7
  model_name = "OpenGVLab/InternVideo2_5_Chat_8B"
 
14
  model_name,
15
  trust_remote_code=True,
16
  torch_dtype=torch.float16, # Use float16 for lower memory usage
17
+ device_map="auto", # Automatically place model on available GPU
18
+ deepspeed={"stage": 3}
19
  )
20
 
21
  # Define inference function