adilkh26 committed on
Commit
b8969f6
·
verified ·
1 Parent(s): 8cf71ba

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import gradio as gr
2
  import torch
3
- from transformers import AutoModel, AutoTokenizer
4
  import deepspeed
5
 
6
  # Model name
@@ -10,12 +10,12 @@ model_name = "OpenGVLab/InternVideo2_5_Chat_8B"
10
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
11
 
12
  # Load model efficiently
13
- model = AutoModel.from_pretrained(
14
  model_name,
15
  trust_remote_code=True,
16
  torch_dtype=torch.float16, # Use float16 for lower memory usage
17
  device_map="auto", # Automatically place model on available GPU
18
- deepspeed={"stage": 3}
19
  )
20
 
21
  # Define inference function
 
1
  import gradio as gr
2
  import torch
3
+ from transformers import AutoModel, AutoTokenizer, AutoModelForCausalLM
4
  import deepspeed
5
 
6
  # Model name
 
10
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
11
 
12
  # Load model efficiently
13
+ model = AutoModelForCausalLM.from_pretrained(
14
  model_name,
15
  trust_remote_code=True,
16
  torch_dtype=torch.float16, # Use float16 for lower memory usage
17
  device_map="auto", # Automatically place model on available GPU
18
+
19
  )
20
 
21
  # Define inference function