Yixin1234 committed on
Commit
8f77b64
·
1 Parent(s): 3382272

Try to fix API errors

Browse files
Files changed (2) hide show
  1. app.py +7 -6
  2. requirements.txt +6 -3
app.py CHANGED
@@ -4,6 +4,8 @@ from deepseek_vl.utils.io import load_pil_images
4
  import torch
5
 
6
  model_path = "deepseek-ai/deepseek-vl-1.3b-chat"
 
 
7
  vl_chat_processor = VLChatProcessor.from_pretrained(model_path)
8
  tokenizer = vl_chat_processor.tokenizer
9
  vl_gpt = MultiModalityCausalLM.from_pretrained(model_path, trust_remote_code=True).to("cpu")
@@ -19,6 +21,7 @@ def qa(image, question):
19
  images=pil_images,
20
  force_batchify=True
21
  ).to("cpu")
 
22
  inputs_embeds = vl_gpt.prepare_inputs_embeds(**prepare_inputs)
23
  outputs = vl_gpt.language_model.generate(
24
  inputs_embeds=inputs_embeds,
@@ -26,7 +29,7 @@ def qa(image, question):
26
  pad_token_id=tokenizer.eos_token_id,
27
  bos_token_id=tokenizer.bos_token_id,
28
  eos_token_id=tokenizer.eos_token_id,
29
- max_new_tokens=512,
30
  do_sample=False,
31
  use_cache=True
32
  )
@@ -41,8 +44,6 @@ demo = gr.Interface(
41
  description="Upload an image and enter a question. Experience DeepSeek-VL's vision-language capabilities."
42
  )
43
 
44
- demo.launch(
45
- server_name="0.0.0.0",
46
- server_port=7860,
47
- share=True
48
- )
 
4
  import torch
5
 
6
  model_path = "deepseek-ai/deepseek-vl-1.3b-chat"
7
+
8
+ # Load processors and model (CPU on free Spaces)
9
  vl_chat_processor = VLChatProcessor.from_pretrained(model_path)
10
  tokenizer = vl_chat_processor.tokenizer
11
  vl_gpt = MultiModalityCausalLM.from_pretrained(model_path, trust_remote_code=True).to("cpu")
 
21
  images=pil_images,
22
  force_batchify=True
23
  ).to("cpu")
24
+
25
  inputs_embeds = vl_gpt.prepare_inputs_embeds(**prepare_inputs)
26
  outputs = vl_gpt.language_model.generate(
27
  inputs_embeds=inputs_embeds,
 
29
  pad_token_id=tokenizer.eos_token_id,
30
  bos_token_id=tokenizer.bos_token_id,
31
  eos_token_id=tokenizer.eos_token_id,
32
+ max_new_tokens=256, # smaller is faster on CPU
33
  do_sample=False,
34
  use_cache=True
35
  )
 
44
  description="Upload an image and enter a question. Experience DeepSeek-VL's vision-language capabilities."
45
  )
46
 
47
+ if __name__ == "__main__":
48
+ # No server_name/server_port/share on Spaces
49
+ demo.queue(concurrency_count=1, max_size=8).launch()
 
 
requirements.txt CHANGED
@@ -1,4 +1,7 @@
1
- gradio
2
- torch
3
- transformers
 
 
 
4
  git+https://github.com/deepseek-ai/DeepSeek-VL.git
 
1
+ gradio>=4.31.0
2
+ transformers>=4.40.0
3
+ torch>=2.2.0
4
+ sentencepiece
5
+ timm>=0.9.16
6
+ accelerate
7
  git+https://github.com/deepseek-ai/DeepSeek-VL.git