Docfile committed on
Commit
ef3b5a8
·
1 Parent(s): 6b03de8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -1
app.py CHANGED
@@ -13,9 +13,24 @@ from g4f import Provider, models
13
  from langchain.llms.base import LLM
14
  from langchain.embeddings import HuggingFaceEmbeddings
15
  from langchain_g4f import G4FLLM
 
 
 
 
16
 
 
 
17
 
18
- llm = LLM = G4FLLM(model=models.gpt_35_turbo,provider=Provider.DeepAi,)
 
 
 
 
 
 
 
 
 
19
 
20
  embeddings = HuggingFaceEmbeddings(
21
  model_name="sentence-transformers/all-mpnet-base-v2"
 
13
  from langchain.llms.base import LLM
14
  from langchain.embeddings import HuggingFaceEmbeddings
15
  from langchain_g4f import G4FLLM
16
+ from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
17
+ from huggingface_hub import hf_hub_download
18
+ from langchain.llms import LlamaCpp
19
+ from langchain import PromptTemplate, LLMChain
20
 
21
+ model_name_or_path = "hlhr202/llama-7B-ggml-int4"
22
+ model_basename = "ggml-model-q4_0.bin" # the model is in bin format
23
 
24
+ model_path = hf_hub_download(repo_id=model_name_or_path, filename=model_basename)
25
+
26
+ n_gpu_layers = 40 # Change this value based on your model and your GPU VRAM pool.
27
+ n_batch = 256
28
+
29
+ llm = LlamaCpp(
30
+ model_path, callbacks=[StreamingStdOutCallbackHandler()]
31
+ )
32
+
33
+ #llm = LLM = G4FLLM(model=models.gpt_35_turbo,provider=Provider.DeepAi,)
34
 
35
  embeddings = HuggingFaceEmbeddings(
36
  model_name="sentence-transformers/all-mpnet-base-v2"