Spaces:

georad
/

sbsmapper

Running

App Files Community

georad committed on Apr 30

Commit

1d8da39

verified ·

1 Parent(s): f1b1ddc

Update pages/type_text.py

Browse files

Files changed (1) hide show

pages/type_text.py +7 -10

pages/type_text.py CHANGED Viewed

@@ -41,14 +41,14 @@ numMAPPINGS_input = 5
 @st.cache_resource
 def load_model():
     model = SentenceTransformer('all-MiniLM-L6-v2') # fastest
     return model
 model = load_model()
-#model = SentenceTransformer('all-MiniLM-L6-v2') # fastest
-#model = SentenceTransformer('all-mpnet-base-v2') # best performance
-#model = SentenceTransformers('all-distilroberta-v1')
-#model = SentenceTransformer('sentence-transformers/msmarco-bert-base-dot-v5')
-#model = SentenceTransformer('clips/mfaq')
 INTdesc_embedding = model.encode(INTdesc_input)
@@ -73,12 +73,11 @@ HF_model_results_displayed = HF_model_results_sorted[0:numMAPPINGS_input]
 @st.cache_resource
 def load_pipe():
-    pipe = pipeline("text-generation", model="meta-llama/Llama-3.2-1B-Instruct", device_map=device,) # device_map="auto", torch_dtype=torch.bfloat16
     return pipe
 pipe = load_pipe()
-#pipe = pipeline("text-generation", model="meta-llama/Llama-3.2-1B-Instruct", device_map=device,) # device_map="auto", torch_dtype=torch.bfloat16
 dictA = {"Score": [], "SBS Code": [], "SBS Description V2.0": []}
 dfALL = pd.DataFrame.from_dict(dictA)
@@ -97,8 +96,6 @@ if INTdesc_input is not None and createSBScodes_clicked == True:
     st.dataframe(data=dfALL, hide_index=True)
-    display_format = "ask REASONING MODEL: Which, if any, of the above SBS descriptions corresponds best to " + INTdesc_input +"? "
-    #st.write(display_format)
     question = "Which one, if any, of the below Saudi Billing System descriptions A, B, C, D, or E corresponds best to " + INTdesc_input +"? "
     shortlist = [SBScorpus[result[0]["corpus_id"]], SBScorpus[result[1]["corpus_id"]], SBScorpus[result[2]["corpus_id"]], SBScorpus[result[3]["corpus_id"]], SBScorpus[result[4]["corpus_id"]]]
     prompt = question + " " +"A: "+ shortlist[0] + " " +"B: " + shortlist[1] + " " + "C: " + shortlist[2] + " " + "D: " + shortlist[3] + " " + "E: " + shortlist[4]

 @st.cache_resource
 def load_model():
     model = SentenceTransformer('all-MiniLM-L6-v2') # fastest
+    #model = SentenceTransformer('all-mpnet-base-v2') # best performance
+    #model = SentenceTransformers('all-distilroberta-v1')
+    #model = SentenceTransformer('sentence-transformers/msmarco-bert-base-dot-v5')
+    #model = SentenceTransformer('clips/mfaq')
     return model
 model = load_model()
 INTdesc_embedding = model.encode(INTdesc_input)
 @st.cache_resource
 def load_pipe():
+    #pipe = pipeline("text-generation", model="meta-llama/Llama-3.2-1B-Instruct", device_map=device,) # device_map="auto", torch_dtype=torch.bfloat16
+    pipe = pipeline("text-generation", model="Qwen/Qwen2-1.5B-Instruct", device_map=device,) # device_map="auto", torch_dtype="auto"
     return pipe
 pipe = load_pipe()
 dictA = {"Score": [], "SBS Code": [], "SBS Description V2.0": []}
 dfALL = pd.DataFrame.from_dict(dictA)
     st.dataframe(data=dfALL, hide_index=True)
     question = "Which one, if any, of the below Saudi Billing System descriptions A, B, C, D, or E corresponds best to " + INTdesc_input +"? "
     shortlist = [SBScorpus[result[0]["corpus_id"]], SBScorpus[result[1]["corpus_id"]], SBScorpus[result[2]["corpus_id"]], SBScorpus[result[3]["corpus_id"]], SBScorpus[result[4]["corpus_id"]]]
     prompt = question + " " +"A: "+ shortlist[0] + " " +"B: " + shortlist[1] + " " + "C: " + shortlist[2] + " " + "D: " + shortlist[3] + " " + "E: " + shortlist[4]