Rajagopal committed on
Commit
65c0e5a
·
0 Parent(s):

Duplicate from Rajagopal/Nand1OpenPDF

Browse files
Files changed (5) hide show
  1. .gitattributes +34 -0
  2. README.md +13 -0
  3. Wipro logo.png +0 -0
  4. app.py +73 -0
  5. requirements.txt +7 -0
.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: csrd trying
3
+ emoji: 🏆
4
+ colorFrom: yellow
5
+ colorTo: gray
6
+ sdk: streamlit
7
+ sdk_version: 1.21.0
8
+ app_file: app.py
9
+ pinned: false
10
+ duplicated_from: Rajagopal/Nand1OpenPDF
11
+ ---
12
+
13
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
Wipro logo.png ADDED
app.py ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ from langchain.chains import RetrievalQA
3
+ from langchain.llms import AzureOpenAI
4
+ from langchain.document_loaders import TextLoader
5
+ from langchain.document_loaders import PyPDFLoader
6
+ from langchain.indexes import VectorstoreIndexCreator
7
+ from langchain.text_splitter import CharacterTextSplitter
8
+ from langchain.embeddings import OpenAIEmbeddings
9
+ from langchain.vectorstores import Chroma
10
+ from langchain.chains.question_answering import load_qa_chain
11
+ from langchain.llms import AzureOpenAI
12
+ from langchain.chains.question_answering import load_qa_chain
13
+ import streamlit as st
14
+ from PIL import Image
15
+ import time
16
+
17
@st.cache_data
def findanswer(Nand_url, Nand_question):
    """Answer a question about the PDF located at ``Nand_url``.

    The PDF is loaded with ``PyPDFLoader``, split into 1000-character
    chunks with no overlap, embedded with ``OpenAIEmbeddings`` and indexed
    in a Chroma vector store. The index is then queried through the
    module-level ``llmgpt3`` model using a ``map_reduce`` chain.

    Because of ``st.cache_data``, the result is cached per
    ``(Nand_url, Nand_question)`` pair.

    Args:
        Nand_url: Location of the PDF handed to ``PyPDFLoader``.
        Nand_question: Question to ask against the indexed document.

    Returns:
        Whatever ``index.query`` returns for the question, or ``None`` when
        either argument is empty.
    """
    # Nothing to index or nothing to ask: skip the expensive embedding work
    # and return an explicit None instead of hitting an unbound local.
    if not Nand_url or not Nand_question:
        return None

    pdf_loader = PyPDFLoader(Nand_url)
    # NOTE(review): chunk_size=1 presumably works around an Azure embedding
    # batch-size limit -- confirm against the deployment before changing it.
    embeddings = OpenAIEmbeddings(deployment="textembedding", chunk_size=1)

    index = VectorstoreIndexCreator(
        # Split the documents into chunks.
        text_splitter=CharacterTextSplitter(chunk_size=1000, chunk_overlap=0),
        # Select which embeddings we want to use.
        embedding=embeddings,
        # Use Chroma as the vector store to index and search embeddings.
        vectorstore_cls=Chroma,
    ).from_loaders([pdf_loader])

    # Query with this function's own argument rather than the script-level
    # ``yourquestion`` global, so the cached result always matches the key.
    return index.query(
        llm=llmgpt3,
        question=Nand_question,
        chain_type="map_reduce",
    )
37
+
38
+
39
+
40
# Page header: company logo followed by a one-line caption.
logo = Image.open('Wipro logo.png')
st.image(logo, width=100)
st.write("Learn best practices in Data Centre Sustainability")

# Select the Azure flavour of the OpenAI API and the API version to use.
os.environ.update(
    {
        'OPENAI_API_TYPE': 'azure',
        'OPENAI_API_VERSION': '2023-03-15-preview',
    }
)

# Completion model used by findanswer() to answer questions.
llmgpt3 = AzureOpenAI(
    deployment_name="testdavanci",
    model_name="text-davinci-003",
)
# Alternative chat deployment, currently disabled:
# llmchatgpt = AzureOpenAI( deployment_name="esujnand", model_name="gpt-35-turbo" )

# Canned questions offered in the form's select box.
samplequestions = [
    "What is Energy Star 4.0 Standard?",
    "What is RoHS Directive?",
    "What is Green IT?",
    "Benefits of greening IT?",
    "Holistic Approach to Green IT",
    "Using IT: Environmentally Sound Practices",
    "Designing Green Computers",
    "Epeat",
]
56
+
57
+
58
# Question form: the user supplies a PDF URL and picks one sample question.
with st.form("my_form"):
    myurl = st.text_input(
        "What is the URL?",
        "https://sites.pitt.edu/~dtipper/2011/GreenPaper.pdf",
    )
    yourquestion = st.selectbox('Select', samplequestions)

    # Every form must have a submit button.
    submitted = st.form_submit_button("Ask question")
    if submitted:
        # Original note: the lookup may take at least two minutes; the
        # answer is written below the form once it is available.
        st.write(findanswer(myurl, yourquestion))
71
+
72
+
73
+
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ openai
2
+ langchain
3
+ streamlit
4
+ PyPDF2
5
+ tiktoken
6
+ pypdf
7
+ chromadb