PDF loader change
Browse files
utils.py
CHANGED
@@ -6,10 +6,10 @@ import faiss
|
|
6 |
from langchain import HuggingFaceHub
|
7 |
from langchain.chains import ConversationalRetrievalChain
|
8 |
from langchain.chat_models import ChatOpenAI
|
9 |
-
from langchain.document_loaders import DirectoryLoader, TextLoader, UnstructuredHTMLLoader, UnstructuredPDFLoader, UnstructuredWordDocumentLoader
|
10 |
from langchain.embeddings import OpenAIEmbeddings, HuggingFaceHubEmbeddings
|
11 |
from langchain.memory import ConversationBufferWindowMemory
|
12 |
-
from langchain.llms.openai import OpenAI
|
13 |
from langchain.prompts.chat import (
|
14 |
ChatPromptTemplate,
|
15 |
HumanMessagePromptTemplate,
|
@@ -83,7 +83,7 @@ def set_model(model):
|
|
83 |
llm = ChatOpenAI(model_name="gpt-3.5-turbo", temperature=0.5)
|
84 |
elif model == "GPT-4":
|
85 |
print("Loading GPT-4")
|
86 |
-
llm = OpenAI(model_name="gpt-4", temperature=
|
87 |
elif model == "Flan UL2":
|
88 |
print("Loading Flan-UL2")
|
89 |
llm = HuggingFaceHub(repo_id="google/flan-ul2", model_kwargs={"temperature": 0.1, "max_new_tokens":500})
|
@@ -202,7 +202,7 @@ def load_documents(file_paths):
|
|
202 |
elif file_path.endswith(".html"):
|
203 |
loader = UnstructuredHTMLLoader(file_path)
|
204 |
elif file_path.endswith(".pdf"):
|
205 |
-
loader = UnstructuredPDFLoader(file_path)
|
206 |
else:
|
207 |
print("Unsupported file type")
|
208 |
raise Exception("Unsupported file type")
|
|
|
6 |
from langchain import HuggingFaceHub
|
7 |
from langchain.chains import ConversationalRetrievalChain
|
8 |
from langchain.chat_models import ChatOpenAI
|
9 |
+
from langchain.document_loaders import DirectoryLoader, TextLoader, UnstructuredHTMLLoader, UnstructuredPDFLoader, UnstructuredWordDocumentLoader, PyPDFLoader
|
10 |
from langchain.embeddings import OpenAIEmbeddings, HuggingFaceHubEmbeddings
|
11 |
from langchain.memory import ConversationBufferWindowMemory
|
12 |
+
from langchain.llms.openai import OpenAI, OpenAIChat
|
13 |
from langchain.prompts.chat import (
|
14 |
ChatPromptTemplate,
|
15 |
HumanMessagePromptTemplate,
|
|
|
83 |
llm = ChatOpenAI(model_name="gpt-3.5-turbo", temperature=0.5)
|
84 |
elif model == "GPT-4":
|
85 |
print("Loading GPT-4")
|
86 |
+
llm = OpenAI(model_name="gpt-4", temperature=1)
|
87 |
elif model == "Flan UL2":
|
88 |
print("Loading Flan-UL2")
|
89 |
llm = HuggingFaceHub(repo_id="google/flan-ul2", model_kwargs={"temperature": 0.1, "max_new_tokens":500})
|
|
|
202 |
elif file_path.endswith(".html"):
|
203 |
loader = UnstructuredHTMLLoader(file_path)
|
204 |
elif file_path.endswith(".pdf"):
|
205 |
+
loader = PyPDFLoader(file_path)
|
206 |
else:
|
207 |
print("Unsupported file type")
|
208 |
raise Exception("Unsupported file type")
|