rohan13 committed on
Commit
c932e0c
·
1 Parent(s): 43a973e

PDF loader change: load .pdf files with PyPDFLoader instead of UnstructuredPDFLoader

Browse files
Files changed (1) hide show
  1. utils.py +4 -4
utils.py CHANGED
@@ -6,10 +6,10 @@ import faiss
6
  from langchain import HuggingFaceHub
7
  from langchain.chains import ConversationalRetrievalChain
8
  from langchain.chat_models import ChatOpenAI
9
- from langchain.document_loaders import DirectoryLoader, TextLoader, UnstructuredHTMLLoader, UnstructuredPDFLoader, UnstructuredWordDocumentLoader
10
  from langchain.embeddings import OpenAIEmbeddings, HuggingFaceHubEmbeddings
11
  from langchain.memory import ConversationBufferWindowMemory
12
- from langchain.llms.openai import OpenAI
13
  from langchain.prompts.chat import (
14
  ChatPromptTemplate,
15
  HumanMessagePromptTemplate,
@@ -83,7 +83,7 @@ def set_model(model):
83
  llm = ChatOpenAI(model_name="gpt-3.5-turbo", temperature=0.5)
84
  elif model == "GPT-4":
85
  print("Loading GPT-4")
86
- llm = OpenAI(model_name="gpt-4", temperature=0.1)
87
  elif model == "Flan UL2":
88
  print("Loading Flan-UL2")
89
  llm = HuggingFaceHub(repo_id="google/flan-ul2", model_kwargs={"temperature": 0.1, "max_new_tokens":500})
@@ -202,7 +202,7 @@ def load_documents(file_paths):
202
  elif file_path.endswith(".html"):
203
  loader = UnstructuredHTMLLoader(file_path)
204
  elif file_path.endswith(".pdf"):
205
- loader = UnstructuredPDFLoader(file_path)
206
  else:
207
  print("Unsupported file type")
208
  raise Exception("Unsupported file type")
 
6
  from langchain import HuggingFaceHub
7
  from langchain.chains import ConversationalRetrievalChain
8
  from langchain.chat_models import ChatOpenAI
9
+ from langchain.document_loaders import DirectoryLoader, TextLoader, UnstructuredHTMLLoader, UnstructuredPDFLoader, UnstructuredWordDocumentLoader, PyPDFLoader
10
  from langchain.embeddings import OpenAIEmbeddings, HuggingFaceHubEmbeddings
11
  from langchain.memory import ConversationBufferWindowMemory
12
+ from langchain.llms.openai import OpenAI, OpenAIChat
13
  from langchain.prompts.chat import (
14
  ChatPromptTemplate,
15
  HumanMessagePromptTemplate,
 
83
  llm = ChatOpenAI(model_name="gpt-3.5-turbo", temperature=0.5)
84
  elif model == "GPT-4":
85
  print("Loading GPT-4")
86
+ llm = OpenAI(model_name="gpt-4", temperature=1)
87
  elif model == "Flan UL2":
88
  print("Loading Flan-UL2")
89
  llm = HuggingFaceHub(repo_id="google/flan-ul2", model_kwargs={"temperature": 0.1, "max_new_tokens":500})
 
202
  elif file_path.endswith(".html"):
203
  loader = UnstructuredHTMLLoader(file_path)
204
  elif file_path.endswith(".pdf"):
205
+ loader = PyPDFLoader(file_path)
206
  else:
207
  print("Unsupported file type")
208
  raise Exception("Unsupported file type")