Skip to content

Commit

Permalink
tutorial32
Browse files Browse the repository at this point in the history
  • Loading branch information
ronidas39 committed Jan 18, 2024
1 parent f23a393 commit ec3164b
Show file tree
Hide file tree
Showing 5 changed files with 33 additions and 2 deletions.
2 changes: 1 addition & 1 deletion tutorial2/single_url.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
from langchain.document_loaders import youtube
import io

loader=youtube.YoutubeLoader.from_youtube_url("https://www.youtube.com/watch?v=kjmsd-1coZo")
loader=youtube.YoutubeLoader.from_youtube_url("https://youtu.be/cF4nkvuJpEU")
docs=loader.load()
print(docs)
with io.open("transcript.txt","w",encoding="utf-8")as f1:
Expand Down
2 changes: 1 addition & 1 deletion tutorial2/transcript.txt

Large diffs are not rendered by default.

Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
31 changes: 31 additions & 0 deletions tutorial32/main.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
from langchain.document_loaders import AsyncChromiumLoader
from langchain.document_transformers import Html2TextTransformer
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores import Chroma
from langchain.embeddings import OpenAIEmbeddings
from langchain.chat_models import ChatOpenAI
from langchain.chains import RetrievalQA

# Question answering over a single web page: load the page, convert its HTML
# to text, split the text into chunks, index the chunks in a Chroma vector
# store, and let a chat model answer the query from the retrieved chunks.
# NOTE(review): OpenAIEmbeddings/ChatOpenAI presumably need an OpenAI API key
# from the environment -- confirm before running.

# Page(s) to load; only one scorecard URL is used here.
urls = [
    "https://www.espncricinfo.com/series/afghanistan-in-india-2023-24-1389384/india-vs-afghanistan-3rd-t20i-1389398/full-scorecard"
]
loader = AsyncChromiumLoader(urls=urls)
htmldocs = loader.load()

# Convert the loaded HTML documents to text documents before splitting.
tf = Html2TextTransformer()
fd = tf.transform_documents(htmldocs)

# Chunks of up to 1000 characters with no overlap between neighbours.
ts = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
splits = ts.split_documents(fd)

llm = ChatOpenAI(model="gpt-4", temperature=0.8)
embeddings = OpenAIEmbeddings()

# No persist directory is passed, so the index is rebuilt on every run.
chroma_db = Chroma.from_documents(
    documents=splits,
    embedding=embeddings,
)

query = "Rinku Singh scores on the match between india vs afghanistan"

# "stuff" chain type: the retrieved chunks are placed into a single prompt.
chain = RetrievalQA.from_chain_type(
    llm=llm,
    chain_type="stuff",
    retriever=chroma_db.as_retriever(),
)

# Use invoke() rather than calling the chain object directly: Chain.__call__
# is deprecated in LangChain. The returned mapping (query + result) is the
# same, so the printed output keeps its shape.
response = chain.invoke({"query": query})
print(response)


Binary file added tutorial32/tutorial32.pptx
Binary file not shown.

0 comments on commit ec3164b

Please sign in to comment.