
conda create -n ragpipe python=3.11 -y && conda activate ragpipe

pip install torch sentence_transformers transformers accelerate


pip install langchain==0.1.14
pip install langchain-experimental==0.0.56
pip install langchain-community==0.0.31
pip install faiss-cpu==1.8.0
pip install pdfplumber==0.11.0
pip install gradio==4.25.0
pip install ollama
pip install pypdf
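
# Assumption: Ollama is installed and running locally. 'mistral' is on the
# Ollama model library; the Triplex weights may be published under a
# namespaced tag (e.g. sciphi/triplex), in which case pull that tag and
# rename it to the 'triplex' name the code below expects:
ollama pull mistral
ollama pull sciphi/triplex
ollama cp sciphi/triplex triplex
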
conda install jupyter -y
# Reinstall charset_normalizer to work around a common broken-install import error
pip uninstall charset_normalizer -y
pip install charset_normalizer
jupyter notebook

from langchain_community.document_loaders import PDFPlumberLoader, TextLoader
from langchain_experimental.text_splitter import SemanticChunker
from langchain_community.embeddings import HuggingFaceEmbeddings
from langchain_community.vectorstores import FAISS
from langchain_community.llms import Ollama
from langchain.prompts import PromptTemplate
from langchain.chains.llm import LLMChain
from langchain.chains.combine_documents.stuff import StuffDocumentsChain
from langchain.chains import RetrievalQA
from pypdf import PdfReader
import ollama
import gradio as gr
import os
import json

def triplextract(text, entity_types, predicates):
    # Build the prompt in the format the Triplex model expects: the allowed
    # entity types and predicates as JSON, followed by the source text.
    input_format = """
**Entity Types:**
{entity_types}

**Predicates:**
{predicates}

**Text:**
{text}
"""

    message = input_format.format(
        entity_types=json.dumps({"entity_types": entity_types}),
        predicates=json.dumps({"predicates": predicates}),
        text=text)

    # Pass the formatted message as a single prompt string to the local Triplex model
    output = ollama.generate(model='triplex', prompt=message)
    return output

# Restrict extraction to the entity types and relations of interest
entity_types = ["PERSON", "LOCATION"]
predicates = ["PROFESSION", "BASED_IN"]

# Read the PDF and concatenate the text of every page
reader = PdfReader("/home/Ubuntu/myfiles/mypdf.pdf")
text = ""
for page in reader.pages:
    text += (page.extract_text() or "") + "\n"  # extract_text() may return None
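
# Optional check: a scanned PDF with no text layer would yield an empty string here
print(f"Extracted {len(text)} characters from {len(reader.pages)} pages")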

prediction = triplextract(text, entity_types, predicates)

# Strip the Markdown code fences (and optional "json" language tag) that the
# model wraps around its JSON output (str.removeprefix needs Python 3.9+)
response_string = prediction['response'].strip()
response_string = response_string.removeprefix('```json').removesuffix('```').strip()
response_json = json.loads(response_string)
entities_and_triples = response_json['entities_and_triples']
print(entities_and_triples)
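
# Optional: a minimal sketch to persist the extracted triples for later
# inspection; 'triples.json' is an arbitrary filename, not part of the
# original pipeline
with open('triples.json', 'w') as f:
    json.dump(entities_and_triples, f, indent=2)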

# Save the raw text so the RAG side of the pipeline can load it as a document
with open('output.txt', 'w') as f:
    f.write(text)

loader = TextLoader("./output.txt")
docs = loader.load()

# Instantiate the embedding model once and reuse it for chunking and indexing
embedder = HuggingFaceEmbeddings()

# Split the document into semantically coherent chunks
text_splitter = SemanticChunker(embedder)
documents = text_splitter.split_documents(docs)

# Create the vector store and fill it with embeddings
vector = FAISS.from_documents(documents, embedder)
retriever = vector.as_retriever(search_type="similarity", search_kwargs={"k": 3})
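
# Optional sanity check (query text is illustrative): inspect what the
# retriever returns before wiring it into the chain
sample_docs = retriever.get_relevant_documents("Who is Fahd?")
print(len(sample_docs), "chunks;", sample_docs[0].page_content[:200])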

# Define llm
llm = Ollama(model="mistral")
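
# Optional smoke test (prompt text is illustrative): confirm the local
# mistral model responds before building the chain
print(llm.invoke("Reply with the single word: ready"))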

# Define the prompt
prompt = """
1. Use the following pieces of context to answer the question at the end.
2. If you don't know the answer, just say "I don't know"; don't make up an answer.
3. Keep the answer crisp and limited to 3-4 sentences.

Context: {context}

Question: {question}

Helpful Answer:"""

QA_CHAIN_PROMPT = PromptTemplate.from_template(prompt)

# Chain that applies the QA prompt to the retrieved context
llm_chain = LLMChain(
    llm=llm,
    prompt=QA_CHAIN_PROMPT,
    callbacks=None,
    verbose=True)

# How each retrieved document is rendered before being stuffed into {context}
document_prompt = PromptTemplate(
    input_variables=["page_content", "source"],
    template="Context:\ncontent:{page_content}\nsource:{source}",
)

# Stuff all retrieved chunks into a single prompt for the LLM
combine_documents_chain = StuffDocumentsChain(
    llm_chain=llm_chain,
    document_variable_name="context",
    document_prompt=document_prompt,
    callbacks=None)

# Tie retrieval and answering together
qa = RetrievalQA(
    combine_documents_chain=combine_documents_chain,
    verbose=True,
    retriever=retriever,
    return_source_documents=True)
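
# Optional: run one query end-to-end before launching the UI (question text
# is illustrative); return_source_documents=True makes the sources available
result = qa("Where is Fahd based?")
print(result["result"])
for doc in result["source_documents"]:
    print("source:", doc.metadata.get("source"))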

def respond(question, history):
    # Gradio passes (message, history); only the message is used here
    return qa(question)["result"]

gr.ChatInterface(
    respond,
    chatbot=gr.Chatbot(height=500),
    textbox=gr.Textbox(placeholder="Ask me a question related to Fahd Mirza",
                       container=False, scale=7),
    title="Fahd's Chatbot",
    examples=["Where does Fahd live?", "Who is Fahd?"],
    cache_examples=True,
    retry_btn=None,
).launch(share=True)
