Duckduckgo Download

This document outlines a Streamlit application that integrates various AI and web scraping functionalities, allowing users to interact with an AI chatbot and perform web searches. It includes features for searching DuckDuckGo, scraping webpage content, generating AI responses, and downloading content. The application utilizes LangChain components for managing chat history and processing text data.
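
A rough sketch of the setup this script assumes (inferred from the imports below, not stated in the source): the packages streamlit, requests, beautifulsoup4, duckduckgo-search, langchain, langchain-community, langchain-ollama, langchain-text-splitters, and faiss-cpu must be installed, and a local Ollama server must have the deepseek-r1 and nomic-embed-text models already pulled. The app is then launched with "streamlit run app.py".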


import streamlit as st

import requests
from bs4 import BeautifulSoup
from duckduckgo_search import DDGS
from langchain_ollama import ChatOllama, OllamaEmbeddings
# Updated import paths: ChatMessageHistory, FAISS, and the text splitter
# have moved out of the legacy langchain package
from langchain_community.chat_message_histories import ChatMessageHistory
from langchain_core.output_parsers import StrOutputParser
from langchain_core.prompts import ChatPromptTemplate
from langchain_community.vectorstores import FAISS
from langchain_text_splitters import RecursiveCharacterTextSplitter

# Function to search DuckDuckGo
def duckduckgo_search(query, num_results=5):
    with DDGS() as ddgs:  # Use the DDGS class as a context manager
        results = [r for r in ddgs.text(query, max_results=num_results)]  # Perform search
    # Extract URLs from the results; each result dict stores its link under "href"
    return [result.get("href") for result in results] if results else []
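
# Example (hypothetical query): duckduckgo_search("streamlit tutorials", num_results=3)
# might return something like
#   ["https://docs.streamlit.io/...", "https://...", "https://..."]
# since each raw DDGS result is a dict with "title", "href", and "body" keys,
# which is why the helper above reads "href".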

# Function to scrape text from a webpage
def scrape_text(url):
    try:
        response = requests.get(url, headers={"User-Agent": "Mozilla/5.0"}, timeout=10)
        soup = BeautifulSoup(response.text, "html.parser")
        return " ".join([p.text for p in soup.find_all("p")])  # Extract text from <p> tags
    except Exception as e:
        # Return the error as text so one bad URL doesn't abort a batch scrape
        return f"Error scraping {url}: {e}"

# Function to download scraped content as a file
def download_content(content, filename):
    st.download_button(
        label="Download Content",
        data=content,
        file_name=filename,
        mime="text/plain"
    )
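
# Example (hypothetical): download_content("hello world", "notes.txt") renders
# a button that saves the string as notes.txt when clicked. Streamlit derives
# each widget's identity from its arguments, so the per-URL calls further
# below (distinct data and file_name) should not collide with one another.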

# Initialize the Ollama LLM model
llm = ChatOllama(model="deepseek-r1:latest")

# Initialize Streamlit UI
st.set_page_config(page_title="Enterprise AI Chatbot", layout="wide")

st.title("🚀 Enterprise AI Chatbot with LangChain & Streamlit")
st.write("Ask anything and interact with your AI assistant!")

# Chat history
if "history" not in st.session_state:
st.session_state.history = ChatMessageHistory()
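
# Note: Streamlit re-executes this script from the top on every interaction,
# so anything that must survive a rerun (the chat history here, and the URLs
# and retriever later) has to live in st.session_state.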

# User input
user_input = st.text_input("You:", key="user_input")

if st.button("Ask"):
    if user_input:
        # Add user input to history
        st.session_state.history.add_user_message(user_input)

        # Get AI response from the full message history
        ai_response = llm.invoke(st.session_state.history.messages)
        st.session_state.history.add_ai_message(ai_response.content)

# Display chat (top level, so the conversation re-renders on every rerun)
for msg in st.session_state.history.messages:
    if msg.type == "human":
        st.write(f"👤 You: {msg.content}")
    else:
        st.write(f"🤖 AI: {msg.content}")

# Web Crawling and Search
st.sidebar.header("Keyword-Based Web Crawler")
keyword = st.sidebar.text_input("Enter a keyword to search & scrape:")

if st.sidebar.button("Crawl & Search"):
    if keyword:
        st.write(f"🔍 Searching DuckDuckGo for: **{keyword}**...")
        urls = duckduckgo_search(keyword)

        if urls:
            st.write("✅ Found pages:", urls)

            # Store URLs in session state for later use
            st.session_state.urls = urls

            # Scrape content from the retrieved URLs
            scraped_texts = [scrape_text(url) for url in urls]

            # Split scraped text into chunks
            text_splitter = RecursiveCharacterTextSplitter(chunk_size=200, chunk_overlap=20)
            texts = text_splitter.create_documents(scraped_texts)

            # Create FAISS index; keep the retriever in session state, because
            # pressing any other button reruns the script and would otherwise
            # discard it before "Search in Scraped Data" can use it
            embeddings = OllamaEmbeddings(model="nomic-embed-text:latest")
            db = FAISS.from_documents(texts, embeddings)
            st.session_state.retriever = db.as_retriever()
        else:
            st.write("No search results found.")

# User searches inside the scraped content (only shown once an index exists)
if "retriever" in st.session_state:
    search_query = st.text_input("Search in scraped content:")

    if st.button("Search in Scraped Data") and search_query:
        docs = st.session_state.retriever.invoke(search_query)
        if docs:
            st.write("🔍 Retrieved Text:", docs[0].page_content[:300])
        else:
            st.write("No relevant results found.")

# Button to retrieve and display content from the websites found above
if "urls" in st.session_state:
    if st.sidebar.button("Retrieve Content from Websites"):
        st.write("📄 Retrieved Content from Websites:")
        for i, url in enumerate(st.session_state.urls):
            st.write(f"### Content from: {url}")
            content = scrape_text(url)
            st.write(content[:1000])  # Display the first 1000 characters of the content

            # Add a download button for each piece of scraped content
            download_content(content, f"scraped_content_{i + 1}.txt")
            st.write("---")

# Prompt-based AI interaction
st.sidebar.header("AI-Powered Prompt Generator")
topic = st.sidebar.text_input("Enter a topic for AI-generated content:")

if st.sidebar.button("Generate"):
prompt_template = ChatPromptTemplate.from_template("Tell me a joke about
{topic}")
chain = prompt_template | llm | StrOutputParser()
ai_output = chain.invoke({"topic": topic})
st.sidebar.write(f"📝 AI Response: {ai_output}")
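
# The "|" pipe above is LangChain's LCEL composition: the dict fills the
# {topic} slot in the prompt, ChatOllama returns a chat message, and
# StrOutputParser unwraps it into a plain string. A hypothetical call:
#   chain.invoke({"topic": "databases"})  # -> "Why did the database ..."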

st.sidebar.markdown("📌 **Enterprise AI solution using LangChain + Streamlit**")
