Spaces:
Running
Running
Create app.py
Browse files
app.py
ADDED
@@ -0,0 +1,65 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import streamlit as st
|
2 |
+
from bs4 import BeautifulSoup
|
3 |
+
import requests
|
4 |
+
from groq import Groq
|
5 |
+
|
6 |
+
# Define the Website class
|
7 |
+
class Website:
|
8 |
+
def __init__(self, url):
|
9 |
+
self.url = url
|
10 |
+
try:
|
11 |
+
response = requests.get(url)
|
12 |
+
soup = BeautifulSoup(response.content, 'html.parser')
|
13 |
+
self.title = soup.title.string if soup.title else "No title found"
|
14 |
+
for irrelevant in soup.body(["script", "style", "img", "input"]):
|
15 |
+
irrelevant.decompose()
|
16 |
+
self.text = soup.body.get_text(separator="\n", strip=True)
|
17 |
+
except Exception as e:
|
18 |
+
self.title = "Error loading page"
|
19 |
+
self.text = str(e)
|
20 |
+
|
21 |
+
# Initialize Groq client
|
22 |
+
api_key = "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"
|
23 |
+
client = Groq(api_key=api_key)
|
24 |
+
|
25 |
+
# Streamlit UI
|
26 |
+
st.title("Welcome to WebBot")
|
27 |
+
st.write("Enter a website URL and ask questions about its content!")
|
28 |
+
|
29 |
+
# Input fields
|
30 |
+
url = st.text_input("Website URL:", "https://example.com or .ac.ke " )
|
31 |
+
user_query = st.text_area("What would you like to know about this website")
|
32 |
+
|
33 |
+
if st.button("Submit"):
|
34 |
+
# Scrape website content
|
35 |
+
with st.spinner("Scraping website..."):
|
36 |
+
website = Website(url)
|
37 |
+
|
38 |
+
if "Error" in website.title:
|
39 |
+
st.error("Failed to load the website. Please check the URL.")
|
40 |
+
else:
|
41 |
+
st.success("Website loaded successfully!")
|
42 |
+
st.write(f"**Website Title:** {website.title}")
|
43 |
+
|
44 |
+
# Call Groq API for processing
|
45 |
+
st.write("Querying the website...")
|
46 |
+
with st.spinner("Processing your query..."):
|
47 |
+
try:
|
48 |
+
chat_streaming = client.chat.completions.create(
|
49 |
+
messages=[
|
50 |
+
{"role": "system", "content": "You are a helpful assistant specializing in extracting and analyzing website content. Answer questions based on the provided website's content. Ensure responses are clear, concise, and formatted in Markdown for better readability."},
|
51 |
+
{"role": "user", "content": f"{user_query} Here's the content:\n{website.text}"}
|
52 |
+
],
|
53 |
+
model="llama3-groq-70b-8192-tool-use-preview",
|
54 |
+
temperature=0.3,
|
55 |
+
max_tokens=1200,
|
56 |
+
top_p=1,
|
57 |
+
stream=True,
|
58 |
+
)
|
59 |
+
response = ""
|
60 |
+
for chunk in chat_streaming:
|
61 |
+
response += chunk.choices[0].delta.content
|
62 |
+
st.write("### Response:")
|
63 |
+
st.write(response)
|
64 |
+
except Exception as e:
|
65 |
+
st.error(f"Failed to process query: {e}")
|