2 changed files with 37 additions and 9 deletions

@@ -4,8 +4,8 @@ import scraper_functions as sf
 def processmsg(msg, rcpt):
     if "youtube.com/watch" in msg:
         return msg.replace("youtube.com", "iv.datura.network")
-    elif msg.startswith("!wiki"):
-        return sf.query_external_website("https://en.wikipedia.org/wiki/", msg.split(" ")[1])
+    elif msg.startswith("!"):
+        return command(msg, "")
     elif "good bot" in msg:
         return "^_^"
@@ -13,10 +13,17 @@ def command(msg, rcpt):
     if msg.startswith("!help"):
         response = "chatbot commands:" + "\n"
         response += "!help Show this help page" + "\n"
-        response += "!ai [message] Ask llama2"
+        response += "!ai [message] Ask llama2" + "\n"
+        response += "!wiki [message] Ask wiki"
         return response
     elif msg.startswith("!ai"):
         client = ollama.Client(host='https://ollama.krov.dmz.rs')
         response = client.chat(model='llama2-uncensored:latest', messages=[{'role':'user','content':f'{msg[4:]}'}])
         return(response['message']['content'])
+    elif msg.startswith("!wiki"):
+        cmd, query = msg.split(" ", 1)
+        return sf.query_external_website("https://en.wikipedia.org", "/wiki/" + query)
+    elif msg.startswith("!tasks"):
+        content = sf.getDmzTasks()
+        return content

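The !ai branch above talks to a self-hosted Ollama instance through the ollama Python client: Client(host=...) picks the server, client.chat() sends the conversation, and the reply text sits in response['message']['content'] (msg[4:] strips the leading "!ai " before the prompt is sent). A minimal standalone sketch of the same call, with host and model taken from the diff and an illustrative prompt:

import ollama

client = ollama.Client(host='https://ollama.krov.dmz.rs')
response = client.chat(
    model='llama2-uncensored:latest',
    messages=[{'role': 'user', 'content': 'Reply with a one-line greeting.'}],
)
print(response['message']['content'])  # the model's reply text

The new !wiki branch splits on the first space only (msg.split(" ", 1)), so multi-word titles like "Alan Turing" reach the scraper intact.
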
scraper_functions.py

@@ -1,12 +1,33 @@
 import requests
 from bs4 import BeautifulSoup
+from urllib.parse import quote
 
 def query_external_website(base_url, query):
     try:
-        page = requests.get(base_url + query)
+        page = requests.get(base_url + quote(query))
         soup = BeautifulSoup(page.content, "html.parser")
-        title = soup.find("span", class_="mw-page-title-main").text
-        content = soup.find(id="mw-content-text").select("p")[2].text
-        return "\nTITLE:\n" + title + "\n\nCONTENT:\n" + content + "\n\nFULL LINK:\n" + base_url + query
-    except:
-        return "Can't parse search result :("
+        title = soup.find(id="firstHeading").text
+        mainContentElement = soup.find(id="mw-content-text")
+        if "This page is a redirect" in mainContentElement.text:
+            redirectLink = mainContentElement.find(class_="redirectMsg").find_all("a")[0]["href"]
+            return query_external_website(base_url, redirectLink)
+        content = next((paragraph for paragraph in mainContentElement.select("p") if not paragraph.has_attr("class")), None)
+        if content is None:
+            raise Exception("Can't parse search result :(")
+        return "\nTITLE:\n" + title + "\n\nCONTENT:\n" + content.text + "\n\nFULL LINK:\n" + base_url + quote(query)
+    except Exception as e:
+        return str(e)
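
Three changes land in query_external_website: the title now comes from the stable #firstHeading element instead of a skin-dependent span class, redirect pages are followed by recursing on the first link inside the redirectMsg block, and the query is percent-encoded with urllib.parse.quote before it is appended to the URL. The encoding is what makes multi-word or non-ASCII titles work; quote() leaves "/" unescaped by default, so path prefixes survive:

from urllib.parse import quote

print(quote("/wiki/" + "Alan Turing"))  # -> /wiki/Alan%20Turing
print(quote("/wiki/" + "Kurt Gödel"))   # -> /wiki/Kurt%20G%C3%B6del

The rest of the hunk adds a second scraper: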
+
+def getDmzTasks():
+    try:
+        page = requests.get("https://todo.dmz.rs/")
+        soup = BeautifulSoup(page.content, "html.parser")
+        tasks = soup.find_all(class_="task")
+        result = "\nActive tasks:\n"
+        for task in tasks:
+            taskIndex = task.select("div")[0].text
+            taskTitle = task.select("div")[1].text
+            result += taskIndex + " " + taskTitle + "\n"
+        return result
+    except Exception as e:
+        return str(e)
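
getDmzTasks follows the same fetch-and-parse pattern: it assumes every task on https://todo.dmz.rs/ is an element with class "task" whose first two <div> children hold the task's index and title (an assumption about that site's markup, taken from the diff). The loop also assumes at least two <div>s per task; a defensive variant (a sketch, not part of the diff; the function name and timeout are additions) skips entries that don't match:

import requests
from bs4 import BeautifulSoup

def get_dmz_tasks_safe():
    # Same scraper, but tolerant of tasks that lack two <div> children.
    page = requests.get("https://todo.dmz.rs/", timeout=10)
    soup = BeautifulSoup(page.content, "html.parser")
    result = "\nActive tasks:\n"
    for task in soup.find_all(class_="task"):
        divs = task.select("div")
        if len(divs) < 2:
            continue  # skip entries that don't match the expected markup
        result += divs[0].text + " " + divs[1].text + "\n"
    return result

print(get_dmz_tasks_safe())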