-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbot.py
141 lines (133 loc) · 4.12 KB
/
bot.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
import feedparser
import sqlite3
import os
import asyncio
from hashlib import sha1
from json import dumps
import telegram
import html2markdown
from time import mktime, time
from datetime import datetime
from dateutil import parser
def connect_to_db():
if not os.path.exists('simple.db'):
create_db()
return sqlite3.connect('simple.db')
def create_db():
conn = sqlite3.connect('simple.db')
c = conn.cursor()
c.execute('''CREATE TABLE feeds (ID INTEGER PRIMARY KEY, URL VARCHAR(2083) UNIQUE);''')
c.execute('''CREATE TABLE entries (ID INTEGER PRIMARY KEY, Feed INTEGER,
Title VARCHAR(2083), PubDate DECIMAL, FOREIGN KEY(Feed) REFERENCES
feeds(ID), CONSTRAINT uniqueness UNIQUE (Title, PubDate, Feed));''')
conn.commit()
conn.close()
def check_new(conn, url, title, timestamp):
c = conn.cursor()
sql = "SELECT ID FROM feeds WHERE URL = ?"
c.execute(sql, [url])
ids = c.fetchone()
new = False
send = False
if not ids:
sql = "INSERT INTO feeds (URL) VALUES (?);"
c.execute(sql, [url])
sql = "INSERT INTO entries (Feed, Title, PubDate) VALUES (?, ?, ?);"
c.execute(sql, [c.lastrowid, title, timestamp])
new = True
send = False
else:
sql = "SELECT Title FROM entries WHERE Feed = ? AND Title = ? AND PubDate = ?"
c.execute(sql, [ids[0], title, timestamp])
result = c.fetchall()
if not result:
sql = "INSERT INTO entries (Feed, Title, PubDate) VALUES (?, ?, ?);"
try:
c.execute(sql, [ids[0], title, timestamp])
send = True
except sqlite3.IntegrityError as e:
print("Error inserting " + str(title) + " - " + str(timestamp) + ". Got error: " + str(e))
send = False
conn.commit()
return new, send
def get_timestamp(entry):
timestamp = 0
try:
timestamp = mktime(entry['published_parsed'])
except:
try:
timestamp = mktime(entry['updated_parsed'])
except:
try:
timestamp = mktime(parser.parse(entry['published'], fuzzy=True).timetuple())
except:
try:
timestamp = mktime(parser.parse(entry['updated'], fuzzy=True).timetuple())
except:
timestamp = float(sha1(entry['title'].hexdigest())) # If absolutely no timestamp is possible, "hash" the title.
return timestamp
async def check_feed():
conn = connect_to_db()
with open("urls") as f:
content = f.readlines()
content = [x.strip() for x in content]
bot, chat = init_bot()
for url in content:
if url == "":
continue
feed = feedparser.parse(url)
for entry in feed['entries']:
title = entry.title
try:
desc = entry.description
except:
print(feed)
desc = "[COULD NOT RETRIEVE DESCRIPTION]"
link = entry.link
timestamp = get_timestamp(entry)
new, send = check_new(conn, url, title, timestamp)
if new:
for entry in feed['entries']:
title = entry.title
timestamp = get_timestamp(entry)
check_new(conn, url, title, timestamp)
break
elif send:
message = "**" + feed.feed.title + "** \n \n"
message += "[" + title + "](" + link + ") \n \n"
parsed = feedparser.parse(desc)
try:
src = parsed['feed']['img']['src']
if len(message) > 1024:
message = message[:1020]
message += "..."
await bot.send_photo(chat_id=chat, photo=src, caption=message, parse_mode=telegram.constants.ParseMode.MARKDOWN_V2)
except:
tmp = message + html2markdown.convert(feed.entries[0].description)
try:
await send_message(tmp, bot, chat)
except:
await send_message(message, bot, chat)
conn.close()
def init_bot():
with open("token") as f:
content = f.readlines()
content = [x.strip() for x in content]
bot = telegram.Bot(token=content[0])
return bot, content[1]
async def send_message(message, bot, chat):
if len(message) > 1024:
message = message[:1020]
message += "..."
bot.sendMessage(text=message, chat_id=chat, parse_mode=telegram.constants.ParseMode.MARKDOWN)
if __name__ == "__main__":
init = True
if not os.path.exists("urls"):
print("You do not have a urls file, please add your rss feeds to the newly created urls file")
init = False
if not os.path.exists("token"):
print("You do not have a token file, please add the neccessary details to your token file")
init = False
if not init:
exit()
asyncio.run(check_feed())