-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy patholx_beholder.py
115 lines (98 loc) · 3.59 KB
/
olx_beholder.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
import os
import sqlite3
from collections import namedtuple
import configparser
import argparse
import requests
from bs4 import BeautifulSoup
from pyhiccup.core import html
from send_email import send_email_two_part
# Command-line interface: the only option is the path of the INI config file.
parser = argparse.ArgumentParser(
    description='Simple watcher and email notifier for recent OLX offers ;)')
parser.add_argument('--ini', dest='config_file', default="olx_beholder.ini",
                    help='config file (default: olx_beholder.ini)')
args = parser.parse_args()

# Load the configuration. Any OS-level failure to open the file (missing file,
# permission denied, path is a directory, ...) is reported and ends the run
# with exit status 1 instead of an unhandled traceback.
config = configparser.ConfigParser()
try:
    with open(args.config_file) as f:
        config.read_file(f)
except OSError as e:
    print(f"Error opening config file: {args.config_file}\n{e}")
    # Raise SystemExit directly: the exit() builtin is injected by the site
    # module and is not guaranteed to exist (e.g. when run with `python -S`).
    raise SystemExit(1) from None
# Message settings. The [Message] section with sender, receiver and subject is
# mandatory (a missing one raises KeyError); bcc is optional and defaults to ''.
sender = config['Message']['sender']
receiver = config['Message']['receiver']
bcc = config['Message'].get('bcc', '')
subject = config['Message']['subject']

# File settings. Both options have defaults, so the lookups use fallback= to
# tolerate a config file that has no [Files] section at all.
db_file = config.get('Files', 'database_file', fallback='olx_beholder.db')
urls_file = config.get('Files', 'urls_file', fallback='urls.txt')

# The database path is resolved against this script's directory (an absolute
# db_file is kept unchanged by os.path.join).
DB_FULL_PATH = os.path.join(os.path.dirname(__file__), db_file)

# One scraped offer.
Offer = namedtuple("Offer", "title link city price")

# New offers collected during this run; filled by insert_offer().
offers_to_send = []
def init_db(conn):
    """Create the ``offers`` table on *conn* unless it already exists.

    The table has four text columns (title, link, city, price); ``link`` is
    declared UNIQUE.
    """
    schema = (
        "CREATE TABLE IF NOT EXISTS offers\n"
        "(title text, link text UNIQUE, city text, price text)"
    )
    conn.execute(schema)
def insert_offer(conn, title, link, city, price):
    """Store one offer and queue it for notification when the insert succeeds.

    The row is inserted into ``offers`` and committed immediately. If that
    raises sqlite3.IntegrityError (for example the link is already stored, as
    the table declares ``link`` UNIQUE), the offer is silently skipped:
    nothing is queued and nothing is printed.
    """
    candidate = Offer(title, link, city, price)
    try:
        conn.execute("INSERT INTO offers VALUES (?, ?, ?, ?)", candidate)
        conn.commit()
    except sqlite3.IntegrityError:
        # Constraint violation: nothing to announce.
        return
    offers_to_send.append(candidate)
    print("new OFFER!", candidate)
def format_body_text(offers):
    """Build the plain-text message body.

    Every offer becomes a ``* city price title link`` line that ends with a
    newline; the lines are then joined with another newline, so consecutive
    entries are separated by an empty line. No offers yields an empty string.
    """
    entries = [
        f'* {item.city} {item.price} {item.title} {item.link}\n'
        for item in offers
    ]
    return "\n".join(entries)
def format_body_html(offers):
    """Build the HTML message body.

    The offers are rendered with pyhiccup's ``html`` as a ``div`` holding a
    ``ul`` with one ``li`` per offer: the city in italics, the price in bold
    and the title as a link to the offer.
    """
    spaced = {"style": "margin-right: 3px;"}
    items = [
        ['li',
         ['i', spaced, offer.city],
         ['b', spaced, offer.price],
         ['a', {'href': offer.link}, offer.title]]
        for offer in offers
    ]
    tree = [['div', ['ul', items]]]
    # Any dir="rtl" in the generated markup is switched to left-to-right
    # (presumably pyhiccup emits it on the root element by default -- confirm).
    return html(tree).replace('dir="rtl"', 'dir="ltr"')
def process_results(conn, content):
    """Parse one result page and store every offer found in it.

    Args:
        conn: open sqlite3 connection, passed through to insert_offer().
        content: HTML of the result page, as returned by get_results().

    A page without the expected ``div.content`` container, or a single offer
    that lacks one of the expected elements, is reported and skipped rather
    than aborting the run with an AttributeError/KeyError.
    """
    soup = BeautifulSoup(content, 'html.parser')
    container = soup.find("div", "content")
    if container is None:
        # find() returns None when nothing matches (e.g. the page layout
        # differs from what this parser expects).
        print("No offers container found in page, skipping")
        return
    for wrapper in container.find_all("div", "offer-wrapper"):
        try:
            link_title = wrapper.h3.a
            title = link_title.strong.get_text().strip()
            link = link_title['href']
            city = wrapper.i.parent.get_text().strip()
            price = wrapper.find("p", "price").get_text().strip()
        except (AttributeError, KeyError) as e:
            # A missing tag surfaces as attribute access on None; a missing
            # href as KeyError. Skip only the offending offer.
            print(f"Skipping malformed offer: {e!r}")
            continue
        insert_offer(conn, title, link, city, price)
def get_results(url, timeout=30):
    """Download *url* and return the raw response body.

    Args:
        url: address of the page to fetch.
        timeout: seconds passed to requests.get() as its timeout; without one
            a stalled server could block the run indefinitely.

    Returns:
        The response content as bytes.

    Raises:
        LookupError: the server answered with a status other than 200.
        requests.RequestException: raised by requests on connection problems
            or when the timeout expires.
    """
    r = requests.get(url, timeout=timeout)
    if r.status_code == 200:
        return r.content
    raise LookupError(f"GET {url} returned HTTP status {r.status_code}")
def main():
    """Fetch every watched URL, store unseen offers and email them.

    URLs are read one per line from ``urls_file``; blank lines are ignored.
    A failure while fetching or parsing one URL is reported and the remaining
    URLs are still processed, so offers already committed to the database in
    this run are always included in the notification. A missing URL file ends
    the run with exit status 1.
    """
    try:
        with open(urls_file) as f:
            # Lines keep their trailing newline, so they must be stripped
            # before the emptiness test; otherwise blank lines would be
            # treated as URLs.
            stripped = (line.strip() for line in f)
            urls = [url for url in stripped if url]
    except FileNotFoundError as e:
        print(f"Error opening urls file\n{e}")
        # exit() comes from the site module and may be absent; raise directly.
        raise SystemExit(1) from None

    conn = sqlite3.connect(DB_FULL_PATH)
    try:
        # The connection context manager only commits or rolls back; closing
        # is done explicitly in the finally clause.
        with conn:
            init_db(conn)
            for url in urls:
                try:
                    results = get_results(url)
                    process_results(conn, results)
                except (LookupError, AttributeError,
                        requests.RequestException) as e:
                    # Keep going: offers stored so far must still be emailed,
                    # since they will not be seen as new on the next run.
                    print(f"Error processing {url}: {e!r}")
    finally:
        conn.close()

    if offers_to_send:
        body_text = format_body_text(offers_to_send)
        body_html = format_body_html(offers_to_send)
        if len(offers_to_send) == 1:
            # A single offer is described directly in the subject line.
            offer = offers_to_send[0]
            mail_subject = f"*OLX* {offer.city}; {offer.price}; {offer.title}"
        else:
            mail_subject = f"*{len(offers_to_send)}* {subject}"
        send_email_two_part(receiver, sender, mail_subject, body_text, body_html, bcc)


if __name__ == '__main__':
    main()