-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdata_base.py
259 lines (199 loc) · 10.7 KB
/
data_base.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
"""
data_base.py: The Data Access Layer (DAL) of the project.
This library interacts with the MongoDB and SQLite databases and with the Gmail API to fetch, process, and store email data.
It provides functions to initialize, update, and manage the database and more.
"""
from constent import *
import base64
import shared_resources
import pymongo
from simplegmail import Gmail , message , label, attachment
from simplegmail.query import construct_query
import logging
import sqlite_file
from datetime import datetime, timezone
import time
from dateutil import parser
# Configure the root logger so INFO-level records (and above) are emitted.
logging.basicConfig(level=logging.INFO)

# Module-level simplegmail client used by the functions below.
gmail = Gmail()

# Gmail category label names, each mapped to itself; used as a membership
# lookup via categories.get(<label name>).
categories = {
    category_name: category_name
    for category_name in (
        "CATEGORY_SOCIAL",
        "CATEGORY_PROMOTIONS",
        "CATEGORY_UPDATES",
        "CATEGORY_FORUMS",
        "CATEGORY_PERSONAL",
        "CATEGORY_PRIMARY",
    )
}
def update_db(email) -> None:
    """
    Sync the "Messages" collection with the user's Gmail account.

    Gets the messages of every Gmail label and, for each message whose
    (id, label_ids) pair does not exist in the collection yet, replaces any
    stale copy stored under the same id and inserts the fresh one. Messages
    that were not stored before and are not in TRASH are additionally
    registered under each of their category labels via category_handler.

    Nothing is synced when the user has no document (or no "latest_message"
    value) in the "Users" collection; a warning is logged instead.
    """
    logging.info(f"\n\nupdate_db -- START \n\n")
    db = shared_resources.client["Deft"]
    users_collection = db["Users"]
    message_collection = db["Messages"]

    user_doc = users_collection.find_one({"email": email}, {"latest_message": 1})
    current_latest_message = user_doc.get("latest_message") if user_doc else None
    if current_latest_message is None:
        # Without a stored reference date there is nothing to compare against.
        logging.warning(f"update_db -- no user / latest_message found for {email}, skipping sync")
        return
    # The stored value is treated as UTC so it can be compared with aware dates.
    current_latest_message = current_latest_message.replace(tzinfo=timezone.utc)

    labels = gmail.list_labels()
    if Constent.there_is_messages_after_latest_message_from_gmail(gmail, users_collection, current_latest_message):
        for gmail_label in labels:
            logging.info(f"\n\nupdate_db -- gmail query START: {time.ctime()}\n\n")
            # NOTE(review): init_db queries with "label:<name>" (no space) - confirm
            # that the space after the colon is intended here.
            messages = gmail.get_messages(query=f"label: {gmail_label.name}")
            logging.info(f"\n\nupdate_db -- gmail quary END: {time.ctime()} \n\n")
            if not messages:
                continue

            # The first returned message is used as this label's newest one.
            latest_message_date = Constent.convert_date_to_utc(messages[0].date)
            if not update_and_check_latest_message(email, latest_message_date):
                continue

            for msg in messages:
                already_stored = message_collection.count_documents(
                    {"id": msg.id, "label_ids": labels_to_list(msg.label_ids)}
                )
                if already_stored:
                    continue

                # Same id but different labels: drop the stale copy first.
                stale_copy = message_collection.find_one({"id": msg.id})
                if stale_copy:
                    message_collection.delete_one({"id": msg.id})

                msg.date = Constent.convert_date_to_utc(msg.date)
                document = purify_message(msg)
                message_collection.insert_one(document)

                # Only brand-new, non-trashed messages are added to categories.
                if stale_copy or "TRASH" in document["label_ids"]:
                    continue
                for label_name in document["label_ids"]:
                    if categories.get(label_name):
                        category_handler(document, label_name, email)
    logging.info(f"\n\nupdate_db -- END: {time.ctime()} \n\n")
def init_db(email) -> None:
    """
    Init the database with the user email data for the first time.

    For every Gmail label: fetches the label's messages, inserts the ones whose
    id is not yet in the "Messages" collection, appends all fetched ids to the
    user's list named after the label, updates the stored latest-message date,
    and finally calls category_handler for non-trashed messages.
    """
    db = shared_resources.client["Deft"]
    users_collection = db["Users"]
    message_collection = db["Messages"]
    labels = gmail.list_labels()
    for label in labels:
        messages = gmail.get_messages(query=f"label:{label.name}")
        if messages:
            # The first returned message is used as the label's latest date.
            latest_message_date = Constent.convert_date_to_utc(messages[0].date)
            label_message_ids = []
            for msg in messages:
                msg.date = Constent.convert_date_to_utc(msg.date)
                # Insert only messages whose id is not stored yet; the message is
                # purified in both branches because its id is needed below.
                if message_collection.count_documents({"id": msg.id}) == 0:
                    purified_message = purify_message(msg)
                    message_collection.insert_one(purified_message)
                else:
                    purified_message = purify_message(msg)
                label_message_ids.append(purified_message["id"])
            # Append every fetched id to the user's list for this label.
            users_collection.update_one({"email": email}, {"$push": {label.name: {"$each": label_message_ids}}})
            update_and_check_latest_message(email, latest_message_date)
            for message in messages:
                # Rebinds `labels`; the outer `for label in labels` loop is not
                # affected because its iterator was created before this point.
                labels = {label.name: label.name for label in message.label_ids}
                if "TRASH" not in labels:
                    for label_element in labels:
                        # NOTE(review): the comprehension variable above does not
                        # leak, so `label` here is the outer loop's Gmail label;
                        # when it has a `name`, every label_element becomes the
                        # current label's name - confirm this is intended.
                        label_element = label.name if hasattr(label, 'name') else label_element
                        if categories.get(label_element):
                            category_handler(message, label_element, email)
def make_db(email) -> None:
    """
    Create the user's document in the "Users" collection if it is missing.

    The new document holds the email, the name derived from it, one empty list
    per Gmail label and a "latest_message" date initialised to 1970-01-01 UTC.
    """
    user_name = shared_resources.get_name_from_email(email)
    users = shared_resources.client["Deft"]["Users"]

    # NOTE(review): existence is checked by name, not by email - confirm that
    # two different addresses can never map to the same name.
    if users.find_one({"name": user_name}):
        return

    new_user = {"email": email, "name": user_name}
    for gmail_label in gmail.list_labels():
        new_user[gmail_label.name] = []
    new_user["latest_message"] = datetime(1970, 1, 1, tzinfo=timezone.utc)
    users.insert_one(new_user)
def category_handler(message, label, email)-> None:
    """
    Append the message's id to the user's list stored under `label`.

    The message is passed through purify_message first and its "id" entry is
    pushed onto the `label` field of the user document matching `email`.
    """
    users = shared_resources.client["Deft"]["Users"]
    message_id = purify_message(message)["id"]
    users.update_one({"email": email}, {"$push": {label: message_id}})
def update_and_check_latest_message(email, latest_message_date)-> bool:
    """
    Store `latest_message_date` for the user if it is newer than the saved one.

    Returns True when the user's "latest_message" field was updated, and False
    otherwise - including when the user document, its stored date or
    `latest_message_date` is missing.
    """
    user_collection = shared_resources.client["Deft"]["Users"]
    user_doc = user_collection.find_one({"email": email}, {"latest_message": 1})
    # find_one returns None for an unknown email; a None date cannot be compared.
    if not user_doc or latest_message_date is None:
        return False

    stored_latest = user_doc.get("latest_message")
    if not stored_latest:
        return False

    # The stored value is treated as UTC so it can be compared with aware dates.
    stored_latest = stored_latest.replace(tzinfo=timezone.utc)
    if stored_latest < latest_message_date:
        user_collection.update_one({"email": email}, {"$set": {"latest_message": latest_message_date}})
        return True
    return False
def labels_to_list(labels)-> list[str]: #TODO: change the insertion to the function
    """
    Convert a collection of labels into a list of label names.

    Accepts label objects exposing a `name` attribute, plain label-name
    strings, or a mix of both. A single string is treated as one label name,
    and empty or missing input yields an empty list.
    """
    if not labels:
        return []
    if isinstance(labels, str):
        # A lone string is one label, not a sequence of characters.
        return [labels]
    return [item if isinstance(item, str) else item.name for item in labels]
def purify_message(messages) -> list[dict]:
    """
    Turn message object(s) into dictionaries that are valid for MongoDB.

    A list is converted element by element and a single Message is converted
    to one dictionary; any other value is returned unchanged.
    """
    def to_document(gmail_message):
        # Start from the object's attribute dict and let Constent filter it.
        document = Constent.filter_fields(gmail_message.__dict__, labels_to_list)
        document['date'] = Constent.convert_date_to_utc(document['date'])
        return document

    if isinstance(messages, list):
        return [to_document(item) for item in messages]
    if isinstance(messages, message.Message):
        return to_document(messages)
    return messages
def fetch_message_and_message_labels(message_id, labels) -> dict:
    """
    Fetch a single stored message together with its label names.

    Returns a `(message, label_names)` pair: the "Messages" document whose
    "id" equals `message_id` (None when there is no match) and the result of
    shared_resources.get_labels(labels, 0).
    """
    label_names = shared_resources.get_labels(labels, 0)
    stored_message = shared_resources.client["Deft"]["Messages"].find_one({"id": message_id})
    return stored_message, label_names
def update_messages_after_action(message, message_id)-> None: #TODO: not in use
    """
    Replace the stored copy of `message` and drop its id from "unread".

    Deletes the "Messages" document with the message's id, inserts the
    purified message again and pulls `message_id` from the "unread" list of
    the session user's document.
    """
    deft_db = shared_resources.client["Deft"]
    stored_messages = deft_db["Messages"]
    stored_messages.delete_one({"id": message['id']})
    stored_messages.insert_one(purify_message(message))
    # NOTE(review): `session` is not defined in the visible part of this file;
    # presumably it comes from `from constent import *` - confirm. Other
    # functions here use the upper-case "UNREAD" field - verify "unread".
    deft_db["Users"].update_one({"email": session['email']}, {"$pull": {"unread": message_id}})
def make_as_read(email,desired_label,desired_message_id,db) -> None:
    """
    Mark a message as read in both collections.

    Pulls the message id from the user's "UNREAD" list and pulls
    `desired_label` from the message's "label_ids".
    """
    user_filter = {"email": email}
    message_filter = {"id": desired_message_id}
    db["Users"].update_one(user_filter, {"$pull": {"UNREAD": desired_message_id}})
    db["Messages"].update_one(message_filter, {"$pull": {"label_ids": desired_label}})
def find_user(email)-> int:
    """Return the number of "Users" documents whose email equals `email`."""
    return shared_resources.client["Deft"]["Users"].count_documents({"email": email})
def pull_id_from_users_by_label(email, label, message_id, db)-> None:
    """Remove `message_id` from the user's list stored under `label`."""
    users = db["Users"]
    removal = {"$pull": {label: message_id}}
    users.update_one({"email": email}, removal)
def insert_id_to_Users_by_label(email, label, message_id, db)-> None:
    """Append `message_id` to the user's list stored under `label`."""
    users = db["Users"]
    addition = {"$push": {label: message_id}}
    users.update_one({"email": email}, addition)
def delete_from_collection(collection_name, message_id, db)-> None:
    """Delete one document whose "id" equals `message_id` from the collection."""
    target_collection = db[collection_name]
    target_collection.delete_one({"id": message_id})
def insert_one_document_to_collection(collection_name, message, db)-> None:
    """Purify `message` and insert it into the named collection of `db`."""
    document = purify_message(message)
    target_collection = db[collection_name]
    target_collection.insert_one(document)
def insert_many_documents_to_collection(collection_name, messages)-> None:
    """
    Purify `messages` and insert them into the named "Deft" collection.

    Nothing is written when there are no documents to insert, and a single
    message (which purifies to one dictionary) is inserted as a one-item batch.
    """
    db = shared_resources.client["Deft"]
    documents = purify_message(messages)
    if not documents:
        # insert_many rejects an empty list, so there is nothing to do.
        return
    if isinstance(documents, dict):
        # A single purified message must be wrapped to form a valid batch.
        documents = [documents]
    db[collection_name].insert_many(documents)
def get_all_ids_for_user(email)-> list: #TODO: not in use
    """
    Return the "all_ids" field of the user document matching `email`.

    NOTE(review): make_db does not create an "all_ids" field explicitly -
    confirm where it is expected to come from.
    """
    user_doc = shared_resources.client["Deft"]["Users"].find_one({"email": email})
    return user_doc["all_ids"]
def get_all_messages_erlier_than_latest_message(message_collection) -> list:
    """
    Return today's non-trashed messages, newest first, without duplicate ids.

    Selects documents whose "date" is greater than or equal to
    Constent.get_today_date() and whose "label_ids" do not contain "TRASH",
    sorted by "date" in descending order.
    """
    query = {"date": {"$gte": Constent.get_today_date()}, "label_ids": {"$ne": "TRASH"}}
    cursor = message_collection.find(query).sort("date", -1)
    return remove_duplicates_from_list(list(cursor))
def remove_duplicates_from_list(messages)-> list:
    """
    Return the messages with duplicate ids removed, keeping first occurrences.

    Each message is a mapping with an "id" entry; the original order of the
    kept messages is preserved.
    """
    seen_ids = set()  # set membership keeps the whole pass linear
    unique_messages = []
    for message in messages:
        message_id = message["id"]
        if message_id not in seen_ids:
            seen_ids.add(message_id)
            unique_messages.append(message)
    return unique_messages
def insert_label_to_message(email, label, message_id, recipient, db) -> None:
    """
    Add `label` to the "label_ids" of one stored message and log the result.

    The message is matched by both `recipient` and `message_id`; no document
    is created when nothing matches (upsert is disabled). `email` is unused.
    """
    selector = {"recipient":recipient, "id": message_id}
    change = {"$addToSet": {"label_ids": label}}
    res = db["Messages"].update_one(selector, change, upsert=False)
    logging.info(f"\n========\nres: {res}\n=============\ninsert_label_to_message: {label} was added to message {message_id} for recipient {recipient} ==================== \n\n")
def call_all_logic_for_msg_delete(email, msg, db) -> None:
    """
    Apply the database changes for moving a message to TRASH.

    Removes the message id from the user's list of every label the message
    carries, appends it to the user's "TRASH" list and adds the "TRASH" label
    to the stored message itself.
    """
    # Detach the message from each of its current labels on the user document.
    for current_label in msg.label_ids:
        pull_id_from_users_by_label(email, current_label.name, msg.id, db)

    insert_id_to_Users_by_label(email, "TRASH", msg.id, db)
    logging.info(f"\n======\n")
    # The stored message is kept and only tagged with "TRASH".
    insert_label_to_message(email, "TRASH", msg.id, msg.recipient, db)