-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy patharchive.py
311 lines (277 loc) · 11.2 KB
/
archive.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
import configparser
import requests
import urllib
import zipfile
import logging
import logging.config
import os
import hashlib
import tarfile
from datetime import datetime, timedelta
from webdav3.client import Client
import smtplib
from email.mime.multipart import MIMEMultipart
from email.mime.text import MIMEText
from email.mime.application import MIMEApplication
import requests
## SUCCESS VARIABLE
confSuccess = False
downloadZipSuccess = False
zipExtractedSuccess = False
diffDateSuccess = False
sentToServerSuccess = False
checkOutdated = False
success = False
def send_success_mail(receiver):
try:
today = datetime.today().strftime('%H:%M')
conservation = server_conf["CONSERVATION_TIME"]
msg = MIMEMultipart()
msg['From'] = 'Archive Manager'
msg['To'] = receiver
msg['Subject'] = 'Notification : Archiving completed'
message = "Hello, \n The archiving of the file was completed at "+ today+". \n The operation was successful and will be repeated in "+ conservation +" days. \n See you soon"
msg.attach(MIMEText(message))
mailserver = smtplib.SMTP('smtp.gmail.com', 587)
mailserver.ehlo()
mailserver.starttls()
mailserver.ehlo()
mailserver.login(mail_conf['USERNAME'], mail_conf['PASSWORD'])
mailserver.sendmail(receiver, receiver, msg.as_string())
mailserver.quit()
print("Mail sent to "+receiver)
except:
print("Error while sending mail to "+ receiver)
def send_error_mail(receiver):
try:
today = datetime.today().strftime('%H:%M')
conservation = server_conf["CONSERVATION_TIME"]
msg = MIMEMultipart()
msg['From'] = 'Archive Manager'
msg['To'] = receiver
with open("archive.log", "rb") as fil:
part = MIMEApplication(
fil.read(),
Name= os.path.basename('archive.log')
)
# After the file is closed
part['Content-Disposition'] = 'attachment; filename="%s"' % os.path.basename('archive.log')
msg['Subject'] = 'Notification : Error while archiving'
message = "Hello, \n The archiving of the file failed at "+ today+". \n The operation was unsuccessful and will be repeated in "+ conservation +" days. \n You can check the log report in attachment. \n See you soon"
msg.attach(MIMEText(message))
msg.attach(part)
mailserver = smtplib.SMTP('smtp.gmail.com', 587)
mailserver.ehlo()
mailserver.starttls()
mailserver.ehlo()
mailserver.login(mail_conf['USERNAME'], mail_conf['PASSWORD'])
mailserver.sendmail(receiver, receiver, msg.as_string())
mailserver.quit()
print("Mail sent to "+receiver)
except:
print("Error while sending mail to "+ receiver)
def make_tarfile(output_filename, source_dir):
with tarfile.open(output_filename, "w:gz") as tar:
tar.add(source_dir, arcname=os.path.basename(source_dir))
def hash_file(filename):
""""This function returns the SHA-1 hash
of the file passed into it"""
# make a hash object
h = hashlib.sha1()
# open file for reading in binary mode
with open(filename,'rb') as file:
# loop till the end of the file
chunk = 0
while chunk != b'':
# read only 1024 bytes at a time
chunk = file.read(1024)
h.update(chunk)
# return the hex representation of digest
return h.hexdigest()
def hash_zip(zipfile):
sha1 = hashlib.sha1()
blocksize = 1024**2 #1M chunks
while True:
block = zipfile.read(blocksize)
if not block:
break
sha1.update(block)
return sha1.hexdigest()
def dowloadFileFromUrl(url):
global downloadZipSuccess
file_name = url.split('/')[-1]
u = urllib.request.urlopen(url)
f = open(file_name, 'wb')
meta = u.info()
file_size = int(u.info()["Content-Length"])
print("Downloading: %s Bytes: %s" % (file_name, file_size))
file_size_dl = 0
block_sz = 8192
prct = 0.0
while True:
buffer = u.read(block_sz)
if not buffer:
break
file_size_dl += len(buffer)
f.write(buffer)
prct = (file_size_dl, file_size_dl * 100. / file_size)
progress = r"%10d [%3.2f%%]" % prct
print(progress)
if prct[1] == 100.00:
logger.info(file_name+ "("+ str(file_size)+" bytes) "+ "downloaded with success")
downloadZipSuccess = True
else:
logger.error("Can't download " + file_name+" (", str(file_size)+ " bytes)")
downloadZipSuccess = False
f.close()
return file_name
## GET CONFIG
try:
config = configparser.ConfigParser()
config.read('conf.ini')
file_conf = config['FILE']
server_conf = config['SERVER']
mail_conf = config['MAIL']
mattermost_conf = config['MATTERMOST']
confSuccess = True
except:
confSuccess = False
## INSTANCE LOG FILE
logger = logging.getLogger("archive") # > set up a new name for a new logger
logger.setLevel(logging.DEBUG) # here is the missing line
log_format = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
log_handler = logging.FileHandler("archive.log")
log_handler.setLevel(logging.DEBUG)
log_handler.setFormatter(log_format)
logger.addHandler(log_handler)
## LOG STARTUP
logger.info("Starting script...")
## DOWNLOAD FILE FROM SERVER
r = requests.get(file_conf['URL'])
if r.status_code != 404:
print('Resource found ! Downloading...')
file_name = dowloadFileFromUrl(file_conf['URL'])
## UNZIP DOWLOADED ZIP AND EXTRACT TO /resources
with zipfile.ZipFile(file_name, 'r') as zip_ref:
listOfFileNames = zip_ref.namelist()
nbDownload = 0
same = False
for fileName in listOfFileNames:
print(fileName)
if fileName == file_conf['SQLFILE']:
# Extract a single file from zip
hash = hash_zip(zip_ref.open(fileName))
if os.path.isfile("./resources/"+file_conf['SQLFILE']):
if hash == hash_file("./resources/"+file_conf['SQLFILE']):
same = True
logger.error(file_conf['SQLFILE']+ " same as yesterday (hash: "+hash+")")
else:
zip_ref.extract(fileName, "./resources")
nbDownload+=1
diffDateSuccess = True
else:
zip_ref.extract(fileName, "./resources")
nbDownload+=1
diffDateSuccess = True
if nbDownload == 0:
logger.error(file_conf['SQLFILE']+ " not extracted ! Aborting...")
zipExtractedSuccess = False
else:
logger.info(file_conf['SQLFILE']+ ' extracted with success in /resources/'+fileName)
zipExtractedSuccess = True
## CONNECTION TO A REMOTE SERVER (WEBDAV)
options = {
'webdav_hostname': server_conf['URL'],
'webdav_login': server_conf['USERNAME'],
'webdav_password': server_conf['PASSWORD']
}
try:
logger.info("Connecting to remote server...")
client = Client(options)
client.verify = False # To not check SSL certificates (Default = True)
client.mkdir('archive')
logger.info("Connected !")
## CHECK CONSERVATION TIME FOR .tgz FILES
expiration = datetime.today() - timedelta(days=int(server_conf['CONSERVATION_TIME']))
try:
logger.info('Checking for expired files...')
files = client.list("archive", get_info=True)
for file in files:
if file['content_type'] == 'application/x-gzip':
date_str = file['path'].split('/')[3].split('.')[0]
date_file = datetime.strptime(date_str, '%Y%d%m')
if date_file < expiration:
path = file["path"].split('/')[2] + "/"+file["path"].split('/')[3]
client.clean(path)
logger.info(date_str+".tgz too old ! Deleting...")
logger.info('Folder is up to date !')
checkOutdated = True
success = True
except:
logger.error("Error while checking for expired files")
checkOutdated = False
## CREATE .tgz FILE AND UPLOAD
if not same:
## CREATE AAAADDMM.tgz FILE
today = datetime.today().strftime('%Y%d%m')
new_filename = today+".tgz"
make_tarfile("./resources/"+new_filename, "./resources/"+file_conf['SQLFILE'])
logger.info(new_filename+" file created in ./resources")
print(new_filename+" file created in ./resources")
## UPLOAD .tgz ON SERVER
try:
client.upload_sync(remote_path="archive/"+new_filename, local_path="./resources/"+new_filename)
logger.info("Uploaded !")
success = True
sentToServerSuccess = True
except:
success = False
logger.error("Error while uploading data to server")
except:
logger.error("Error while connecting to server : " + server_conf['URL'])
else:
logger.error(file_conf['URL'] + " not found (HTTP ERROR 404)")
success = False
## SENDING MAILS
mail_list = mail_conf['MAIL_LIST'].split(' ')
if success:
for mail in mail_list:
send_success_mail(mail)
else:
for mail in mail_list:
send_error_mail(mail)
## SEND MATTERMOST NOTIFICATION
today = datetime.today().strftime('%d %B, %Y')
subject = "#### Archiving report for "+ today+"\nPlease, check logs if some errors occured.\n"
if confSuccess:
confSuccessMessage = ":white_check_mark: |"
else:
confSuccessMessage = ":warning: |"
if downloadZipSuccess:
downloadSuccessMessage = ":white_check_mark: |"
else:
downloadSuccessMessage = ":warning: |"
if zipExtractedSuccess:
extractedSuccessMessage = ":white_check_mark: |"
else:
extractedSuccessMessage = ":warning: |"
if diffDateSuccess:
diffSuccessMessage = ":white_check_mark: |"
else:
diffSuccessMessage = ":warning: |"
if sentToServerSuccess:
sentSuccessMessage = ":white_check_mark: |"
else:
sentSuccessMessage = ":warning: |"
if checkOutdated:
outdatedMessage = ":white_check_mark: |"
else:
outdatedMessage = ":warning: |"
headers = {'Content-type': 'application/json', 'Accept': 'text/plain'}
table ="| Task | State |\n"+"|:-----------------|:-------------------|\n"+"| Get config data | "+ confSuccessMessage +"\n" +"| Download zip | "+ downloadSuccessMessage+"\n" +"| Zip extracted | "+ extractedSuccessMessage+"\n" +"| Different file | "+ diffSuccessMessage+"\n"+"| Check for outdated files | "+ outdatedMessage+"\n" +"| Archive uploaded | "+sentSuccessMessage
data = {"username": "Archive Manager","icon_url": "https://mattermost.org/wp-content/uploads/2016/04/icon.png","text": subject + "\n" + table}
try:
x = requests.post(mattermost_conf['WEBHOOK'],data = json.dumps(data), headers = headers)
logger.info("Mattermost webhook notification done ! (" + mattermost_conf['WEBHOOK'] + ")")
except:
logger.error("Mattermost webhook notification failed ! Check the url or you might exceeded the allowed rate of requests. (" + mattermost_conf['WEBHOOK']+ ")")