-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathcsvemailverifier.py
executable file
·106 lines (95 loc) · 4.22 KB
/
csvemailverifier.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
#!/usr/bin/python2
# CSVEmailVerifier by Mte90
# First parameter [mandatory]: the path of the csv file (csv separator column separator as ,)
# Second parameter [mandatory]: the number of the email column
# Third parameter: export in two different csv file the output [true|false (default)]
# Forth parameter: jump first line [true|false (default)]
import csv
import os.path
import sys
import time
from email_validator import validate_email
start_time = time.time()
if len(sys.argv) < 3:
print("CSVEmailVerifier by Mte90")
print("First parameter [mandatory]: the path of the csv file (csv separator column separator as ,)")
print("Second parameter [mandatory]: the number of the email column")
print("Third parameter: export in two different csv file the output [true|false (default)]")
print("Forth parameter: jump first line [true|false (default)]")
sys.exit()
print("CSVEmailVerifier 1.0 by Mte90 for Codeat - https://github.com/CodeAtCode")
def validate(email):
try:
validate_email(email)
except:
return False
return True
# Check if file exists
if os.path.isfile(sys.argv[1]):
file = sys.argv[1]
position = int(sys.argv[2]) # Column no. for the email
to_jump = False
to_write = False
if len(sys.argv) >= 4 and sys.argv[3].lower() == 'true':
to_write = True
if len(sys.argv) == 5 and sys.argv[4].lower() == 'true':
to_jump = True
with open(file, 'rb') as csv_file:
print("Evaluating in progress...")
# Prepare the output files
if to_write:
dirname = os.path.dirname(file)
if(dirname == '.'):
dirname = '.'
correct_file = open(dirname + '/correct.' + os.path.basename(file), "wb")
correct_object = csv.writer(correct_file, delimiter=',', quotechar='"', quoting=csv.QUOTE_ALL)
wrong_file = open(dirname + '/wrong.' + os.path.basename(file), "wb")
wrong_object = csv.writer(wrong_file, delimiter=',', quotechar='"', quoting=csv.QUOTE_ALL)
missing_file = open(dirname + '/missing.' + os.path.basename(file), "wb")
missing_object = csv.writer(missing_file, delimiter=',', quotechar='"', quoting=csv.QUOTE_ALL)
# Read the input file
email_checking = csv.reader(csv_file, delimiter=',', quotechar='|')
line_no = 0
for row in email_checking:
line_no += 1
# Reading the first line that contain the title of the column
if line_no == 1:
if not(to_jump) and to_write:
wrong_object.writerow(row)
correct_object.writerow(row)
else:
email = row[position]
if email != '':
if validate(email.strip()):
print(" Email " + str(line_no - 1) + " " + email + " exists!")
# Save the output
if to_write:
correct_object.writerow(row)
correct_file.flush()
else:
print(" Email " + str(line_no - 1) + " " + email + " not exists!")
# Save the output
if to_write:
wrong_object.writerow(row)
wrong_file.flush()
else:
print(" Email " + str(line_no - 1) + " is empty!")
if to_write:
missing_object.writerow(row)
missing_file.flush()
if to_write:
correct_file.close()
wrong_file.close()
missing_file.close()
print("Check in the same path of the input file for the 'correct."
+ os.path.basename(file) + "', 'wrong." + os.path.basename(file)
+ "', and 'missing." + os.path.basename(file) + "' output files.")
# File elaboration finished
calculate = int(time.time() - start_time)
if calculate == 0:
calculate = 1
print("Processed " + str(line_no - 1) + " emails in " +\
str(calculate) + " second" + ['', 's'][bool(calculate-1)]) + "."
else:
print("The file" + sys.argv[1] + " does not exist")
sys.exit()