-
Notifications
You must be signed in to change notification settings - Fork 0
/
divide.py
110 lines (83 loc) · 3.1 KB
/
divide.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
import csv
import re
import sys
# Upper bound on the number of input rows examined in a single run.
times = 20000

# Addresses in fields that contain '{', e.g. "{alice,bob}@example.com".
# The hyphen in the first character class is escaped on purpose: written as
# `\.-}` it formed the range '.'..'}', which left '-' out of the class and
# let in '@', '/', ':', '<', '>' and other unintended characters.
# NOTE(review): the domain part here accepts only lowercase letters, '.' and
# '-', unlike _EMAIL_RE below -- confirm that restriction is intended.
_BRACE_EMAIL_RE = re.compile(r'([{\,\w\.\-}]+@[a-z\.-]+)')

# Addresses in every other field that contains '@'.
_EMAIL_RE = re.compile(r'[\w\.-]+@[\w\.-]+')


def classify_rows(rows, limit=None):
    """Sort CSV rows into buckets according to the text in their second column.

    Args:
        rows: Iterable of rows, each a list of strings (e.g. a ``csv.reader``).
        limit: Maximum number of rows to examine; ``None`` means no limit and
            a value of zero or less examines nothing.

    Returns:
        A 5-tuple of lists ``(all_rows, empty, plain, mid, big)``:

        * ``all_rows`` -- original rows whose second column contains '@'.
        * ``empty`` -- original rows whose second column has no '@', plus
          rows that have fewer than two columns.
        * ``plain`` -- ``[row[0], address]`` pairs from fields with neither
          '{' nor '('.
        * ``mid`` -- ``[row[0], address]`` pairs from fields with '(' but
          no '{'.
        * ``big`` -- ``[row[0], address]`` pairs from fields containing '{'.
    """
    all_rows, empty, plain, mid, big = [], [], [], [], []
    for index, row in enumerate(rows):
        if limit is not None and index >= limit:
            break
        # Blank lines and one-column rows have no second column; treat them
        # as "no address" instead of failing with IndexError.
        field = row[1] if len(row) > 1 else ''
        if '@' not in field:
            empty.append(row)
            continue
        all_rows.append(row)
        if '{' in field:
            pattern, bucket = _BRACE_EMAIL_RE, big
        elif '(' in field:
            pattern, bucket = _EMAIL_RE, mid
        else:
            pattern, bucket = _EMAIL_RE, plain
        bucket.extend([row[0], address] for address in pattern.findall(field))
    return all_rows, empty, plain, mid, big


def _print_section(title, items):
    """Print a titled section followed by one item per line."""
    print('\n' + title + ':\n')
    for item in items:
        print(item)


def _write_rows(path, rows):
    """Write rows to a CSV file at ``path`` and return how many were skipped.

    A row that cannot be written (it cannot be encoded with the file's
    encoding, or the csv module rejects it) is skipped and reported on
    stderr rather than being dropped silently.
    """
    skipped = 0
    with open(path, 'w', newline='') as csvfile:
        writer = csv.writer(csvfile)
        for row in rows:
            try:
                writer.writerow(row)
            except (UnicodeEncodeError, csv.Error) as error:
                skipped += 1
                print('skipped row', repr(row), 'in', path, '-', error,
                      file=sys.stderr)
    return skipped


def main(input_path='email.csv', limit=times):
    """Classify the rows of ``input_path``, print the buckets, write the CSVs.

    Returns the 5-tuple produced by ``classify_rows``.
    """
    with open(input_path, newline='') as csvfile:
        buckets = classify_rows(csv.reader(csvfile), limit)
    _, empty, plain, mid, big = buckets

    _print_section('empty_list', empty)
    _print_section('noneEmp_list', plain)
    _print_section('noneEmp_list_big', big)
    _print_section('noneEmp_list_mid', mid)

    _write_rows('noneEmp_list.csv', plain)
    _write_rows('noneEmp_list_big.csv', big)
    _write_rows('noneEmp_list_mid.csv', mid)
    return buckets


if __name__ == "__main__":
    # Bind the results to module-level names so they remain available for
    # inspection after the script has run.
    (all_list, empty_list, noneEmp_list,
     noneEmp_list_mid, noneEmp_list_big) = main()