-
Notifications
You must be signed in to change notification settings - Fork 0
/
gmail_stats_sender.py
77 lines (66 loc) · 3.33 KB
/
gmail_stats_sender.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
import pickle
import os.path
from googleapiclient.discovery import build
from google_auth_oauthlib.flow import InstalledAppFlow
from google.auth.transport.requests import Request
from datetime import datetime
from collections import Counter
# OAuth scopes requested during the authorization flow; only the read-only
# Gmail scope is asked for.
# If modifying these scopes, delete the file token.pickle so that the cached
# credentials are discarded and the authorization flow runs again.
SCOPES = ['https://www.googleapis.com/auth/gmail.readonly']
def _load_credentials():
    """Return Gmail API credentials, running the OAuth flow when needed.

    Credentials are cached in ``token.pickle`` in the working directory.
    When the cache is missing or invalid, the credentials are refreshed (if a
    refresh token is available) or obtained through the local-server OAuth
    flow configured by ``credentials.json``, then written back to the cache.
    The login code follows quickstart.py from
    https://developers.google.com/gmail/api/quickstart/python
    """
    creds = None
    # The file token.pickle stores the user's access and refresh tokens, and
    # is created automatically when the authorization flow completes for the
    # first time.
    # NOTE(security): unpickling runs arbitrary code from a crafted file, so
    # token.pickle must only ever be a file written by this script.
    if os.path.exists('token.pickle'):
        with open('token.pickle', 'rb') as token:
            creds = pickle.load(token)
    # If there are no (valid) credentials available, let the user log in.
    if not creds or not creds.valid:
        if creds and creds.expired and creds.refresh_token:
            creds.refresh(Request())
        else:
            flow = InstalledAppFlow.from_client_secrets_file(
                'credentials.json', SCOPES)
            creds = flow.run_local_server(port=0)
        # Save the credentials for the next run.
        with open('token.pickle', 'wb') as token:
            pickle.dump(creds, token)
    return creds


def _list_messages(service, label):
    """Return all message entries carrying ``label``, following every page.

    Args:
        service: Gmail API service object returned by ``build``.
        label: Label id to filter on (e.g. ``CATEGORY_SOCIAL``).

    Returns:
        A list of the ``messages`` entries from every result page; empty when
        the label matches nothing.
    """
    messages = []
    page_token = None
    while True:
        request_args = {'labelIds': label, 'userId': 'me'}
        # Only send pageToken once the API has handed one back.
        if page_token:
            request_args['pageToken'] = page_token
        results = service.users().messages().list(**request_args).execute()
        # extend() grows the list in place instead of re-copying it per page.
        messages.extend(results.get('messages', []))
        page_token = results.get('nextPageToken')
        if not page_token:
            return messages


def _fetch_sender(service, message_id):
    """Return the From header value of one message.

    Only the From header is requested (``format='metadata'``), so the first
    returned header is used. A message without that header yields a
    placeholder instead of raising, so one odd message cannot abort the run.
    """
    content = service.users().messages().get(
        userId='me', id=message_id, format='metadata',
        metadataHeaders='From').execute()
    headers = content.get('payload', {}).get('headers', [])
    if not headers:
        return '(no From header)'
    return headers[0].get('value', '(no From header)')


def _write_counts(filename, counts):
    """Write one ``sender count`` line per entry of ``counts`` to ``filename``.

    The file is written as UTF-8 because sender display names are frequently
    non-ASCII and the platform default encoding may not be able to encode
    them.
    """
    with open(filename, 'w', encoding='utf-8') as wf:
        wf.write('\n'.join('%s %s' % item for item in counts))


def main():
    """Count the senders of all messages in one Gmail category.

    Lists every message carrying the chosen label, reads the From header of
    each one, counts how often each sender occurs and writes the senders,
    most frequent first, to ``results_<label>_<timestamp>.txt``. Progress is
    printed with timestamps. When the label has no messages, ``Error`` is
    printed and no file is written.
    """
    service = build('gmail', 'v1', credentials=_load_credentials())

    # Label whose messages are analysed
    # (CATEGORY_PROMOTIONS, CATEGORY_SOCIAL, ...).
    label = 'CATEGORY_SOCIAL'
    print(datetime.now(), 'Start collecting messages ...')
    messages = _list_messages(service, label)
    print(datetime.now(), 'End collecting messages ...')

    if not messages:
        # Nothing to count for this label.
        print('Error')
        return

    print(datetime.now(), 'Collecting data from message headers using get (can take a while) ...')
    print(datetime.now(), 'Total number of messages : ', len(messages))
    # One API request per message; this is the slow part of the run.
    senders = [_fetch_sender(service, message['id']) for message in messages]
    print(datetime.now(), 'Finished collecting header From ... Starting to count occurences')

    # most_common() yields (sender, count) tuples, most frequent first.
    unique_senders = Counter(senders).most_common()
    print(datetime.now(), 'Finished counting occurences ... Writing to file')

    filename = 'results_' + label + '_' + datetime.now().strftime("%Y%m%d%H%M") + '.txt'
    _write_counts(filename, unique_senders)
    print(datetime.now(), 'Finished writing to file', filename)
# Run the collection only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()