Omkar008 committed on
Commit
c0bad28
1 Parent(s): 3f50e38

Update get_gmail_data.py

Browse files
Files changed (1) hide show
  1. get_gmail_data.py +11 -11
get_gmail_data.py CHANGED
@@ -151,17 +151,14 @@ class GmailDataExtractor:
151
  payload = message_data['payload']['headers']
152
  print("printing headers response")
153
  print(payload)
154
- print()
155
- print()
156
- brand_from_gmail = ''
157
  company_from_gmail = ''
158
- # if payload['headers']['name'] == 'from':
159
- # brand_from_gmail = payload['headers']['value']
160
- # company_from_gmail = extract_domain_from_email(brand_from_gmail)
161
- # else:
162
- # company_from_gmail = None
163
-
164
-
165
  for part in parts:
166
  if 'mimeType' not in part:
167
  continue
@@ -218,7 +215,10 @@ class GmailDataExtractor:
218
  # Extract text
219
  text = soup.get_text(separator=' ')
220
  text = re.sub(r'\s+', ' ', text).strip()
221
-
 
 
 
222
  # Extract links
223
  links = [(link.text, link['href']) for link in soup.find_all('a', href=True)]
224
 
 
151
  payload = message_data['payload']['headers']
152
  print("printing headers response")
153
  print(payload)
 
 
 
154
  company_from_gmail = ''
155
+
156
+ #Extracting the domain name from the senders email
157
+ for fromdata in payload:
158
+ if fromdata['name'] == 'From':
159
+ company_from_gmail = extract_domain_from_email(fromdata['value'])
160
+ break
161
+
162
  for part in parts:
163
  if 'mimeType' not in part:
164
  continue
 
215
  # Extract text
216
  text = soup.get_text(separator=' ')
217
  text = re.sub(r'\s+', ' ', text).strip()
218
+ print("Printing the extracted text from the html")
219
+ print(text)
220
+ print()
221
+ print()
222
  # Extract links
223
  links = [(link.text, link['href']) for link in soup.find_all('a', href=True)]
224