Spaces:
Sleeping
Sleeping
Update get_gmail_data.py
Browse files- get_gmail_data.py +11 -11
get_gmail_data.py
CHANGED
@@ -151,17 +151,14 @@ class GmailDataExtractor:
|
|
151 |
payload = message_data['payload']['headers']
|
152 |
print("printing headers response")
|
153 |
print(payload)
|
154 |
-
print()
|
155 |
-
print()
|
156 |
-
brand_from_gmail = ''
|
157 |
company_from_gmail = ''
|
158 |
-
|
159 |
-
#
|
160 |
-
|
161 |
-
|
162 |
-
|
163 |
-
|
164 |
-
|
165 |
for part in parts:
|
166 |
if 'mimeType' not in part:
|
167 |
continue
|
@@ -218,7 +215,10 @@ class GmailDataExtractor:
|
|
218 |
# Extract text
|
219 |
text = soup.get_text(separator=' ')
|
220 |
text = re.sub(r'\s+', ' ', text).strip()
|
221 |
-
|
|
|
|
|
|
|
222 |
# Extract links
|
223 |
links = [(link.text, link['href']) for link in soup.find_all('a', href=True)]
|
224 |
|
|
|
151 |
payload = message_data['payload']['headers']
|
152 |
print("printing headers response")
|
153 |
print(payload)
|
|
|
|
|
|
|
154 |
company_from_gmail = ''
|
155 |
+
|
156 |
+
# Extracting the domain name from the sender's email
|
157 |
+
for fromdata in payload:
|
158 |
+
if fromdata['name'] == 'From':
|
159 |
+
company_from_gmail = extract_domain_from_email(fromdata['value'])
|
160 |
+
break
|
161 |
+
|
162 |
for part in parts:
|
163 |
if 'mimeType' not in part:
|
164 |
continue
|
|
|
215 |
# Extract text
|
216 |
text = soup.get_text(separator=' ')
|
217 |
text = re.sub(r'\s+', ' ', text).strip()
|
218 |
+
print("Printing the extracted text from the html")
|
219 |
+
print(text)
|
220 |
+
print()
|
221 |
+
print()
|
222 |
# Extract links
|
223 |
links = [(link.text, link['href']) for link in soup.find_all('a', href=True)]
|
224 |
|