from fastapi import FastAPI, Depends , Request,WebSocket from fastapi.security import OAuth2PasswordBearer import requests from jose import jwt import webbrowser import base64 import logging app = FastAPI() oauth2_scheme = OAuth2PasswordBearer(tokenUrl="token") # Replace these with your own values from the Google Developer Console # GOOGLE_CLIENT_ID = "" # GOOGLE_CLIENT_SECRET = "" # GOOGLE_REDIRECT_URI = "" GOOGLE_CLIENT_ID = "485753721652-5uta3e18va2g6cnkldib2d68q39t4vod.apps.googleusercontent.com" GOOGLE_CLIENT_SECRET = "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" GOOGLE_REDIRECT_URI = "https://omkar008-receipt-radar-test.hf.space/auth/google" GOOGLE_REDIRECT_URI_hr = "https://receiptradar-0bb387d81174.herokuapp.com/auth/google" # Configure the logger logging.basicConfig(level=logging.DEBUG) logger = logging.getLogger(__name__) @app.get("/") async def login_google(): # oauth_url = f"https://accounts.google.com/o/oauth2/auth?response_type=code&client_id={GOOGLE_CLIENT_ID}&redirect_uri={GOOGLE_REDIRECT_URI}&scope=openid%20profile%20email&access_type=offline" #Below is the URL to prompt the user to login to his specified gmail account and also give a readonly access to his gmail oauth_url = f"https://accounts.google.com/o/oauth2/auth?response_type=code&client_id={GOOGLE_CLIENT_ID}&redirect_uri={GOOGLE_REDIRECT_URI}&scope=openid%20profile%20email%20https://www.googleapis.com/auth/gmail.readonly&access_type=offline" oauth_url_hr = f"https://accounts.google.com/o/oauth2/auth?response_type=code&client_id={GOOGLE_CLIENT_ID}&redirect_uri={GOOGLE_REDIRECT_URI_hr}&scope=openid%20profile%20email%20https://www.googleapis.com/auth/gmail.readonly&access_type=offline&state=receipts" webbrowser.open(oauth_url) return { "url":f"https://accounts.google.com/o/oauth2/auth?response_type=code&client_id={GOOGLE_CLIENT_ID}&redirect_uri={GOOGLE_REDIRECT_URI}&scope=openid%20profile%20email&access_type=offline", "url_hr": oauth_url_hr } @app.post("/auth/google") async def auth_google(request: Request): #This code is basically the authorization code and this authorization code helps us to get the access token with the required scopes that we have set . #We require the gmail.readonly scopes that requires verification of our application and all. data = await request.json() code = data.get("access_token") print("Printing the access token") print(code) if not code: raise HTTPException(status_code=400, detail="Authorization code not provided") # token_url = "https://accounts.google.com/o/oauth2/token" # print(code) # data = { # "code": code, # "client_id": GOOGLE_CLIENT_ID, # "client_secret": GOOGLE_CLIENT_SECRET, # "redirect_uri": GOOGLE_REDIRECT_URI, # "grant_type": "authorization_code", # } # response = requests.post(token_url, data=data) # access_token = response.json().get("access_token") access_token_new = code # print(response.json()) # print(access_token_new) user_info = requests.get("https://www.googleapis.com/oauth2/v1/userinfo", headers={"Authorization": f"Bearer {access_token_new}"}) # user_query = data.get("user_query") page_token = None messages = [] jobs_query = "subject:receipt OR subject:receipts has:attachment" while True: # Construct Gmail API request with pageToken gmail_url = f"https://www.googleapis.com/gmail/v1/users/me/messages?q={jobs_query}" if page_token: gmail_url += f"&pageToken={page_token}" gmail_response = requests.get(gmail_url, headers={"Authorization": f"Bearer {access_token_new}"}) gmail_data = gmail_response.json() # Check if there are messages in the response if "messages" in gmail_data: messages.extend(gmail_data["messages"]) # Check if there are more pages if "nextPageToken" in gmail_data: page_token = gmail_data["nextPageToken"] else: break # No more pages, exit the loop # print(len(messages)) # query = "subject:receipt OR subject:receipts has:attachment" # gmail_url = f"https://www.googleapis.com/gmail/v1/users/me/messages?q={query}" # gmail_response = requests.get(gmail_url, headers={"Authorization": f"Bearer {access_token_new}"}) # messages = gmail_response.json().get("messages", []) # print(messages) # print("Printing gmail response") # print(gmail_response.json()) # Fetch attachments from the first message attachments = [] attachment_no = 0 data_new = {} for i,message in enumerate(messages) : # print(i) # print(message) if message: message_id = message.get("id") print(message_id) if message_id: message_url = f"https://www.googleapis.com/gmail/v1/users/me/messages/{message_id}" message_response = requests.get(message_url, headers={"Authorization": f"Bearer {access_token_new}"}) message_data = message_response.json() # Check for parts in the message payload if "payload" in message_data and "parts" in message_data["payload"]: for part in message_data["payload"]["parts"]: if "body" in part and "attachmentId" in part["body"]: attachment_id = part["body"]["attachmentId"] attachment_url = f"https://www.googleapis.com/gmail/v1/users/me/messages/{message_id}/attachments/{attachment_id}" attachment_response = requests.get(attachment_url, headers={"Authorization": f"Bearer {access_token_new}"}) attachment_data = attachment_response.json() data = attachment_data.get("data") filename = part.get("filename", "untitled.txt") if data: data_new[filename]=data # data_new.append({filename:data.encode("UTF-8")}) # Decode base64-encoded attachment data # print(filename) attachment_content = base64.urlsafe_b64decode(data.encode("UTF-8")) # print(attachment_content) print("yo") # print(data_new) attachment_no+=1 # if data: # # Decode base64-encoded attachment data # attachment_content = base64.urlsafe_b64decode(data.encode("UTF-8")) # # Save the attachment to a file # save_path = f"/Users/omkarmalpure/Documents/Gmail_API/attachments/{filename}" # with open(save_path, "wb") as file: # file.write(attachment_content) # attachments.append(save_path) # print(attachments) # print(len(data_new)) return {"attachment_count":attachment_no,"attachment_content":data_new} @app.websocket("/ws") async def test_websocket(websocket: WebSocket): #This code is basically the authorization code and this authorization code helps us to get the access token with the required scopes that we have set . #We require the gmail.readonly scopes that requires verification of our application and all. # raw_body = await request.body() # return {"data":Yo Yo"} # data = await request.json() # code = data.get("access_token") sucess =await websocket.accept() # await print(sucess) # await print("Hi hi working") logger.info("Hi hi succefull in connecting !!") # await websocket.send_json({"message":"Yes Websockets successfull"}) # await print("working after line 163") logger.info("Now receiving json!!") data = await websocket.receive_text() logger.info("Received JSON data: %s", data) # print(data) # code = data.get("message") # print(code) # code = raw_body.decode() await event_generator(data) def get_messages(code:str): print() # print(code) access_token = code print("printing access_token") print(access_token) page_token = None messages = [] jobs_query = "subject:receipt OR subject:receipts has:attachment" while True: # Construct Gmail API request with pageToken print("into the gmail") gmail_url = f"https://www.googleapis.com/gmail/v1/users/me/messages?q={jobs_query}" if page_token: gmail_url += f"&pageToken={page_token}" gmail_response = requests.get(gmail_url, headers={"Authorization": f"Bearer {access_token}"}) print(gmail_response) gmail_data = gmail_response.json() # Check if there are messages in the response if "messages" in gmail_data: messages.extend(gmail_data["messages"]) # Check if there are more pages if "nextPageToken" in gmail_data: page_token = gmail_data["nextPageToken"] else: break # No more pages, exit the loop print("returning the messages") unique_thread_ids = set() filtered_data_list = [] for entry in messages: thread_id = entry['threadId'] if thread_id not in unique_thread_ids: unique_thread_ids.add(thread_id) filtered_data_list.append(entry) print(messages) print(filtered_data_list) return filtered_data_list async def event_generator(code:str): print(code) access_token = code messages=get_messages(access_token) print(len(messages)) await websocket.send(json.dumps({"total_messages": len(messages)})) attachments = [] prev_data="" data_new={} attachment_no=0 batch_size = 5 prev_filename = None for i,message in enumerate(messages) : print(i) print(message) if message: message_id = message.get("id") thread_id = message.get("threadId") print(message_id) if message_id: message_url = f"https://www.googleapis.com/gmail/v1/users/me/messages/{message_id}" message_response = requests.get(message_url, headers={"Authorization": f"Bearer {access_token}"}) message_data = message_response.json() # Check for parts in the message payload if "payload" in message_data and "parts" in message_data["payload"]: for part in message_data["payload"]["parts"]: if "body" in part and "attachmentId" in part["body"]: attachment_id = part["body"]["attachmentId"] print(attachment_id) attachment_url = f"https://www.googleapis.com/gmail/v1/users/me/messages/{message_id}/attachments/{attachment_id}" attachment_response = requests.get(attachment_url, headers={"Authorization": f"Bearer {access_token}"}) attachment_data = attachment_response.json() data = attachment_data.get("data",{}) filename = part.get("filename", "untitled.txt") # print("Print the data json response for that gmail") print(filename) # print(attachment_data) # json_str = json.dumps(attachment_data, indent=2) # with subprocess.Popen(["less"], stdin=subprocess.PIPE) as less_process: # less_process.communicate(input=json_str.encode("utf-8")) if data: data_new[filename]=str(data[:10]) # data_new.append({filename:data.encode("UTF-8")}) # Decode base64-encodattaed attachment data # print(filename)s attachment_content = base64.urlsafe_b64decode(data.encode("UTF-8")) # print(attachment_content) print("yo") # print(data_new) attachment_no+=1 await websocket.send_json({filename:data[:10]}) # yield f"data: {str(data_new)}\n\n" # data_new={} await websocket.send_text("Successfully sent all the Data !") @app.get("/token") async def get_token(token: str = Depends(oauth2_scheme)): return jwt.decode(token, GOOGLE_CLIENT_SECRET, algorithms=["HS256"]) # if __name__ == "__main__": # import uvicorn # uvicorn.run(app, host="0.0.0.0", port=8000)