diff --git a/backend/danswer/connectors/google_drive/connector.py b/backend/danswer/connectors/google_drive/connector.py index b1c4a8960c0..c44d2751551 100644 --- a/backend/danswer/connectors/google_drive/connector.py +++ b/backend/danswer/connectors/google_drive/connector.py @@ -334,7 +334,10 @@ def extract_text(file: dict[str, str], service: discovery.Resource) -> str: response = service.files().get_media(fileId=file["id"]).execute() return pptx_to_text(file=io.BytesIO(response)) elif mime_type == GDriveMimeType.PPT.value: - response = service.files().get_media(fileId=file["id"]).execute() + response = service.files().export( + fileId=file["id"], + mimeType="application/vnd.openxmlformats-officedocument.presentationml.presentation" + ).execute() return pptx_to_text(file=io.BytesIO(response)) return UNSUPPORTED_FILE_TYPE_CONTENT