Skip to content

Commit 3dc34dd

Browse files
committed
CW comments
1 parent e3167a4 commit 3dc34dd

File tree

4 files changed: 8 additions and 56 deletions

4 files changed: 8 additions and 56 deletions

backend/ee/onyx/server/reporting/usage_export_generation.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def generate_chat_messages_report(
6767
file_id = file_store.save_file(
6868
content=temp_file,
6969
display_name=file_name,
70-
file_origin=FileOrigin.OTHER,
70+
file_origin=FileOrigin.GENERATED_REPORT,
7171
file_type="text/csv",
7272
)
7373

@@ -99,7 +99,7 @@ def generate_user_report(
9999
file_id = file_store.save_file(
100100
content=temp_file,
101101
display_name=file_name,
102-
file_origin=FileOrigin.OTHER,
102+
file_origin=FileOrigin.GENERATED_REPORT,
103103
file_type="text/csv",
104104
)
105105

backend/onyx/indexing/indexing_pipeline.py

Lines changed: 1 addition & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -867,13 +867,8 @@ def index_doc_batch(
867867
user_file_id_to_raw_text: dict[int, str] = {}
868868
for document_id in updatable_ids:
869869
# Only calculate token counts for documents that have a user file ID
870-
if (
871-
document_id not in doc_id_to_user_file_id
872-
or doc_id_to_user_file_id[document_id] is None
873-
):
874-
continue
875870

876-
user_file_id = doc_id_to_user_file_id[document_id]
871+
user_file_id = doc_id_to_user_file_id.get(document_id)
877872
if user_file_id is None:
878873
continue
879874

backend/onyx/server/documents/connector.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -441,7 +441,9 @@ def is_zip_file(file: UploadFile) -> bool:
441441
)
442442

443443

444-
def upload_files(files: list[UploadFile]) -> FileUploadResponse:
444+
def upload_files(
445+
files: list[UploadFile], file_origin: FileOrigin = FileOrigin.CONNECTOR
446+
) -> FileUploadResponse:
445447
for file in files:
446448
if not file.filename:
447449
raise HTTPException(status_code=400, detail="File name cannot be empty")
@@ -497,7 +499,7 @@ def should_process_file(file_path: str) -> bool:
497499
text_file_id = file_store.save_file(
498500
content=io.BytesIO(extracted_text.encode()),
499501
display_name=file.filename,
500-
file_origin=FileOrigin.CHAT_UPLOAD,
502+
file_origin=file_origin,
501503
file_type="text/plain",
502504
)
503505
deduped_file_paths.append(text_file_id)
@@ -528,7 +530,7 @@ def upload_files_api(
528530
files: list[UploadFile],
529531
_: User = Depends(current_curator_or_admin_user),
530532
) -> FileUploadResponse:
531-
return upload_files(files)
533+
return upload_files(files, FileOrigin.OTHER)
532534

533535

534536
@router.get("/admin/connector")

backend/onyx/server/query_and_chat/chat_backend.py

Lines changed: 0 additions & 45 deletions
Original file line number | Diff line number | Diff line change
@@ -716,51 +716,6 @@ def upload_files_for_chat(
716716
detail="Images must be less than 20MB",
717717
)
718718

719-
# file_store = get_default_file_store()
720-
721-
# file_info: list[tuple[str, str | None, ChatFileType]] = []
722-
# for file in files:
723-
# file_type = mime_type_to_chat_file_type(file.content_type)
724-
725-
# file_content = file.file.read() # Read the file content
726-
727-
# # NOTE: Image conversion to JPEG used to be enforced here.
728-
# # This was removed to:
729-
# # 1. Preserve original file content for downloads
730-
# # 2. Maintain transparency in formats like PNG
731-
# # 3. Ameliorate issue with file conversion
732-
# file_content_io = io.BytesIO(file_content)
733-
734-
# new_content_type = file.content_type
735-
736-
# # Store the file normally
737-
# file_id = file_store.save_file(
738-
# content=file_content_io,
739-
# display_name=file.filename,
740-
# file_origin=FileOrigin.CHAT_UPLOAD,
741-
# file_type=new_content_type or file_type.value,
742-
# )
743-
744-
# # 4) If the file is a doc, extract text and store that separately
745-
# if file_type == ChatFileType.DOC:
746-
# # Re-wrap bytes in a fresh BytesIO so we start at position 0
747-
# extracted_text_io = io.BytesIO(file_content)
748-
# extracted_text = extract_file_text(
749-
# file=extracted_text_io, # use the bytes we already read
750-
# file_name=file.filename or "",
751-
# )
752-
753-
# text_file_id = file_store.save_file(
754-
# content=io.BytesIO(extracted_text.encode()),
755-
# display_name=file.filename,
756-
# file_origin=FileOrigin.CHAT_UPLOAD,
757-
# file_type="text/plain",
758-
# )
759-
# # Return the text file as the "main" file descriptor for doc types
760-
# file_info.append((text_file_id, file.filename, ChatFileType.PLAIN_TEXT))
761-
# else:
762-
# file_info.append((file_id, file.filename, file_type))
763-
764719
# 5) Create a user file for each uploaded file
765720
user_files = create_user_files(files, RECENT_DOCS_FOLDER_ID, user, db_session)
766721
for user_file in user_files:

0 commit comments

Comments
 (0)