Skip to content
Draft
Changes from all commits
Commits
Show all changes
38 commits
Select commit Hold shift + click to select a range
cbed950
fix: doc fine mode bug
CaralHsi Dec 7, 2025
20e0839
fix: doc fine mode bug
CaralHsi Dec 7, 2025
fff0fb2
feat: init longbench_v2
CaralHsi Dec 7, 2025
15562c4
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 7, 2025
9beabba
feat: more strict embedder truncation
CaralHsi Dec 7, 2025
fc54da8
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 7, 2025
8f368bb
feat: parallel processing fine mode in multi-modal-fine
CaralHsi Dec 7, 2025
54897a9
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 7, 2025
be293bc
feat: update parsers; add chunk info into source; remove origin_part
CaralHsi Dec 8, 2025
ba1c161
fix: conflict
CaralHsi Dec 8, 2025
8e8b91b
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 8, 2025
2edd0a3
feat: modify chunk_content in file-fine-parser
CaralHsi Dec 8, 2025
6991ed7
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 8, 2025
45609ab
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 8, 2025
f80896e
fix: token counter bug
CaralHsi Dec 8, 2025
a3f2b32
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 8, 2025
b375d51
feat: enlarge polardb
CaralHsi Dec 8, 2025
0bfcaa9
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 8, 2025
69dd3a8
feat: decrease parallelism
CaralHsi Dec 8, 2025
7fa7b77
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 8, 2025
ac38046
feat: add image parser in file
CaralHsi Dec 8, 2025
ef02140
feat: add image parser in file
CaralHsi Dec 8, 2025
37bcc90
feat: update file_content_parser
CaralHsi Dec 8, 2025
7e2adb4
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 8, 2025
20af5d0
feat: modify long_bench_v2
CaralHsi Dec 9, 2025
ec34637
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 9, 2025
31ad564
Merge branch 'dev' of github.com:MemTensor/MemOS into feat/evaluation…
CaralHsi Dec 9, 2025
72eb129
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 9, 2025
0ef1bb5
feat: modify long_bench_v2
CaralHsi Dec 9, 2025
cf1291b
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 9, 2025
1ecf03e
Merge branch 'dev' of github.com:MemTensor/MemOS into feat/evaluation…
CaralHsi Dec 9, 2025
b58ee88
fix: image bug
CaralHsi Dec 9, 2025
f94b001
feat: increase playground depth
CaralHsi Dec 9, 2025
3819dae
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 9, 2025
eba9e96
feat: set parsed_text None in file parser
CaralHsi Dec 9, 2025
5504d8d
Merge branch 'feat/evaluation_doc_qa' of github.com:CaralHsi/MemOSRea…
CaralHsi Dec 9, 2025
5c496ee
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 9, 2025
a8ac57c
Merge branch 'dev' into feat/evaluation_doc_qa
CaralHsi Dec 9, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
14 changes: 2 additions & 12 deletions src/memos/mem_reader/read_multi_modal/file_content_parser.py
Original file line number Diff line number Diff line change
Expand Up @@ -612,8 +612,6 @@ def parse_fine(
# Use parser from utils
if parser:
parsed_text = parser.parse(temp_file_path)
else:
parsed_text = "[File parsing error: Parser not available]"
except Exception as e:
logger.error(
f"[FileContentParser] Error parsing downloaded file: {e}"
Expand All @@ -633,18 +631,9 @@ def parse_fine(
# Priority 2: If file_id is provided but no file_data, try to use file_id as path
elif file_id:
logger.warning(f"[FileContentParser] File data not provided for file_id: {file_id}")
parsed_text = f"[File ID: {file_id}]: File data not provided"

# If no content could be parsed, create a placeholder
if not parsed_text:
if filename:
parsed_text = f"[File: {filename}] File data not provided"
else:
parsed_text = "[File: unknown] File data not provided"

except Exception as e:
logger.error(f"[FileContentParser] Error in parse_fine: {e}")
parsed_text = f"[File parsing error: {e!s}]"

finally:
# Clean up temporary file
Expand All @@ -656,7 +645,8 @@ def parse_fine(
logger.warning(
f"[FileContentParser] Failed to delete temp file {temp_file_path}: {e}"
)

if not parsed_text:
return []
# Extract and process images from parsed_text
if is_markdown and parsed_text and self.image_parser:
parsed_text = self._extract_and_process_images(parsed_text, info, **kwargs)
Expand Down