rag-deepseek / utils.py
fahmiaziz98
add file
1060d7f
raw
history blame contribute delete
708 Bytes
from typing import Dict, List, Optional
def get_page_from_documents(documents: List[Dict]) -> Optional[int]:
    """
    Return the page number of the first document that carries one.

    Each document's ``'metadata'`` mapping is checked for a ``'page'`` entry
    first; if that is absent (or None), ``'page_label'`` is tried and
    converted with ``int(page_label) - 1``.

    Args:
        documents: List of document dicts, e.g. from ``result["documents"]``.
            Each is expected to hold a ``'metadata'`` dict; documents
            without one are skipped.

    Returns:
        The ``'page'`` value as stored, or ``int(page_label) - 1``, from the
        first document that yields one; None if no document does.
    """
    for doc in documents:
        # Tolerate documents with missing or None metadata instead of
        # aborting the whole search with a KeyError/AttributeError.
        metadata = doc.get('metadata') or {}

        page_num = metadata.get('page')
        if page_num is not None:
            return page_num

        page_label = metadata.get('page_label')
        if page_label is None:
            continue

        # NOTE(review): the "- 1" presumably maps a 1-based label onto the
        # 0-based 'page' convention -- confirm against the document loader.
        try:
            return int(page_label) - 1
        except (TypeError, ValueError):
            # Non-numeric label (e.g. "iv") or an unconvertible type:
            # fall through and try the next document.
            continue

    return None