Refactor variable names for clarity in the PDF processing loop

This commit is contained in:
Thorsten Sommer 2025-05-02 15:36:57 +02:00
parent 10d4a2d353
commit ecaabfaa2a
Signed by: tsommer
GPG Key ID: 371BBA77A02C0108

View File

@@ -153,16 +153,16 @@ async fn stream_pdf(file_path: &str) -> Result<ChunkStream> {
tokio::task::spawn_blocking(move || { tokio::task::spawn_blocking(move || {
let pdfium = Pdfium::default(); let pdfium = Pdfium::default();
let doc = match pdfium.load_pdf_from_file(&path, None) { let doc = match pdfium.load_pdf_from_file(&path, None) {
Ok(d) => d, Ok(document) => document,
Err(e) => { Err(e) => {
let _ = tx.blocking_send(Err(e.into())); let _ = tx.blocking_send(Err(e.into()));
return; return;
} }
}; };
for (i, page) in doc.pages().iter().enumerate() { for (num_page, page) in doc.pages().iter().enumerate() {
let content = match page.text().map(|t| t.all()) { let content = match page.text().map(|t| t.all()) {
Ok(c) => c, Ok(text_content) => text_content,
Err(e) => { Err(e) => {
let _ = tx.blocking_send(Err(e.into())); let _ = tx.blocking_send(Err(e.into()));
continue; continue;
@@ -171,7 +171,7 @@ async fn stream_pdf(file_path: &str) -> Result<ChunkStream> {
if tx.blocking_send(Ok(Chunk { if tx.blocking_send(Ok(Chunk {
content, content,
metadata: Metadata::Pdf { page_number: i + 1 }, metadata: Metadata::Pdf { page_number: num_page + 1 },
})).is_err() { })).is_err() {
break; break;
} }