From e1770cf3b0fd5eff3e69a8ec28c15018084eae73 Mon Sep 17 00:00:00 2001 From: Nathan Reiner Date: Thu, 6 Jul 2023 11:51:21 +0200 Subject: add extractors for docx, pptx, pdf, etc. --- src/text/pptx.rs | 9 +++++++++ 1 file changed, 9 insertions(+) create mode 100644 src/text/pptx.rs (limited to 'src/text/pptx.rs') diff --git a/src/text/pptx.rs b/src/text/pptx.rs new file mode 100644 index 0000000..7dac77e --- /dev/null +++ b/src/text/pptx.rs @@ -0,0 +1,9 @@ +use std::io::Read; +use dotext::{Pptx, MsDoc}; + +pub fn get_text(path : &str) -> String { + let mut file = Pptx::open(path).unwrap(); + let mut content = String::new(); + let _ = file.read_to_string(&mut content); + content +} -- cgit v1.2.3-70-g09d2