From e1770cf3b0fd5eff3e69a8ec28c15018084eae73 Mon Sep 17 00:00:00 2001 From: Nathan Reiner Date: Thu, 6 Jul 2023 11:51:21 +0200 Subject: add extractors for docx, pptx, pdf, etc. --- src/text/odp.rs | 9 +++++++++ 1 file changed, 9 insertions(+) create mode 100644 src/text/odp.rs (limited to 'src/text/odp.rs') diff --git a/src/text/odp.rs b/src/text/odp.rs new file mode 100644 index 0000000..eaed196 --- /dev/null +++ b/src/text/odp.rs @@ -0,0 +1,9 @@ +use std::io::Read; +use dotext::{Odp, doc::OpenOfficeDoc}; + +pub fn get_text(path : &str) -> String { + let mut file = Odp::open(path).unwrap(); + let mut content = String::new(); + let _ = file.read_to_string(&mut content); + content +} -- cgit v1.2.3-70-g09d2