docx_template/
docx.rs

1use crate::error::DocxError;
2use crate::image::{DOCX_EMU, DocxImage};
3use quick_xml::Writer;
4use quick_xml::events::{BytesDecl, BytesEnd, BytesStart, BytesText, Event};
5use reqwest::Client;
6use std::collections::HashMap;
7use std::fs::File;
8use std::io::{Cursor, Read, Write};
9use std::path::Path;
10use std::time::Duration;
11use zip::write::SimpleFileOptions;
12use zip::{ZipArchive, ZipWriter};
13
14pub struct DocxTemplate {
15    // 待替换的字符串
16    text_replacements: HashMap<String, String>,
17    // 待替换的图片
18    image_replacements: HashMap<String, Option<DocxImage>>,
19    // 请求对象
20    client: Client,
21}
22
23impl DocxTemplate {
24    pub fn new() -> Self {
25        DocxTemplate {
26            text_replacements: HashMap::new(),
27            image_replacements: HashMap::new(),
28            client: Client::builder()
29                .timeout(Duration::from_secs(10)) // 设置超时
30                .build()
31                .unwrap(),
32        }
33    }
34
35    /// 添加待替换的字符以及对应的值  
36    /// @param placeholder 待替换的字符串  
37    /// @param value 替换的值  
38    pub fn add_text_replacement(&mut self, placeholder: &str, value: &str) {
39        self.text_replacements
40            .insert(placeholder.to_string(), value.to_string());
41    }
42
43    /// 添加待替换的图片  
44    /// @param placeholder 待替换的字符串  
45    /// @param image_path 图片路径  
46    pub fn add_image_file_replacement(
47        &mut self,
48        placeholder: &str,
49        image_path: Option<&str>,
50    ) -> Result<(), DocxError> {
51        match image_path {
52            None => {
53                // 插入图片到属性中
54                self.image_replacements
55                    .insert(placeholder.to_string(), None);
56            }
57            Some(data) => {
58                // 插入图片到属性中
59                self.image_replacements
60                    .insert(placeholder.to_string(), Some(DocxImage::new(data)?));
61            }
62        }
63
64        Ok(())
65    }
66
67    /// 添加待替换的图片  
68    /// @param placeholder 替换的字符串  
69    /// @param image_path 图片路径  
70    /// @param width 图片的宽度(厘米)  
71    /// @param height 图片的高度(厘米)  
72    pub fn add_image_file_size_replacement(
73        &mut self,
74        placeholder: &str,
75        image_path: Option<&str>,
76        width: f32,
77        height: f32,
78    ) -> Result<(), DocxError> {
79        match image_path {
80            None => {
81                // 插入图片到属性中
82                self.image_replacements
83                    .insert(placeholder.to_string(), None);
84            }
85            Some(file_path) => {
86                // 将厘米单位换算成emu
87                let width_emu = (width * DOCX_EMU) as u64;
88                let height_emu = (height * DOCX_EMU) as u64;
89                // 插入图片到属性中
90                self.image_replacements.insert(
91                    placeholder.to_string(),
92                    Some(DocxImage::new_size(file_path, width_emu, height_emu)?),
93                );
94            }
95        }
96
97        Ok(())
98    }
99
100    /// 添加待替换的图片,替换的图片大小默认6.09*5.9厘米  
101    /// @param placeholder 替换的字符串  
102    /// @param image_url 图片路径  
103    pub async fn add_image_url_replacement(
104        &mut self,
105        placeholder: &str,
106        image_url: Option<&str>,
107    ) -> Result<(), DocxError> {
108        match image_url {
109            None => {
110                // 插入图片到属性中
111                self.image_replacements
112                    .insert(placeholder.to_string(), None);
113            }
114            Some(url) => {
115                // 发送请求
116                let response = self.client.get(url).send().await?;
117                // 检查状态码
118                if response.status().is_success() {
119                    // 读取字节
120                    let image_data = response.bytes().await?.to_vec();
121                    // 插入图片到属性中
122                    self.image_replacements.insert(
123                        placeholder.to_string(),
124                        Some(DocxImage::new_image_data(url, image_data)?),
125                    );
126                }
127            }
128        }
129
130        Ok(())
131    }
132
133    /// 添加待替换的图片  
134    /// @param placeholder 替换的字符串  
135    /// @param image_url 图片路径  
136    /// @param width 图片的宽度(厘米)  
137    /// @param height 图片的高度(厘米)  
138    pub async fn add_image_url_size_replacement(
139        &mut self,
140        placeholder: &str,
141        image_url: Option<&str>,
142        width: f32,
143        height: f32,
144    ) -> Result<(), DocxError> {
145        match image_url {
146            None => {
147                // 插入图片到属性中
148                self.image_replacements
149                    .insert(placeholder.to_string(), None);
150            }
151            Some(url) => {
152                // 发送请求
153                let response = self.client.get(url).send().await?;
154                // 检查状态码
155                if response.status().is_success() {
156                    // 读取字节
157                    let image_data = response.bytes().await?.to_vec();
158                    // 将厘米单位换算成emu
159                    let width_emu = (width * DOCX_EMU) as u64;
160                    let height_emu = (height * DOCX_EMU) as u64;
161                    // 插入图片到属性中
162                    self.image_replacements.insert(
163                        placeholder.to_string(),
164                        Some(DocxImage::new_image_data_size(
165                            url, image_data, width_emu, height_emu,
166                        )?),
167                    );
168                }
169            }
170        }
171
172        Ok(())
173    }
174
175    /// 处理模板  
176    /// @param template_path 模板路径  
177    /// @param output_path 输出路径  
178    pub fn process_template(
179        &self,
180        template_path: &str,
181        output_path: &str,
182    ) -> Result<(), DocxError> {
183        // 1. 打开模板文件
184        let template_file = File::open(template_path)?;
185        let mut archive = ZipArchive::new(template_file)?;
186
187        // 2. 创建输出文件
188        let output_file = File::create(output_path)?;
189        let mut zip_writer = ZipWriter::new(output_file);
190
191        // 3. 遍历ZIP中的文件
192        for i in 0..archive.len() {
193            let mut file = archive.by_index(i)?;
194            // 文件内容
195            let mut contents = Vec::new();
196            // 读取文件内容到数组中
197            file.read_to_end(&mut contents)?;
198            // 匹配文件类型
199            match file.name() {
200                "word/document.xml" => {
201                    // 处理文档主内容,替换模板内容
202                    contents = self.process_document_xml(&contents)?;
203                }
204                "word/_rels/document.xml.rels" => {
205                    // 处理关系文件
206                    contents = self.process_rels_xml(&contents)?;
207                }
208                &_ => {}
209            }
210
211            // 写入新文件
212            let option = SimpleFileOptions::default()
213                .compression_method(file.compression())
214                .unix_permissions(file.unix_mode().unwrap_or(0o644));
215            // 写入内容
216            zip_writer.start_file(file.name(), option)?;
217            zip_writer.write_all(&contents)?;
218        }
219
220        // 4. 添加新的图片文件
221        for (_, replacement) in &self.image_replacements {
222            if let Some(replacement) = replacement {
223                let image_path = format!(
224                    "word/media/image_{}.{}",
225                    replacement.relation_id,
226                    DocxTemplate::get_extension(&replacement.image_path)?
227                );
228                // 写入图片到word压缩文件中
229                zip_writer.start_file(&image_path, SimpleFileOptions::default())?;
230                zip_writer.write_all(&replacement.image_data)?;
231            }
232        }
233        // 将内容写入压缩文件(docx)
234        zip_writer.finish()?;
235        Ok(())
236    }
237
238    fn process_element(&self, _element: &mut BytesStart) -> Result<(), DocxError> {
239        // println!("{:?}", String::from_utf8_lossy(element.name().as_ref()));
240        Ok(())
241    }
242
243    /// 处理文件内容  
244    /// @param contents 文件内容数组  
245    fn process_document_xml(&self, contents: &[u8]) -> Result<Vec<u8>, DocxError> {
246        // 创建xml写对象
247        let mut xml_writer = Writer::new(Cursor::new(Vec::new()));
248        // 写入xml文件头
249        // xml_writer.write_event(Event::Decl(BytesDecl::new("1.0", Some("UTF-8"), Some("yes"))))?;
250        // 读取xml文件的内容
251        let mut reader = quick_xml::Reader::from_reader(&contents[..]);
252        reader.config_mut().trim_text(true);
253        // 缓存数组
254        let mut buf = Vec::new();
255        // 图片对应的字符串占位符
256        let mut current_placeholder = String::new();
257        // 循环读取xml数据
258        loop {
259            // 读取数据
260            match reader.read_event_into(&mut buf)? {
261                Event::Start(e) => {
262                    let mut element = e.to_owned();
263                    self.process_element(&mut element)?;
264                    if e.name().as_ref() == b"w:p" {
265                        current_placeholder.clear();
266                    }
267                    xml_writer.write_event(Event::Start(element))?;
268                }
269                Event::Text(e) => {
270                    // 读取标签的内容
271                    let mut text = e.unescape()?.into_owned();
272                    // 替换文本占位符操作
273                    self.process_text(&mut text);
274                    // 判断图片占位符是否包含在内容
275                    if self.image_replacements.contains_key(&text) {
276                        current_placeholder.push_str(&text);
277                    } else {
278                        xml_writer.write_event(Event::Text(BytesText::new(text.as_str())))?;
279                    }
280                }
281                Event::End(e) => {
282                    // 判断标签是w:p,并且判断当前待替换的图片字符串是否为空
283                    if e.name().as_ref() == b"w:p" && !current_placeholder.is_empty() {
284                        if let Some(Some(docx_image)) =
285                            self.image_replacements.get(&current_placeholder)
286                        {
287                            // 替换占位符为图片
288                            DocxTemplate::create_drawing_element(
289                                &mut xml_writer,
290                                &docx_image.relation_id,
291                                docx_image.width,
292                                docx_image.height,
293                            )?;
294                        } else {
295                            // 保留原始占位符文本
296                            xml_writer.write_event(Event::Text(BytesText::from_escaped(
297                                // current_placeholder.as_str(),
298                                "",
299                            )))?;
300                        }
301                        current_placeholder.clear();
302                    }
303                    xml_writer.write_event(Event::End(e))?;
304                }
305                Event::Eof => break,
306                e => {
307                    // 写入原有信息
308                    xml_writer.write_event(e)?
309                }
310            }
311            buf.clear();
312        }
313        // 返回文件数组
314        Ok(xml_writer.into_inner().into_inner())
315    }
316
317    fn process_rels_xml(&self, xml_data: &[u8]) -> Result<Vec<u8>, DocxError> {
318        // 创建xml写对象
319        let mut writer = Writer::new(Cursor::new(Vec::new()));
320        // 写入xml标签头
321        writer.write_event(Event::Decl(BytesDecl::new(
322            "1.0",
323            Some("UTF-8"),
324            Some("yes"),
325        )))?;
326
327        // 写入XML根元素
328        writer.write_event(Event::Start(
329            BytesStart::new("Relationships").with_attributes([(
330                "xmlns",
331                "http://schemas.openxmlformats.org/package/2006/relationships",
332            )]),
333        ))?;
334
335        // 读取原始数据
336        let mut reader = quick_xml::Reader::from_reader(xml_data);
337        reader.config_mut().trim_text(true);
338        let mut buf = Vec::new();
339
340        loop {
341            // 读取关系文件
342            match reader.read_event_into(&mut buf)? {
343                // 判断关系文件内容是否为关联标签
344                Event::Empty(e) if e.name().as_ref() == b"Relationship" => {
345                    // 写入关系标签内容
346                    writer.write_event(Event::Empty(e))?;
347                }
348                // 文件读取完毕
349                Event::Eof => break,
350                _ => {}
351            }
352            // 清理内容
353            buf.clear();
354        }
355
356        // 添加新的图片关系
357        for (_, value) in &self.image_replacements {
358            if let Some(docx_image) = value {
359                // 获取图片扩展名
360                let extension = DocxTemplate::get_extension(&docx_image.image_path)?;
361                // 创建图片路径
362                let image_path = format!("media/image_{}.{}", docx_image.relation_id, extension);
363                // 创建图片关系标签
364                let relationship = BytesStart::new("Relationship").with_attributes([
365                    ("Id", docx_image.relation_id.as_str()),
366                    (
367                        "Type",
368                        "http://schemas.openxmlformats.org/officeDocument/2006/relationships/image",
369                    ),
370                    ("Target", &image_path),
371                ]);
372                // 写入关系标签数据
373                writer.write_event(Event::Empty(relationship))?;
374            }
375        }
376
377        // 结束根元素
378        writer.write_event(Event::End(BytesEnd::new("Relationships")))?;
379        // 输出关系文件内容
380        Ok(writer.into_inner().into_inner())
381    }
382
383    fn get_extension(image_path: &str) -> Result<&str, DocxError> {
384        Path::new(image_path)
385            .extension()
386            .and_then(|s| s.to_str())
387            .ok_or_else(|| {
388                DocxError::ImageNotFound("Could not determine image extension".to_string())
389            })
390    }
391    // 替换模板属性
392    fn process_text(&self, text: &mut String) {
393        for (placeholder, value) in &self.text_replacements {
394            *text = text.replace(placeholder, value);
395        }
396    }
397
398    fn create_drawing_element<T>(
399        writer: &mut Writer<T>,
400        relation_id: &str,
401        width: u64,
402        height: u64,
403    ) -> Result<(), DocxError>
404    where
405        T: Write,
406    {
407        let drawing = format!(
408            r#"
409        <w:drawing>
410            <wp:inline distT="0" distB="0" distL="0" distR="0">
411                <wp:extent cx="{}" cy="{}"/>
412                <wp:docPr id="1" name="Picture 1" descr="Generated image"/>
413                <wp:cNvGraphicFramePr>
414                    <a:graphicFrameLocks xmlns:a="http://schemas.openxmlformats.org/drawingml/2006/main" noChangeAspect="1"/>
415                </wp:cNvGraphicFramePr>
416                <a:graphic xmlns:a="http://schemas.openxmlformats.org/drawingml/2006/main">
417                    <a:graphicData uri="http://schemas.openxmlformats.org/drawingml/2006/picture">
418                        <pic:pic xmlns:pic="http://schemas.openxmlformats.org/drawingml/2006/picture">
419                            <pic:nvPicPr>
420                                <pic:cNvPr id="0" name="Picture 1" descr="Generated image"/>
421                                <pic:cNvPicPr><a:picLocks noChangeAspect="1"/></pic:cNvPicPr>
422                            </pic:nvPicPr>
423                            <pic:blipFill>
424                                <a:blip r:embed="{}"/>
425                                <a:stretch>
426                                    <a:fillRect/>
427                                </a:stretch>
428                            </pic:blipFill>
429                            <pic:spPr>
430                                <a:xfrm>
431                                    <a:off x="0" y="0"/>
432                                    <a:ext cx="{}" cy="{}"/>
433                                </a:xfrm>
434                                <a:prstGeom prst="rect">
435                                    <a:avLst/>
436                                </a:prstGeom>
437                            </pic:spPr>
438                        </pic:pic>
439                    </a:graphicData>
440                </a:graphic>
441            </wp:inline>
442        </w:drawing>
443    "#,
444            width, height, relation_id, width, height,
445        );
446
447        let mut reader = quick_xml::Reader::from_str(&drawing);
448        reader.config_mut().trim_text(true);
449        let mut buf = Vec::new();
450
451        loop {
452            match reader.read_event_into(&mut buf)? {
453                Event::Eof => break,
454                e => {
455                    writer.write_event(e)?;
456                }
457            }
458        }
459        Ok(())
460    }
461}