obs_sdk/
lib.rs

1//! # 使用说明
2//! 
3//! ## 1. 列举桶内对象列表
4//! 
5//! ```rust
6//! use obs_sdk::ObsClient;
7//! 
8//! static ENDPOINT: &str = "obs.cn-north-4.myhuaweicloud.com";
9//! static AK: &str = "YOUR_AK";
10//! static SK: &str = "YOUR_SK";
11//! static BUCKET_NAME: &str = "bucket_name";
12//! 
13//! #[tokio::test]
14//! async fn test_list_prefix() -> Result<(), Box<dyn std::error::Error>> {
15//!     let client = ObsClient {
16//!         endpoint: ENDPOINT.to_string(),
17//!         ak: AK.to_string(),
18//!         sk: SK.to_string(),
19//!         bucket: BUCKET_NAME.to_string(),
20//!     };
21//!     let res = client.list("tmp").await?;
22//!     println!("{:?}", res);
23//!     Ok(())
24//! }
25//! ```
26//! 
27//! ## 2. 上传对象到桶
28//! 
29//! ```rust
30//! use obs_sdk::ObsClient;
31//! 
32//! static ENDPOINT: &str = "obs.cn-north-4.myhuaweicloud.com";
33//! static AK: &str = "YOUR_AK";
34//! static SK: &str = "YOUR_SK";
35//! static BUCKET_NAME: &str = "bucket_name";
36//! 
37//! #[tokio::test]
38//! async fn test_upload_object() -> Result<(), Box<dyn std::error::Error>> {
39//!     let client = ObsClient {
40//!         endpoint: ENDPOINT.to_string(),
41//!         ak: AK.to_string(),
42//!         sk: SK.to_string(),
43//!         bucket: BUCKET_NAME.to_string(),
44//!     };
45//!     let res = client.upload_file("tmp_cargo.txt", "Cargo.txt").await?;
46//!     println!("{:?}", res);
47//!     Ok(())
48//! }
49//! ```
50//! 
51//! ## 3. 下载对象到本地目录
52//! 
53//! ```rust
54//! use obs_sdk::ObsClient;
55//! 
56//! static ENDPOINT: &str = "obs.cn-north-4.myhuaweicloud.com";
57//! static AK: &str = "YOUR_AK";
58//! static SK: &str = "YOUR_SK";
59//! static BUCKET_NAME: &str = "bucket_name";
60//! 
61//! #[tokio::test]
62//! async fn test_download_file02() -> Result<(), Box<dyn std::error::Error>> {
63//!     let client = ObsClient {
64//!         endpoint: ENDPOINT.to_string(),
65//!         ak: AK.to_string(),
66//!         sk: SK.to_string(),
67//!         bucket: BUCKET_NAME.to_string(),
68//!     };
69//!     let res = client.download_file("2hls_stutter-10.mp4", "video/2hls_stutter-10.mp4", false).await;
70//!     res
71//! }
72//! ```
73//! 
74//! ## 4. 下载对象为字节内容
75//! 
76//! ```rust
//! use obs_sdk::ObsClient;
//! use std::fs;
//! use std::path::Path;
78//! 
79//! static ENDPOINT: &str = "obs.cn-north-4.myhuaweicloud.com";
80//! static AK: &str = "YOUR_AK";
81//! static SK: &str = "YOUR_SK";
82//! static BUCKET_NAME: &str = "bucket_name";
83//! 
84//! #[tokio::test]
85//! async fn test_download_file01() -> Result<(), Box<dyn std::error::Error>> {
86//!     let client = ObsClient {
87//!         endpoint: ENDPOINT.to_string(),
88//!         ak: AK.to_string(),
89//!         sk: SK.to_string(),
90//!         bucket: BUCKET_NAME.to_string(),
91//!     };
92//!     let data = client.download_object("2hls_stutter-10.mp4").await?;
93//!     let file_path = Path::new("output.mp4");
94//!     match fs::write(file_path, data) {
95//!         Ok(_) => println!("文件保存成功{:?}", file_path),
96//!         Err(e) => eprintln!("文件保存失败:{}", e)
97//!     }
98//!     Ok(())
99//! }
100//! ```
101//! 
102//! ## 5. url鉴权
103//! 
104//! ```rust
105//! use obs_sdk::ObsClient;
106//!
107//! static ENDPOINT: &str = "obs.cn-north-4.myhuaweicloud.com";
108//! static AK: &str = "YOUR_AK";
109//! static SK: &str = "YOUR_SK";
110//! static BUCKET_NAME: &str = "bucket_name";
111//! 
112//! #[test]
113//! fn test_url_sign() -> Result<(), Box<dyn std::error::Error>> {
114//!     let client = ObsClient {
115//!         endpoint: ENDPOINT.to_string(),
116//!         ak: AK.to_string(),
117//!         sk: SK.to_string(),
118//!         bucket: BUCKET_NAME.to_string(),
119//!     };
120//!     let sign_url = client.url_sign("https://ranfs.obs.cn-north-4.myhuaweicloud.com/tmp_cargo.txt")?;
121//!     println!("sign_url = {}", sign_url);
122//!     Ok(())
123//! }
124//! ```
125//! 
126mod utils;
127mod algorithm;
128
129use algorithm::HmacSha1;
130use std::fs;
131use std::path::Path;
132use std::io::{Error, ErrorKind};
133use serde::{Serialize, Deserialize};
134use regex::Regex;
135use std::vec::Vec;
136use url::{Url, form_urlencoded};
137use chrono::Local;
138use reqwest::StatusCode;
139use urlencoding::encode;
140
/// Client for Huawei Cloud OBS (Object Storage Service).
///
/// Holds the endpoint, credentials and bucket name that the request methods
/// of this type read when they build URLs and signatures.
pub struct ObsClient {
    /// OBS endpoint host, e.g. `obs.cn-north-4.myhuaweicloud.com`; request
    /// URLs are built as `https://{bucket}.{endpoint}/...`.
    pub endpoint: String,
    /// Access key; written into the `Authorization` header and into signed URLs.
    pub ak: String,
    /// Secret key; passed to `sign_to_base64string` as the signing key.
    pub sk: String,
    /// Name of the bucket that requests are addressed to.
    pub bucket: String,
}
149
150impl ObsClient {
151
152    /// 列举指定前缀开头的所有对象元数据,方法内部会构造http请求:
153    /// ```plain
154    /// GET / HTTP/1.1
155    /// Host: bucketname.obs.cn-north-4.myhuaweicloud.com
156    /// Date: date
157    /// Authorization: authorization
158    /// ```
159    /// 
160    pub async fn list(&self, prefix: &str) -> Result<Vec<ObjectMeta>, Box<dyn std::error::Error>> {
161        // 构造完整的url地址
162        let url = format!("https://{}.{}/?prefix={}", self.bucket, self.endpoint, prefix);
163
164        //  获取GMT格式的时间字符串
165        let date = utils::now_str_gmt();
166
167        // 创建HmacSha1对象
168        let hmacsha1 = HmacSha1();
169
170        // 构造签名用的原始字符串
171        let string_to_sign = hmacsha1.header_string_to_sign("GET", "", "", &date, "",  &format!("/{}/", self.bucket));
172
173        // 根据原始字符串+ak,获取header签名
174        let signature = hmacsha1.sign_to_base64string(&string_to_sign, &self.sk);
175
176        // 构造请求头Authorization的值
177        let authorization = format!("OBS {}:{}", self.ak, signature);
178        // 构造http请求
179        let client = reqwest::Client::new();
180        let res = client.get(url)
181            .header("Date", &date)
182            .header("Authorization", &authorization)
183            .send()
184            .await?;
185
186        // 如果请求成功,则返回字节内容
187        if res.status().is_success() {
188            let xml_content_string = res.text().await?;
189            let results = XmlParser::new(&xml_content_string).parse();
190            return Ok(results);
191        }
192
193        Err(Box::new(Error::new(ErrorKind::Other, format!("请求失败,状态码={}", res.status()))))
194    }
195
196    /// 上传对象
197    /// 
198    /// 方法内部构建请求
199    /// ```plain
200    /// PUT /object01 HTTP/1.1
201    /// User-Agent: curl/7.29.0
202    /// Host: examplebucket.obs.cn-north-4.myhuaweicloud.com
203    /// Accept: */*
204    /// Date: WED, 01 Jul 2015 04:11:15 GMT
205    /// Authorization: OBS H4IPJX0TQTHTHEBQQCEC:gYqplLq30dEX7GMi2qFWyjdFsyw=
206    /// Content-Length: 10240
207    /// Expect: 100-continue
208    /// 
209    /// [1024 Byte data content]
210    /// ```
211    /// 
212    pub async fn upload_object(&self, obj_key: &str, data: Vec<u8>) -> Result<(), Box<dyn std::error::Error>> {
213        let obj_key = &Self::urlencode(obj_key);
214        // 构造完整的url地址
215        let url = format!("https://{}.{}/{}", self.bucket, self.endpoint, obj_key);
216
217        let md5_string = utils::base64_md5_str(&data);
218
219        //  获取GMT格式的时间字符串
220        let date = utils::now_str_gmt();
221
222        // 创建HmacSha1对象
223        let hmacsha1 = HmacSha1();
224
225        let file_type = &utils::get_mime_type_from_extension(obj_key)
226            .expect("资源对应类型暂不支持上传,请在方法get_mime_type_from_extension中添加文件类型");
227
228        // 构造签名用的原始字符串
229        let string_to_sign = hmacsha1.header_string_to_sign("PUT", &md5_string, file_type, &date, "",  &format!("/{}/{}", self.bucket, obj_key));
230
231        // 根据原始字符串+ak,获取header签名
232        let signature = hmacsha1.sign_to_base64string(&string_to_sign, &self.sk);
233
234        // 构造请求头Authorization的值
235        let authorization = format!("OBS {}:{}", self.ak, signature);
236
237        // 构造http请求
238        let client = reqwest::Client::new();
239        let res = client.put(url)
240            .header("Content-MD5", &md5_string)
241            .header("Date", &date)
242            .header("Content-Type", file_type)
243            .header("Content-Length", data.len())
244            .header("Authorization", authorization)
245            .body(data)
246            .send()
247            .await;
248
249        let res = match res {
250            Ok(response) => response,
251            Err(e) => {
252                return Err(Box::new(std::io::Error::new(std::io::ErrorKind::Other, e)));
253            },
254        };
255        let _status: StatusCode = res.status();
256
257        Ok(())
258
259    }
260
261    /// 上传文件
262    pub async fn upload_file(&self, obj_key: &str, file_path: &str) -> Result<(), Box<dyn std::error::Error>> {
263        let data = fs::read(file_path)?;
264        self.upload_object(obj_key, data).await
265    }
266
267    /// 下载对象,方法内部会构造http请求:
268    /// ```plain
269    /// GET /{obj_key} HTTP/1.1
270    /// Host: {bucket}.obs.cn-north-4.myhuaweicloud.com
271    /// Date: {date}
272    /// ```
273    /// 
274    pub async fn download_object(&self, obj_key: &str) -> Result<Vec<u8>, Box<dyn std::error::Error>> {
275        let obj_key = &Self::urlencode(obj_key);
276        // 构造完整的url地址
277        let url = format!("https://{}.{}/{}", self.bucket, self.endpoint, obj_key);
278
279        //  获取GMT格式的时间字符串
280        let date = utils::now_str_gmt();
281
282        // 创建HmacSha1对象
283        let hmacsha1 = HmacSha1();
284
285        // 构造签名用的原始字符串
286        let string_to_sign = hmacsha1.header_string_to_sign("GET", "", "", &date, "",  &format!("/{}/{}", self.bucket, obj_key));
287
288        // 根据原始字符串+ak,获取header签名
289        let signature = hmacsha1.sign_to_base64string(&string_to_sign, &self.sk);
290
291        // 构造请求头Authorization的值
292        let authorization = format!("OBS {}:{}", self.ak, signature);
293
294        // 构造http请求
295        let client = reqwest::Client::new();
296        let res = client.get(url)
297            .header("Authorization", &authorization)
298            .header("Date", &date)
299            .send()
300            .await?;
301
302        // 如果请求成功,则返回字节内容
303        if res.status().is_success() {
304            return Ok(res.bytes().await?.to_vec());
305        }
306        
307        Err(Box::new(Error::new(ErrorKind::Other, format!("请求失败,状态码={}", res.status()))))
308    }
309
310    /// 删除obs上的对象
311    pub async fn delete_object(&self, obj_key: &str) -> Result<(), Box<dyn std::error::Error>> {
312        // 构造完整的url地址
313        let url = format!("https://{}.{}/{}", self.bucket, self.endpoint, obj_key);
314
315        let md5_string = "";
316
317        //  获取GMT格式的时间字符串
318        let date = utils::now_str_gmt();
319
320        // 创建HmacSha1对象
321        let hmacsha1 = HmacSha1();
322
323        // 构造签名用的原始字符串
324        let string_to_sign = hmacsha1.header_string_to_sign("DELETE", &md5_string, "", &date, "",  &format!("/{}/{}", self.bucket, obj_key));
325
326        // 根据原始字符串+ak,获取header签名
327        let signature = hmacsha1.sign_to_base64string(&string_to_sign, &self.sk);
328
329        // 构造请求头Authorization的值
330        let authorization = format!("OBS {}:{}", self.ak, signature);
331
332        // 构造http请求
333        let client = reqwest::Client::new();
334        let res = client.delete(url)
335            .header("Date", &date)
336            .header("Authorization", authorization)
337            .send()
338            .await;
339
340        let res = match res {
341            Ok(response) => response,
342            Err(e) => {
343                return Err(Box::new(std::io::Error::new(std::io::ErrorKind::Other, e)));
344            },
345        };
346        let status = res.status();
347        println!("status = {}, {}", status, res.text_with_charset("utf-8").await?);
348
349        Ok(())
350    }
351
352    /// 下载文件,并指定本地保存用的文件路径
353    /// 
354    /// # 参数
355    /// 
356    /// `overwrite` - 是否覆盖,true,当文件存在时,覆盖文件,false,当文件存在时,不覆盖文件
357    /// 
358    pub async fn download_file(&self, obj_key: &str, file_path: &str, overwrite: bool) -> Result<(), Box<dyn std::error::Error>> {
359        let file_path = Path::new(file_path);
360
361        // 判断文件是否存在,如果存在,不做任何操作
362        if file_path.exists() && !overwrite {
363            return Err(Box::new(Error::new(ErrorKind::AlreadyExists, "文件已存在,请删除文件或设置覆盖参数")));
364        }
365
366        // 根据父目录是否存在,选择性创建父目录
367        let parent = file_path.parent().unwrap();
368        if !parent.exists() {
369            fs::create_dir_all(&parent)?;
370        }
371
372        // 下载文件,得到原始文件字节内容
373        let data = self.download_object(obj_key).await?;
374        
375        // 保存文件
376        fs::write(file_path, data)?;
377        Ok(())
378    }
379
380    pub fn url_sign(&self, url_str: &str) -> Result<String, Box<dyn std::error::Error>> {
381        let obs_object_url = Url::parse(url_str)?;
382        let resource_part = obs_object_url.path();
383        let host = obs_object_url.host().unwrap();
384        let domain = match host {
385            url::Host::Domain(domain) => domain.to_string(),
386            _ => format!("{}.{}", self.bucket, self.endpoint)
387        };
388        let parts: Vec<&str> = domain.split(".").collect();
389        let bucket_name = parts[0];
390
391        let timestamp = utils::timestamp(Local::now(), 3600*2);
392
393        //  获取GMT格式的时间字符串
394        let expires = format!("{}", timestamp);
395
396        // 创建HmacSha1对象
397        let hmacsha1 = HmacSha1();
398
399        // 构造签名用的原始字符串
400        let string_to_sign = hmacsha1.url_string_to_sign("GET", "", "", &expires, "",  &format!("/{}{}", bucket_name, resource_part));
401
402        // 根据原始字符串+ak,获取header签名
403        let signature = hmacsha1.sign_to_base64string(&string_to_sign, &self.sk);
404        let signature = form_urlencoded::byte_serialize(signature.as_bytes()).collect::<String>();
405
406        // 构造url
407        let sign_url = format!("{}?AccessKeyId={}&Expires={}&Signature={}", url_str, self.ak, expires, signature);
408        Ok(sign_url)
409    }
410
411    fn urlencode(s: &str) -> String {
412        let tokens: Vec<String> = s.split("/").map(|token| {
413            encode(token).to_string()
414        }).collect();
415        tokens.join("/")
416    }
417
418}
419
420
/// Metadata of one OBS object.
///
/// One value is produced per `<Contents>` element of a bucket listing and
/// carries the object's key, modification time, entity tag, size and
/// storage class.
#[derive(Serialize, Deserialize, Debug)]
pub struct ObjectMeta {

    /// Object key (name); identifies the object inside the bucket.
    pub key: String,

    /// Time of the most recent modification of the object (UTC), kept as the
    /// text of the `<LastModified>` element.
    pub last_modified: String,

    /// Entity tag of the object, kept as the text of the `<ETag>` element;
    /// it can be compared to detect whether the content changed.
    ///
    /// NOTE(review): the sample listing in this file's tests shows a quoted
    /// hexadecimal MD5 string (quotes included), not a base64 value —
    /// confirm against the OBS API reference.
    pub etag: String,

    /// Size of the object in bytes.
    pub size: u64,

    /// Storage class of the object: STANDARD, WARM, COLD or DEEP_ARCHIVE.
    ///
    /// Storage classes differ in storage cost and access performance.
    pub storage_class: String,
}
452
/// Parser for the XML body returned by the OBS "list objects in bucket" call.
///
/// It only understands that one response shape and is not a general-purpose
/// XML parser.
struct XmlParser {
    /// The raw XML document to parse.
    xml: String,
}
459
460
461impl XmlParser {
462    fn new(xml: &str) -> Self {
463        XmlParser { xml: xml.to_string() }
464    }
465
466    /// 解析obs接口“列举桶内对象”的响应结果
467    /// 
468    /// 该内部采用正则表达式进行解析,因此依赖外部的regex库
469    fn parse(&self) -> Vec<ObjectMeta> {
470        let xml = &self.xml;
471
472        // 定义解析需要使用的正则表达式
473        let contents_re = Regex::new(r#"<Contents>(.*?)</Contents>"#).unwrap();
474        let key_regex = Regex::new(r#"<Key>(.*?)</Key>"#).unwrap();
475        let last_modified_regex = Regex::new(r#"<LastModified>(.*?)</LastModified>"#).unwrap();
476        let etag_regex = Regex::new(r#"<ETag>(.*?)</ETag>"#).unwrap();
477        let size_regex = Regex::new(r#"<Size>(.*?)</Size>"#).unwrap();
478        let storage_class_regex = Regex::new(r#"<StorageClass>(.*?)</StorageClass>"#).unwrap();
479
480
481        // 解析Contents标签内的数据
482        let mut contents_vec = Vec::new();
483        for captures in contents_re.captures_iter(xml) {
484            let inner_content = &captures[1];
485
486            let key = key_regex.captures(inner_content).map(|cap| cap[1].to_string()).unwrap_or_default();
487            let last_modified = last_modified_regex.captures(inner_content).map(|cap| cap[1].to_string()).unwrap_or_default();
488            let etag = etag_regex.captures(inner_content).map(|cap| cap[1].to_string()).unwrap_or_default();
489            let size = size_regex.captures(inner_content).and_then(|cap| cap[1].parse().ok()).unwrap_or(0);
490            let storage_class = storage_class_regex.captures(inner_content).map(|cap| cap[1].to_string()).unwrap_or_default();
491            let content = ObjectMeta {
492                key,
493                last_modified,
494                etag,
495                size,
496                storage_class,
497            };
498            contents_vec.push(content);
499        }
500
501        contents_vec
502    }
503}
504
505
#[cfg(test)]
mod tests {
    use super::*;
    use chrono::{Duration, Local};
    use std::time::{SystemTime, UNIX_EPOCH};

    /// Parses a captured "list objects" response and checks the extracted fields.
    #[test]
    fn test_parse_xml() {
        let xml = r#"<?xml version="1.0" encoding="UTF-8" standalone="yes"?><ListBucketResult xmlns="http://obs.myhwclouds.com/doc/2015-06-30/"><Name>obs-products</Name><Prefix>tmp</Prefix><Marker></Marker><MaxKeys>1000</MaxKeys><IsTruncated>false</IsTruncated><Contents><Key>tmp/</Key><LastModified>2024-12-03T12:01:48.020Z</LastModified><ETag>"d41d8cd98f00b204e9800998ecf8427e"</ETag><Size>0</Size><Owner><ID>74df55bf376f41d48959d2aa9deaaf38</ID></Owner><StorageClass>STANDARD</StorageClass></Contents><Contents><Key>tmp/index001.png</Key><LastModified>2025-08-20T07:42:59.813Z</LastModified><ETag>"de317c0b7b6e02b42ef2b9e29bb5906a"</ETag><Size>12082</Size><Owner><ID>74df55bf376f41d48959d2aa9deaaf38</ID></Owner><StorageClass>STANDARD</StorageClass></Contents><Contents><Key>tmp/index002.png</Key><LastModified>2025-08-20T07:52:10.204Z</LastModified><ETag>"de317c0b7b6e02b42ef2b9e29bb5906a"</ETag><Size>12082</Size><Owner><ID>74df55bf376f41d48959d2aa9deaaf38</ID></Owner><StorageClass>STANDARD</StorageClass></Contents></ListBucketResult>"#;
        let parser = XmlParser::new(xml);
        let contents = parser.parse();

        // One entry per <Contents> element, in document order.
        assert_eq!(contents.len(), 3);

        assert_eq!(contents[0].key, "tmp/");
        assert_eq!(contents[0].last_modified, "2024-12-03T12:01:48.020Z");
        assert_eq!(contents[0].size, 0);

        assert_eq!(contents[1].key, "tmp/index001.png");
        assert_eq!(contents[1].last_modified, "2025-08-20T07:42:59.813Z");
        // The surrounding quotes are part of the element text and are kept.
        assert_eq!(contents[1].etag, "\"de317c0b7b6e02b42ef2b9e29bb5906a\"");
        assert_eq!(contents[1].size, 12082);

        assert_eq!(contents[2].key, "tmp/index002.png");
        assert_eq!(contents[2].size, 12082);

        assert!(contents.iter().all(|meta| meta.storage_class == "STANDARD"));

        // The metadata must also be serializable.
        let json_data = serde_json::to_string_pretty(&contents).unwrap();
        println!("{}", json_data);
    }

    /// Checks that "now + 2 hours" converted to Unix seconds is exactly
    /// 7200 seconds after "now".
    #[test]
    fn test_timestamp() {
        let now = Local::now();
        let start_secs = now.timestamp();
        let two_hours = Duration::hours(2);
        let future_time = now + two_hours;

        let system_time: SystemTime = future_time.into();
        let duration = system_time.duration_since(UNIX_EPOCH).unwrap();
        let timestamp = duration.as_secs();
        println!("timestamp = {}", timestamp);

        assert_eq!(i64::try_from(timestamp).unwrap(), start_secs + 2 * 3600);
    }

}