google_cloud_storage/storage/write_object.rs
1// Copyright 2025 Google LLC
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7// https://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
15//! Contains the request builder for [write_object()] and related types.
16//!
17//! [write_object()]: crate::storage::client::Storage::write_object()
18
19use super::streaming_source::{Seek, StreamingSource};
20use super::*;
21use crate::model_ext::KeyAes256;
22use crate::storage::checksum::details::update as checksum_update;
23use crate::storage::checksum::details::{Checksum, Md5};
24use crate::storage::request_options::RequestOptions;
25
/// A request builder for object writes.
///
/// The builder is consumed by its setters, which return the updated builder
/// so calls can be chained before sending the request.
///
/// # Example: hello world
/// ```
/// use google_cloud_storage::client::Storage;
/// async fn sample(client: &Storage) -> anyhow::Result<()> {
///     let response = client
///         .write_object("projects/_/buckets/my-bucket", "hello", "Hello World!")
///         .send_unbuffered()
///         .await?;
///     println!("response details={response:?}");
///     Ok(())
/// }
/// ```
///
/// # Example: upload a file
/// ```
/// use google_cloud_storage::client::Storage;
/// async fn sample(client: &Storage) -> anyhow::Result<()> {
///     let payload = tokio::fs::File::open("my-data").await?;
///     let response = client
///         .write_object("projects/_/buckets/my-bucket", "my-object", payload)
///         .send_unbuffered()
///         .await?;
///     println!("response details={response:?}");
///     Ok(())
/// }
/// ```
///
/// # Example: create a new object from a custom data source
/// ```
/// use google_cloud_storage::{client::Storage, streaming_source::StreamingSource};
/// struct DataSource;
/// impl StreamingSource for DataSource {
///     type Error = std::io::Error;
///     async fn next(&mut self) -> Option<Result<bytes::Bytes, Self::Error>> {
///         # panic!();
///     }
/// }
///
/// async fn sample(client: &Storage) -> anyhow::Result<()> {
///     let response = client
///         .write_object("projects/_/buckets/my-bucket", "my-object", DataSource)
///         .send_buffered()
///         .await?;
///     println!("response details={response:?}");
///     Ok(())
/// }
/// ```
pub struct WriteObject<T, S = crate::storage::transport::Storage>
where
    S: crate::storage::stub::Storage + 'static,
{
    // Shared handle to the stub implementation used by this builder.
    stub: std::sync::Arc<S>,
    // The request under construction; the `set_*` methods write into it.
    pub(crate) request: crate::model_ext::WriteObjectRequest,
    // The data for the object, wrapped in `Payload`.
    // NOTE(review): presumably the upload source passed to `write_object()` — confirm.
    pub(crate) payload: Payload<T>,
    // Per-request options; the `with_*` methods write into it (retry policy,
    // backoff policy, retry throttler, idempotency, checksums, user agent, ...).
    pub(crate) options: RequestOptions,
}
84
85impl<T, S> WriteObject<T, S>
86where
87 S: crate::storage::stub::Storage + 'static,
88{
89 /// Set a [request precondition] on the object generation to match.
90 ///
91 /// With this precondition the request fails if the current object
92 /// generation matches the provided value. A common value is `0`, which
93 /// prevents writes from succeeding if the object already exists.
94 ///
95 /// # Example
96 /// ```
97 /// # use google_cloud_storage::client::Storage;
98 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
99 /// let response = client
100 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
101 /// .set_if_generation_match(0)
102 /// .send_buffered()
103 /// .await?;
104 /// println!("response details={response:?}");
105 /// # Ok(()) }
106 /// ```
107 ///
108 /// [request precondition]: https://cloud.google.com/storage/docs/request-preconditions
109 pub fn set_if_generation_match<V>(mut self, v: V) -> Self
110 where
111 V: Into<i64>,
112 {
113 self.request.spec.if_generation_match = Some(v.into());
114 self
115 }
116
117 /// Set a [request precondition] on the object generation to match.
118 ///
119 /// With this precondition the request fails if the current object
120 /// generation does not match the provided value.
121 ///
122 /// # Example
123 /// ```
124 /// # use google_cloud_storage::client::Storage;
125 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
126 /// let response = client
127 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
128 /// .set_if_generation_not_match(0)
129 /// .send_buffered()
130 /// .await?;
131 /// println!("response details={response:?}");
132 /// # Ok(()) }
133 /// ```
134 ///
135 /// [request precondition]: https://cloud.google.com/storage/docs/request-preconditions
136 pub fn set_if_generation_not_match<V>(mut self, v: V) -> Self
137 where
138 V: Into<i64>,
139 {
140 self.request.spec.if_generation_not_match = Some(v.into());
141 self
142 }
143
144 /// Set a [request precondition] on the object meta generation.
145 ///
146 /// With this precondition the request fails if the current object metadata
147 /// generation does not match the provided value. This may be useful to
148 /// prevent changes when the metageneration is known.
149 ///
150 /// # Example
151 /// ```
152 /// # use google_cloud_storage::client::Storage;
153 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
154 /// let response = client
155 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
156 /// .set_if_metageneration_match(1234)
157 /// .send_buffered()
158 /// .await?;
159 /// println!("response details={response:?}");
160 /// # Ok(()) }
161 /// ```
162 ///
163 /// [request precondition]: https://cloud.google.com/storage/docs/request-preconditions
164 pub fn set_if_metageneration_match<V>(mut self, v: V) -> Self
165 where
166 V: Into<i64>,
167 {
168 self.request.spec.if_metageneration_match = Some(v.into());
169 self
170 }
171
172 /// Set a [request precondition] on the object meta-generation.
173 ///
174 /// With this precondition the request fails if the current object metadata
175 /// generation matches the provided value. This is rarely useful in uploads,
176 /// it is more commonly used on reads to prevent a large response if the
177 /// data is already cached.
178 ///
179 /// # Example
180 /// ```
181 /// # use google_cloud_storage::client::Storage;
182 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
183 /// let response = client
184 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
185 /// .set_if_metageneration_not_match(1234)
186 /// .send_buffered()
187 /// .await?;
188 /// println!("response details={response:?}");
189 /// # Ok(()) }
190 /// ```
191 ///
192 /// [request precondition]: https://cloud.google.com/storage/docs/request-preconditions
193 pub fn set_if_metageneration_not_match<V>(mut self, v: V) -> Self
194 where
195 V: Into<i64>,
196 {
197 self.request.spec.if_metageneration_not_match = Some(v.into());
198 self
199 }
200
201 /// Sets the ACL for the new object.
202 ///
203 /// # Example
204 /// ```
205 /// # use google_cloud_storage::client::Storage;
206 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
207 /// # use google_cloud_storage::model::ObjectAccessControl;
208 /// let response = client
209 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
210 /// .set_acl([ObjectAccessControl::new().set_entity("allAuthenticatedUsers").set_role("READER")])
211 /// .send_buffered()
212 /// .await?;
213 /// println!("response details={response:?}");
214 /// # Ok(()) }
215 /// ```
216 pub fn set_acl<I, V>(mut self, v: I) -> Self
217 where
218 I: IntoIterator<Item = V>,
219 V: Into<crate::model::ObjectAccessControl>,
220 {
221 self.mut_resource().acl = v.into_iter().map(|a| a.into()).collect();
222 self
223 }
224
225 /// Sets the [cache control] for the new object.
226 ///
227 /// This can be used to control caching in [public objects].
228 ///
229 /// # Example
230 /// ```
231 /// # use google_cloud_storage::client::Storage;
232 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
233 /// let response = client
234 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
235 /// .set_cache_control("public; max-age=7200")
236 /// .send_buffered()
237 /// .await?;
238 /// println!("response details={response:?}");
239 /// # Ok(()) }
240 /// ```
241 ///
242 /// [public objects]: https://cloud.google.com/storage/docs/access-control/making-data-public
243 /// [cache control]: https://datatracker.ietf.org/doc/html/rfc7234#section-5.2
244 pub fn set_cache_control<V: Into<String>>(mut self, v: V) -> Self {
245 self.mut_resource().cache_control = v.into();
246 self
247 }
248
249 /// Sets the [content disposition] for the new object.
250 ///
251 /// Google Cloud Storage can serve content directly to web browsers. This
252 /// attribute sets the `Content-Disposition` header, which may change how
253 /// the browser displays the contents.
254 ///
255 /// # Example
256 /// ```
257 /// # use google_cloud_storage::client::Storage;
258 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
259 /// let response = client
260 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
261 /// .set_content_disposition("inline")
262 /// .send_buffered()
263 /// .await?;
264 /// println!("response details={response:?}");
265 /// # Ok(()) }
266 /// ```
267 ///
268 /// [content disposition]: https://datatracker.ietf.org/doc/html/rfc6266
269 pub fn set_content_disposition<V: Into<String>>(mut self, v: V) -> Self {
270 self.mut_resource().content_disposition = v.into();
271 self
272 }
273
274 /// Sets the [content encoding] for the object data.
275 ///
276 /// This can be used to upload compressed data and enable [transcoding] of
277 /// the data during reads.
278 ///
279 /// # Example
280 /// ```
281 /// # use google_cloud_storage::client::Storage;
282 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
283 /// use flate2::write::GzEncoder;
284 /// use std::io::Write;
285 /// let mut e = GzEncoder::new(Vec::new(), flate2::Compression::default());
286 /// e.write_all(b"hello world");
287 /// let response = client
288 /// .write_object("projects/_/buckets/my-bucket", "my-object", bytes::Bytes::from_owner(e.finish()?))
289 /// .set_content_encoding("gzip")
290 /// .send_buffered()
291 /// .await?;
292 /// println!("response details={response:?}");
293 /// # Ok(()) }
294 /// ```
295 ///
296 /// [transcoding]: https://cloud.google.com/storage/docs/transcoding
297 /// [content encoding]: https://datatracker.ietf.org/doc/html/rfc7231#section-3.1.2.2
298 pub fn set_content_encoding<V: Into<String>>(mut self, v: V) -> Self {
299 self.mut_resource().content_encoding = v.into();
300 self
301 }
302
303 /// Sets the [content language] for the new object.
304 ///
305 /// Google Cloud Storage can serve content directly to web browsers. This
306 /// attribute sets the `Content-Language` header, which may change how the
307 /// browser displays the contents.
308 ///
309 /// # Example
310 /// ```
311 /// # use google_cloud_storage::client::Storage;
312 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
313 /// let response = client
314 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
315 /// .set_content_language("en")
316 /// .send_buffered()
317 /// .await?;
318 /// println!("response details={response:?}");
319 /// # Ok(()) }
320 /// ```
321 ///
322 /// [content language]: https://cloud.google.com/storage/docs/metadata#content-language
323 pub fn set_content_language<V: Into<String>>(mut self, v: V) -> Self {
324 self.mut_resource().content_language = v.into();
325 self
326 }
327
328 /// Sets the [content type] for the new object.
329 ///
330 /// Google Cloud Storage can serve content directly to web browsers. This
331 /// attribute sets the `Content-Type` header, which may change how the
332 /// browser interprets the contents.
333 ///
334 /// # Example
335 /// ```
336 /// # use google_cloud_storage::client::Storage;
337 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
338 /// let response = client
339 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
340 /// .set_content_type("text/plain")
341 /// .send_buffered()
342 /// .await?;
343 /// println!("response details={response:?}");
344 /// # Ok(()) }
345 /// ```
346 ///
347 /// [content type]: https://datatracker.ietf.org/doc/html/rfc7231#section-3.1.1.5
348 pub fn set_content_type<V: Into<String>>(mut self, v: V) -> Self {
349 self.mut_resource().content_type = v.into();
350 self
351 }
352
353 /// Sets the [custom time] for the new object.
354 ///
355 /// This field is typically set in order to use the [DaysSinceCustomTime]
356 /// condition in Object Lifecycle Management.
357 ///
358 /// # Example
359 /// ```
360 /// # use google_cloud_storage::client::Storage;
361 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
362 /// let time = wkt::Timestamp::try_from("2025-07-07T18:30:00Z")?;
363 /// let response = client
364 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
365 /// .set_custom_time(time)
366 /// .send_buffered()
367 /// .await?;
368 /// println!("response details={response:?}");
369 /// # Ok(()) }
370 /// ```
371 ///
372 /// [DaysSinceCustomTime]: https://cloud.google.com/storage/docs/lifecycle#dayssincecustomtime
373 /// [custom time]: https://cloud.google.com/storage/docs/metadata#custom-time
374 pub fn set_custom_time<V: Into<wkt::Timestamp>>(mut self, v: V) -> Self {
375 self.mut_resource().custom_time = Some(v.into());
376 self
377 }
378
379 /// Sets the [event based hold] flag for the new object.
380 ///
381 /// This field is typically set in order to prevent objects from being
382 /// deleted or modified.
383 ///
384 /// # Example
385 /// ```
386 /// # use google_cloud_storage::client::Storage;
387 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
388 /// let response = client
389 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
390 /// .set_event_based_hold(true)
391 /// .send_buffered()
392 /// .await?;
393 /// println!("response details={response:?}");
394 /// # Ok(()) }
395 /// ```
396 ///
397 /// [event based hold]: https://cloud.google.com/storage/docs/object-holds
398 pub fn set_event_based_hold<V: Into<bool>>(mut self, v: V) -> Self {
399 self.mut_resource().event_based_hold = Some(v.into());
400 self
401 }
402
403 /// Sets the [custom metadata] for the new object.
404 ///
405 /// This field is typically set to annotate the object with
406 /// application-specific metadata.
407 ///
408 /// # Example
409 /// ```
410 /// # use google_cloud_storage::client::Storage;
411 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
412 /// let time = wkt::Timestamp::try_from("2025-07-07T18:30:00Z")?;
413 /// let response = client
414 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
415 /// .set_metadata([("test-only", "true"), ("environment", "qa")])
416 /// .send_buffered()
417 /// .await?;
418 /// println!("response details={response:?}");
419 /// # Ok(()) }
420 /// ```
421 ///
422 /// [custom metadata]: https://cloud.google.com/storage/docs/metadata#custom-metadata
423 pub fn set_metadata<I, K, V>(mut self, i: I) -> Self
424 where
425 I: IntoIterator<Item = (K, V)>,
426 K: Into<String>,
427 V: Into<String>,
428 {
429 self.mut_resource().metadata = i.into_iter().map(|(k, v)| (k.into(), v.into())).collect();
430 self
431 }
432
433 /// Sets the [retention configuration] for the new object.
434 ///
435 /// # Example
436 /// ```
437 /// # use google_cloud_storage::client::Storage;
438 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
439 /// # use google_cloud_storage::model::object::{Retention, retention};
440 /// let response = client
441 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
442 /// .set_retention(
443 /// Retention::new()
444 /// .set_mode(retention::Mode::Locked)
445 /// .set_retain_until_time(wkt::Timestamp::try_from("2035-01-01T00:00:00Z")?))
446 /// .send_buffered()
447 /// .await?;
448 /// println!("response details={response:?}");
449 /// # Ok(()) }
450 /// ```
451 ///
452 /// [retention configuration]: https://cloud.google.com/storage/docs/metadata#retention-config
453 pub fn set_retention<V>(mut self, v: V) -> Self
454 where
455 V: Into<crate::model::object::Retention>,
456 {
457 self.mut_resource().retention = Some(v.into());
458 self
459 }
460
461 /// Sets the [storage class] for the new object.
462 ///
463 /// # Example
464 /// ```
465 /// # use google_cloud_storage::client::Storage;
466 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
467 /// let response = client
468 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
469 /// .set_storage_class("ARCHIVE")
470 /// .send_buffered()
471 /// .await?;
472 /// println!("response details={response:?}");
473 /// # Ok(()) }
474 /// ```
475 ///
476 /// [storage class]: https://cloud.google.com/storage/docs/storage-classes
477 pub fn set_storage_class<V>(mut self, v: V) -> Self
478 where
479 V: Into<String>,
480 {
481 self.mut_resource().storage_class = v.into();
482 self
483 }
484
485 /// Sets the [temporary hold] flag for the new object.
486 ///
487 /// This field is typically set in order to prevent objects from being
488 /// deleted or modified.
489 ///
490 /// # Example
491 /// ```
492 /// # use google_cloud_storage::client::Storage;
493 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
494 /// let time = wkt::Timestamp::try_from("2025-07-07T18:30:00Z")?;
495 /// let response = client
496 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
497 /// .set_temporary_hold(true)
498 /// .send_buffered()
499 /// .await?;
500 /// println!("response details={response:?}");
501 /// # Ok(()) }
502 /// ```
503 ///
504 /// [temporary hold]: https://cloud.google.com/storage/docs/object-holds
505 pub fn set_temporary_hold<V: Into<bool>>(mut self, v: V) -> Self {
506 self.mut_resource().temporary_hold = v.into();
507 self
508 }
509
510 /// Sets the resource name of the [Customer-managed encryption key] for this
511 /// object.
512 ///
513 /// The service imposes a number of restrictions on the keys used to encrypt
514 /// Google Cloud Storage objects. Read the documentation in full before
515 /// trying to use customer-managed encryption keys. In particular, verify
516 /// the service has the necessary permissions, and the key is in a
517 /// compatible location.
518 ///
519 /// # Example
520 /// ```
521 /// # use google_cloud_storage::client::Storage;
522 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
523 /// let response = client
524 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
525 /// .set_kms_key("projects/test-project/locations/us-central1/keyRings/test-ring/cryptoKeys/test-key")
526 /// .send_buffered()
527 /// .await?;
528 /// println!("response details={response:?}");
529 /// # Ok(()) }
530 /// ```
531 ///
532 /// [Customer-managed encryption key]: https://cloud.google.com/storage/docs/encryption/customer-managed-keys
533 pub fn set_kms_key<V>(mut self, v: V) -> Self
534 where
535 V: Into<String>,
536 {
537 self.mut_resource().kms_key = v.into();
538 self
539 }
540
541 /// Configure this object to use one of the [predefined ACLs].
542 ///
543 /// # Example
544 /// ```
545 /// # use google_cloud_storage::client::Storage;
546 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
547 /// let response = client
548 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
549 /// .set_predefined_acl("private")
550 /// .send_buffered()
551 /// .await?;
552 /// println!("response details={response:?}");
553 /// # Ok(()) }
554 /// ```
555 ///
556 /// [predefined ACLs]: https://cloud.google.com/storage/docs/access-control/lists#predefined-acl
557 pub fn set_predefined_acl<V>(mut self, v: V) -> Self
558 where
559 V: Into<String>,
560 {
561 self.request.spec.predefined_acl = v.into();
562 self
563 }
564
565 /// The encryption key used with the Customer-Supplied Encryption Keys
566 /// feature. In raw bytes format (not base64-encoded).
567 ///
568 /// # Example
569 /// ```
570 /// # use google_cloud_storage::client::Storage;
571 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
572 /// # use google_cloud_storage::model_ext::KeyAes256;
573 /// let key: &[u8] = &[97; 32];
574 /// let response = client
575 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
576 /// .set_key(KeyAes256::new(key)?)
577 /// .send_buffered()
578 /// .await?;
579 /// println!("response details={response:?}");
580 /// # Ok(()) }
581 /// ```
582 pub fn set_key(mut self, v: KeyAes256) -> Self {
583 self.request.params = Some(v.into());
584 self
585 }
586
587 /// Sets the object custom contexts.
588 ///
589 /// # Example
590 /// ```
591 /// # use google_cloud_storage::client::Storage;
592 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
593 /// # use google_cloud_storage::model::{ObjectContexts, ObjectCustomContextPayload};
594 /// let response = client
595 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
596 /// .set_contexts(
597 /// ObjectContexts::new().set_custom([
598 /// ("example", ObjectCustomContextPayload::new().set_value("true")),
599 /// ])
600 /// )
601 /// .send_buffered()
602 /// .await?;
603 /// println!("response details={response:?}");
604 /// # Ok(()) }
605 /// ```
606 pub fn set_contexts<V>(mut self, v: V) -> Self
607 where
608 V: Into<crate::model::ObjectContexts>,
609 {
610 self.mut_resource().contexts = Some(v.into());
611 self
612 }
613
614 /// Configure the idempotency for this upload.
615 ///
616 /// By default, the client library treats single-shot uploads without
617 /// preconditions, as non-idempotent. If the destination bucket is
618 /// configured with [object versioning] then the operation may succeed
619 /// multiple times with observable side-effects. With object versioning and
620 /// a [lifecycle] policy limiting the number of versions, uploading the same
621 /// data multiple times may result in data loss.
622 ///
623 /// The client library cannot efficiently determine if these conditions
624 /// apply to your upload. If they do, or your application can tolerate
625 /// multiple versions of the same data for other reasons, consider using
626 /// `with_idempotency(true)`.
627 ///
628 /// The client library treats resumable uploads as idempotent, regardless of
629 /// the value in this option. Such uploads can succeed at most once.
630 ///
631 /// # Example
632 /// ```
633 /// # use google_cloud_storage::client::Storage;
634 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
635 /// use std::time::Duration;
636 /// use google_cloud_gax::retry_policy::RetryPolicyExt;
637 /// let response = client
638 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
639 /// .with_idempotency(true)
640 /// .send_buffered()
641 /// .await?;
642 /// println!("response details={response:?}");
643 /// # Ok(()) }
644 /// ```
645 ///
646 /// [lifecycle]: https://cloud.google.com/storage/docs/lifecycle
647 /// [object versioning]: https://cloud.google.com/storage/docs/object-versioning
648 pub fn with_idempotency(mut self, v: bool) -> Self {
649 self.options.idempotency = Some(v);
650 self
651 }
652
653 /// The retry policy used for this request.
654 ///
655 /// # Example
656 /// ```
657 /// # use google_cloud_storage::client::Storage;
658 /// # use google_cloud_storage::retry_policy::RetryableErrors;
659 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
660 /// use std::time::Duration;
661 /// use google_cloud_gax::retry_policy::RetryPolicyExt;
662 /// let response = client
663 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
664 /// .with_retry_policy(
665 /// RetryableErrors
666 /// .with_attempt_limit(5)
667 /// .with_time_limit(Duration::from_secs(90)),
668 /// )
669 /// .send_buffered()
670 /// .await?;
671 /// println!("response details={response:?}");
672 /// # Ok(()) }
673 /// ```
674 pub fn with_retry_policy<V: Into<google_cloud_gax::retry_policy::RetryPolicyArg>>(
675 mut self,
676 v: V,
677 ) -> Self {
678 self.options.retry_policy = v.into().into();
679 self
680 }
681
682 /// The backoff policy used for this request.
683 ///
684 /// # Example
685 /// ```
686 /// # use google_cloud_storage::client::Storage;
687 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
688 /// use std::time::Duration;
689 /// use google_cloud_gax::exponential_backoff::ExponentialBackoff;
690 /// let response = client
691 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
692 /// .with_backoff_policy(ExponentialBackoff::default())
693 /// .send_buffered()
694 /// .await?;
695 /// println!("response details={response:?}");
696 /// # Ok(()) }
697 /// ```
698 pub fn with_backoff_policy<V: Into<google_cloud_gax::backoff_policy::BackoffPolicyArg>>(
699 mut self,
700 v: V,
701 ) -> Self {
702 self.options.backoff_policy = v.into().into();
703 self
704 }
705
706 /// The retry throttler used for this request.
707 ///
708 /// Most of the time you want to use the same throttler for all the requests
709 /// in a client, and even the same throttler for many clients. Rarely it
710 /// may be necessary to use an custom throttler for some subset of the
711 /// requests.
712 ///
713 /// # Example
714 /// ```
715 /// # use google_cloud_storage::client::Storage;
716 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
717 /// let response = client
718 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
719 /// .with_retry_throttler(adhoc_throttler())
720 /// .send_buffered()
721 /// .await?;
722 /// println!("response details={response:?}");
723 /// fn adhoc_throttler() -> google_cloud_gax::retry_throttler::SharedRetryThrottler {
724 /// # panic!();
725 /// }
726 /// # Ok(()) }
727 /// ```
728 pub fn with_retry_throttler<V: Into<google_cloud_gax::retry_throttler::RetryThrottlerArg>>(
729 mut self,
730 v: V,
731 ) -> Self {
732 self.options.retry_throttler = v.into().into();
733 self
734 }
735
736 /// Sets the payload size threshold to switch from single-shot to resumable uploads.
737 ///
738 /// # Example
739 /// ```
740 /// # use google_cloud_storage::client::Storage;
741 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
742 /// let response = client
743 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
744 /// .with_resumable_upload_threshold(0_usize) // Forces a resumable upload.
745 /// .send_buffered()
746 /// .await?;
747 /// println!("response details={response:?}");
748 /// # Ok(()) }
749 /// ```
750 ///
751 /// The client library can perform uploads using [single-shot] or
752 /// [resumable] uploads. For small objects, single-shot uploads offer better
753 /// performance, as they require a single HTTP transfer. For larger objects,
754 /// the additional request latency is not significant, and resumable uploads
755 /// offer better recovery on errors.
756 ///
757 /// The library automatically selects resumable uploads when the payload is
758 /// equal to or larger than this option. For smaller uploads the client
759 /// library uses single-shot uploads.
760 ///
761 /// The exact threshold depends on where the application is deployed and
762 /// destination bucket location with respect to where the application is
763 /// running. The library defaults should work well in most cases, but some
764 /// applications may benefit from fine-tuning.
765 ///
766 /// [single-shot]: https://cloud.google.com/storage/docs/uploading-objects
767 /// [resumable]: https://cloud.google.com/storage/docs/resumable-uploads
768 pub fn with_resumable_upload_threshold<V: Into<usize>>(mut self, v: V) -> Self {
769 self.options.set_resumable_upload_threshold(v.into());
770 self
771 }
772
773 /// Changes the buffer size for some resumable uploads.
774 ///
775 /// # Example
776 /// ```
777 /// # use google_cloud_storage::client::Storage;
778 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
779 /// let response = client
780 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
781 /// .with_resumable_upload_buffer_size(32 * 1024 * 1024_usize)
782 /// .send_buffered()
783 /// .await?;
784 /// println!("response details={response:?}");
785 /// # Ok(()) }
786 /// ```
787 ///
788 /// When performing [resumable uploads] from sources without [Seek] the
789 /// client library needs to buffer data in memory until it is persisted by
790 /// the service. Otherwise the data would be lost if the upload fails.
791 /// Applications may want to tune this buffer size:
792 ///
793 /// - Use smaller buffer sizes to support more concurrent uploads in the
794 /// same application.
795 /// - Use larger buffer sizes for better throughput. Sending many small
796 /// buffers stalls the upload until the client receives a successful
797 /// response from the service.
798 ///
799 /// Keep in mind that there are diminishing returns on using larger buffers.
800 ///
801 /// [resumable uploads]: https://cloud.google.com/storage/docs/resumable-uploads
802 /// [Seek]: crate::streaming_source::Seek
803 pub fn with_resumable_upload_buffer_size<V: Into<usize>>(mut self, v: V) -> Self {
804 self.options.set_resumable_upload_buffer_size(v.into());
805 self
806 }
807
808 /// Sets the `User-Agent` header for this request.
809 ///
810 /// # Example
811 /// ```
812 /// # use google_cloud_storage::client::Storage;
813 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
814 /// let mut response = client
815 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
816 /// .with_user_agent("my-app/1.0.0")
817 /// .send_buffered()
818 /// .await?;
819 /// println!("response details={response:?}");
820 /// # Ok(()) }
821 /// ```
822 pub fn with_user_agent(mut self, user_agent: impl Into<String>) -> Self {
823 self.options.user_agent = Some(user_agent.into());
824 self
825 }
826
827 fn mut_resource(&mut self) -> &mut crate::model::Object {
828 self.request
829 .spec
830 .resource
831 .as_mut()
832 .expect("resource field initialized in `new()`")
833 }
834
835 fn set_crc32c<V: Into<u32>>(mut self, v: V) -> Self {
836 let checksum = self.mut_resource().checksums.get_or_insert_default();
837 checksum.crc32c = Some(v.into());
838 self
839 }
840
841 pub fn set_md5_hash<I, V>(mut self, i: I) -> Self
842 where
843 I: IntoIterator<Item = V>,
844 V: Into<u8>,
845 {
846 let checksum = self.mut_resource().checksums.get_or_insert_default();
847 checksum.md5_hash = i.into_iter().map(|v| v.into()).collect();
848 self
849 }
850
851 /// Provide a precomputed value for the CRC32C checksum.
852 ///
853 /// # Example
854 /// ```
855 /// # use google_cloud_storage::client::Storage;
856 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
857 /// use crc32c::crc32c;
858 /// let response = client
859 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
860 /// .with_known_crc32c(crc32c(b"hello world"))
861 /// .send_buffered()
862 /// .await?;
863 /// println!("response details={response:?}");
864 /// # Ok(()) }
865 /// ```
866 ///
867 /// In some applications, the payload's CRC32C checksum is already known.
868 /// For example, the application may be reading the data from another blob
869 /// storage system.
870 ///
871 /// In such cases, it is safer to pass the known CRC32C of the payload to
872 /// [Cloud Storage], and more efficient to skip the computation in the
873 /// client library.
874 ///
875 /// Note that once you provide a CRC32C value to this builder you cannot
876 /// use [compute_md5()] to also have the library compute the checksums.
877 ///
878 /// [compute_md5()]: WriteObject::compute_md5
879 pub fn with_known_crc32c<V: Into<u32>>(self, v: V) -> Self {
880 let mut this = self;
881 this.options.checksum.crc32c = None;
882 this.set_crc32c(v)
883 }
884
885 /// Provide a precomputed value for the MD5 hash.
886 ///
887 /// # Example
888 /// ```
889 /// # use google_cloud_storage::client::Storage;
890 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
891 /// use md5::compute;
892 /// let hash = md5::compute(b"hello world");
893 /// let response = client
894 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
895 /// .with_known_md5_hash(bytes::Bytes::from_owner(hash.0))
896 /// .send_buffered()
897 /// .await?;
898 /// println!("response details={response:?}");
899 /// # Ok(()) }
900 /// ```
901 ///
902 /// In some applications, the payload's MD5 hash is already known. For
903 /// example, the application may be reading the data from another blob
904 /// storage system.
905 ///
906 /// In such cases, it is safer to pass the known MD5 of the payload to
907 /// [Cloud Storage], and more efficient to skip the computation in the
908 /// client library.
909 ///
910 /// Note that once you provide a MD5 value to this builder you cannot
911 /// use [compute_md5()] to also have the library compute the checksums.
912 ///
913 /// [compute_md5()]: WriteObject::compute_md5
914 pub fn with_known_md5_hash<I, V>(self, i: I) -> Self
915 where
916 I: IntoIterator<Item = V>,
917 V: Into<u8>,
918 {
919 let mut this = self;
920 this.options.checksum.md5_hash = None;
921 this.set_md5_hash(i)
922 }
923
924 /// Enables computation of MD5 hashes.
925 ///
926 /// # Example
927 /// ```
928 /// # use google_cloud_storage::client::Storage;
929 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
930 /// let payload = tokio::fs::File::open("my-data").await?;
931 /// let response = client
932 /// .write_object("projects/_/buckets/my-bucket", "my-object", payload)
933 /// .compute_md5()
934 /// .send_buffered()
935 /// .await?;
936 /// println!("response details={response:?}");
937 /// # Ok(()) }
938 /// ```
939 ///
940 /// See [precompute_checksums][WriteObject::precompute_checksums] for more
941 /// details on how checksums are used by the client library and their
942 /// limitations.
943 pub fn compute_md5(self) -> Self {
944 let mut this = self;
945 this.options.checksum.md5_hash = Some(Md5::default());
946 this
947 }
948
949 pub(crate) fn new<B, O, P>(
950 stub: std::sync::Arc<S>,
951 bucket: B,
952 object: O,
953 payload: P,
954 options: RequestOptions,
955 ) -> Self
956 where
957 B: Into<String>,
958 O: Into<String>,
959 P: Into<Payload<T>>,
960 {
961 let resource = crate::model::Object::new()
962 .set_bucket(bucket)
963 .set_name(object);
964 WriteObject {
965 stub,
966 request: crate::model_ext::WriteObjectRequest {
967 spec: crate::model::WriteObjectSpec::new().set_resource(resource),
968 params: None,
969 },
970 payload: payload.into(),
971 options,
972 }
973 }
974}
975
976impl<T, S> WriteObject<T, S>
977where
978 T: StreamingSource + Seek + Send + Sync + 'static,
979 <T as StreamingSource>::Error: std::error::Error + Send + Sync + 'static,
980 <T as Seek>::Error: std::error::Error + Send + Sync + 'static,
981 S: crate::storage::stub::Storage + 'static,
982{
983 /// A simple upload from a buffer.
984 ///
985 /// # Example
986 /// ```
987 /// # use google_cloud_storage::client::Storage;
988 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
989 /// let response = client
990 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
991 /// .send_unbuffered()
992 /// .await?;
993 /// println!("response details={response:?}");
994 /// # Ok(()) }
995 /// ```
996 pub async fn send_unbuffered(self) -> Result<Object> {
997 self.stub
998 .write_object_unbuffered(self.payload, self.request, self.options)
999 .await
1000 }
1001
1002 /// Precompute the payload checksums before uploading the data.
1003 ///
1004 /// If the checksums are known when the upload starts, the client library
1005 /// can include the checksums with the upload request, and the service can
1006 /// reject the upload if the payload and the checksums do not match.
1007 ///
1008 /// # Example
1009 /// ```
1010 /// # use google_cloud_storage::client::Storage;
1011 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
1012 /// let payload = tokio::fs::File::open("my-data").await?;
1013 /// let response = client
1014 /// .write_object("projects/_/buckets/my-bucket", "my-object", payload)
1015 /// .precompute_checksums()
1016 /// .await?
1017 /// .send_unbuffered()
1018 /// .await?;
1019 /// println!("response details={response:?}");
1020 /// # Ok(()) }
1021 /// ```
1022 ///
1023 /// Precomputing the checksums can be expensive if the data source is slow
1024 /// to read. Therefore, the client library does not precompute the checksums
1025 /// by default. The client library compares the checksums computed by the
1026 /// service against its own checksums. If they do not match, the client
1027 /// library returns an error. However, the service has already created the
1028 /// object with the (likely incorrect) data.
1029 ///
1030 /// The client library currently uses the [JSON API], it is not possible to
1031 /// send the checksums at the end of the upload with this API.
1032 ///
1033 /// [JSON API]: https://cloud.google.com/storage/docs/json_api
1034 pub async fn precompute_checksums(mut self) -> Result<Self> {
1035 let mut offset = 0_u64;
1036 self.payload.seek(offset).await.map_err(Error::ser)?;
1037 while let Some(n) = self.payload.next().await.transpose().map_err(Error::ser)? {
1038 self.options.checksum.update(offset, &n);
1039 offset += n.len() as u64;
1040 }
1041 self.payload.seek(0_u64).await.map_err(Error::ser)?;
1042 let computed = self.options.checksum.finalize();
1043 let current = self.mut_resource().checksums.get_or_insert_default();
1044 checksum_update(current, computed);
1045 self.options.checksum = Checksum {
1046 crc32c: None,
1047 md5_hash: None,
1048 };
1049 Ok(self)
1050 }
1051}
1052
1053impl<T, S> WriteObject<T, S>
1054where
1055 T: StreamingSource + Send + Sync + 'static,
1056 T::Error: std::error::Error + Send + Sync + 'static,
1057 S: crate::storage::stub::Storage + 'static,
1058{
1059 /// Upload an object from a streaming source without rewinds.
1060 ///
1061 /// If the data source does **not** implement [Seek] the client library must
1062 /// buffer data sent to the service until the service confirms it has
1063 /// persisted the data. This requires more memory in the client, and when
1064 /// the buffer grows too large, may require stalling the writer until the
1065 /// service can persist the data.
1066 ///
1067 /// Use this function for data sources where it is expensive or impossible
1068 /// to restart the data source. This function is also useful when it is hard
1069 /// or impossible to predict the number of bytes emitted by a stream, even
1070 /// if restarting the stream is not too expensive.
1071 ///
1072 /// # Example
1073 /// ```
1074 /// # use google_cloud_storage::client::Storage;
1075 /// # async fn sample(client: &Storage) -> anyhow::Result<()> {
1076 /// let response = client
1077 /// .write_object("projects/_/buckets/my-bucket", "my-object", "hello world")
1078 /// .send_buffered()
1079 /// .await?;
1080 /// println!("response details={response:?}");
1081 /// # Ok(()) }
1082 /// ```
1083 pub async fn send_buffered(self) -> crate::Result<Object> {
1084 self.stub
1085 .write_object_buffered(self.payload, self.request, self.options)
1086 .await
1087 }
1088}
1089
1090// We need `Debug` to use `expect_err()` in `Result<WriteObject, ...>`.
1091impl<T, S> std::fmt::Debug for WriteObject<T, S>
1092where
1093 S: crate::storage::stub::Storage + 'static,
1094{
1095 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
1096 f.debug_struct("WriteObject")
1097 .field("stub", &self.stub)
1098 .field("request", &self.request)
1099 // skip payload, as it is not `Debug`
1100 .field("options", &self.options)
1101 .finish()
1102 }
1103}
1104
1105#[cfg(test)]
1106mod tests {
1107 use super::client::tests::{test_builder, test_inner_client};
1108 use super::*;
1109 use crate::client::Storage;
1110 use crate::model::{
1111 CommonObjectRequestParams, ObjectChecksums, ObjectContexts, ObjectCustomContextPayload,
1112 WriteObjectSpec,
1113 };
1114 use crate::storage::checksum::details::{Crc32c, Md5};
1115 use crate::streaming_source::tests::MockSeekSource;
1116 use google_cloud_auth::credentials::anonymous::Builder as Anonymous;
1117 use httptest::{Expectation, Server, matchers::*, responders::status_code};
1118 use std::error::Error as _;
1119 use std::io::{Error as IoError, ErrorKind};
1120
1121 type Result = anyhow::Result<()>;
1122
1123 // Verify `write_object()` can be used with a source that implements
1124 // `StreamingSource` **and** `Seek`
1125 #[tokio::test]
1126 async fn test_upload_streaming_source_and_seek() -> Result {
1127 struct Source;
1128 impl crate::streaming_source::StreamingSource for Source {
1129 type Error = std::io::Error;
1130 async fn next(&mut self) -> Option<std::result::Result<bytes::Bytes, Self::Error>> {
1131 None
1132 }
1133 }
1134 impl crate::streaming_source::Seek for Source {
1135 type Error = std::io::Error;
1136 async fn seek(&mut self, _offset: u64) -> std::result::Result<(), Self::Error> {
1137 Ok(())
1138 }
1139 }
1140
1141 let client = Storage::builder()
1142 .with_credentials(Anonymous::new().build())
1143 .build()
1144 .await?;
1145 let _ = client.write_object("projects/_/buckets/test-bucket", "test-object", Source);
1146 Ok(())
1147 }
1148
1149 // Verify `write_object()` can be used with a source that **only**
1150 // implements `StreamingSource`.
1151 #[tokio::test]
1152 async fn test_upload_only_streaming_source() -> Result {
1153 struct Source;
1154 impl crate::streaming_source::StreamingSource for Source {
1155 type Error = std::io::Error;
1156 async fn next(&mut self) -> Option<std::result::Result<bytes::Bytes, Self::Error>> {
1157 None
1158 }
1159 }
1160
1161 let client = Storage::builder()
1162 .with_credentials(Anonymous::new().build())
1163 .build()
1164 .await?;
1165 let _ = client.write_object("projects/_/buckets/test-bucket", "test-object", Source);
1166 Ok(())
1167 }
1168
1169 // Verify `write_object()` meets normal Send, Sync, requirements.
1170 #[tokio::test]
1171 async fn test_upload_is_send_and_static() -> Result {
1172 let client = Storage::builder()
1173 .with_credentials(Anonymous::new().build())
1174 .build()
1175 .await?;
1176
1177 fn need_send<T: Send>(_val: &T) {}
1178 fn need_sync<T: Sync>(_val: &T) {}
1179 fn need_static<T: 'static>(_val: &T) {}
1180
1181 let upload = client.write_object("projects/_/buckets/test-bucket", "test-object", "");
1182 need_send(&upload);
1183 need_sync(&upload);
1184 need_static(&upload);
1185
1186 let upload = client
1187 .write_object("projects/_/buckets/test-bucket", "test-object", "")
1188 .send_unbuffered();
1189 need_send(&upload);
1190 need_static(&upload);
1191
1192 let upload = client
1193 .write_object("projects/_/buckets/test-bucket", "test-object", "")
1194 .send_buffered();
1195 need_send(&upload);
1196 need_static(&upload);
1197
1198 Ok(())
1199 }
1200
1201 #[tokio::test]
1202 async fn write_object_metadata() -> Result {
1203 use crate::model::ObjectAccessControl;
1204 let inner = test_inner_client(test_builder()).await;
1205 let options = inner.options.clone();
1206 let stub = crate::storage::transport::Storage::new_test(inner);
1207 let key = KeyAes256::new(&[0x42; 32]).expect("hard-coded key is not an error");
1208 let mut builder =
1209 WriteObject::new(stub, "projects/_/buckets/bucket", "object", "", options)
1210 .set_if_generation_match(10)
1211 .set_if_generation_not_match(20)
1212 .set_if_metageneration_match(30)
1213 .set_if_metageneration_not_match(40)
1214 .set_predefined_acl("private")
1215 .set_acl([ObjectAccessControl::new()
1216 .set_entity("allAuthenticatedUsers")
1217 .set_role("READER")])
1218 .set_cache_control("public; max-age=7200")
1219 .set_content_disposition("inline")
1220 .set_content_encoding("gzip")
1221 .set_content_language("en")
1222 .set_content_type("text/plain")
1223 .set_contexts(ObjectContexts::new().set_custom([(
1224 "context-key",
1225 ObjectCustomContextPayload::new().set_value("context-value"),
1226 )]))
1227 .set_custom_time(wkt::Timestamp::try_from("2025-07-07T18:11:00Z")?)
1228 .set_event_based_hold(true)
1229 .set_key(key.clone())
1230 .set_metadata([("k0", "v0"), ("k1", "v1")])
1231 .set_retention(
1232 crate::model::object::Retention::new()
1233 .set_mode(crate::model::object::retention::Mode::Locked)
1234 .set_retain_until_time(wkt::Timestamp::try_from("2035-07-07T18:14:00Z")?),
1235 )
1236 .set_storage_class("ARCHIVE")
1237 .set_temporary_hold(true)
1238 .set_kms_key("test-key")
1239 .with_known_crc32c(crc32c::crc32c(b""))
1240 .with_known_md5_hash(md5::compute(b"").0);
1241
1242 let resource = builder.request.spec.resource.take().unwrap();
1243 let builder = builder;
1244 assert_eq!(
1245 &builder.request.spec,
1246 &WriteObjectSpec::new()
1247 .set_if_generation_match(10)
1248 .set_if_generation_not_match(20)
1249 .set_if_metageneration_match(30)
1250 .set_if_metageneration_not_match(40)
1251 .set_predefined_acl("private")
1252 );
1253
1254 assert_eq!(
1255 &builder.request.params,
1256 &Some(CommonObjectRequestParams::from(key))
1257 );
1258
1259 assert_eq!(
1260 resource,
1261 Object::new()
1262 .set_name("object")
1263 .set_bucket("projects/_/buckets/bucket")
1264 .set_acl([ObjectAccessControl::new()
1265 .set_entity("allAuthenticatedUsers")
1266 .set_role("READER")])
1267 .set_cache_control("public; max-age=7200")
1268 .set_content_disposition("inline")
1269 .set_content_encoding("gzip")
1270 .set_content_language("en")
1271 .set_content_type("text/plain")
1272 .set_contexts(ObjectContexts::new().set_custom([(
1273 "context-key",
1274 ObjectCustomContextPayload::new().set_value("context-value"),
1275 )]))
1276 .set_checksums(
1277 crate::model::ObjectChecksums::new()
1278 .set_crc32c(crc32c::crc32c(b""))
1279 .set_md5_hash(bytes::Bytes::from_iter(md5::compute(b"").0))
1280 )
1281 .set_custom_time(wkt::Timestamp::try_from("2025-07-07T18:11:00Z")?)
1282 .set_event_based_hold(true)
1283 .set_metadata([("k0", "v0"), ("k1", "v1")])
1284 .set_retention(
1285 crate::model::object::Retention::new()
1286 .set_mode("LOCKED")
1287 .set_retain_until_time(wkt::Timestamp::try_from("2035-07-07T18:14:00Z")?)
1288 )
1289 .set_storage_class("ARCHIVE")
1290 .set_temporary_hold(true)
1291 .set_kms_key("test-key")
1292 );
1293
1294 Ok(())
1295 }
1296
1297 #[tokio::test]
1298 async fn upload_object_options() {
1299 let inner = test_inner_client(
1300 test_builder()
1301 .with_resumable_upload_threshold(123_usize)
1302 .with_resumable_upload_buffer_size(234_usize),
1303 )
1304 .await;
1305 let options = inner.options.clone();
1306 let stub = crate::storage::transport::Storage::new_test(inner);
1307 let request = WriteObject::new(
1308 stub.clone(),
1309 "projects/_/buckets/bucket",
1310 "object",
1311 "",
1312 options.clone(),
1313 );
1314 assert_eq!(request.options.resumable_upload_threshold(), 123);
1315 assert_eq!(request.options.resumable_upload_buffer_size(), 234);
1316 assert_eq!(request.options.user_agent, None);
1317
1318 let user_agent = "quick_foxes_lazy_dogs/1.0.0";
1319 let request = WriteObject::new(stub, "projects/_/buckets/bucket", "object", "", options)
1320 .with_resumable_upload_threshold(345_usize)
1321 .with_resumable_upload_buffer_size(456_usize)
1322 .with_user_agent(user_agent);
1323 assert_eq!(request.options.resumable_upload_threshold(), 345);
1324 assert_eq!(request.options.resumable_upload_buffer_size(), 456);
1325 assert_eq!(request.options.user_agent.as_deref(), Some(user_agent));
1326 }
1327
1328 const QUICK: &str = "the quick brown fox jumps over the lazy dog";
1329 const VEXING: &str = "how vexingly quick daft zebras jump";
1330
1331 fn quick_checksum(mut engine: Checksum) -> ObjectChecksums {
1332 engine.update(0, &bytes::Bytes::from_static(QUICK.as_bytes()));
1333 engine.finalize()
1334 }
1335
1336 async fn collect<S: StreamingSource>(mut stream: S) -> anyhow::Result<Vec<u8>> {
1337 let mut collected = Vec::new();
1338 while let Some(b) = stream.next().await.transpose()? {
1339 collected.extend_from_slice(&b);
1340 }
1341 Ok(collected)
1342 }
1343
1344 #[tokio::test]
1345 async fn checksum_default() -> Result {
1346 let client = test_builder().build().await?;
1347 let upload = client
1348 .write_object("my-bucket", "my-object", QUICK)
1349 .precompute_checksums()
1350 .await?;
1351 let want = quick_checksum(Checksum {
1352 crc32c: Some(Crc32c::default()),
1353 md5_hash: None,
1354 });
1355 assert_eq!(
1356 upload.request.spec.resource.and_then(|r| r.checksums),
1357 Some(want)
1358 );
1359 let collected = collect(upload.payload).await?;
1360 assert_eq!(collected, QUICK.as_bytes());
1361 Ok(())
1362 }
1363
1364 #[tokio::test]
1365 async fn checksum_md5_and_crc32c() -> Result {
1366 let client = test_builder().build().await?;
1367 let upload = client
1368 .write_object("my-bucket", "my-object", QUICK)
1369 .compute_md5()
1370 .precompute_checksums()
1371 .await?;
1372 let want = quick_checksum(Checksum {
1373 crc32c: Some(Crc32c::default()),
1374 md5_hash: Some(Md5::default()),
1375 });
1376 assert_eq!(
1377 upload.request.spec.resource.and_then(|r| r.checksums),
1378 Some(want)
1379 );
1380 Ok(())
1381 }
1382
1383 #[tokio::test]
1384 async fn checksum_precomputed() -> Result {
1385 let mut engine = Checksum {
1386 crc32c: Some(Crc32c::default()),
1387 md5_hash: Some(Md5::default()),
1388 };
1389 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1390 let ck = engine.finalize();
1391
1392 let client = test_builder().build().await?;
1393 let upload = client
1394 .write_object("my-bucket", "my-object", QUICK)
1395 .with_known_crc32c(ck.crc32c.unwrap())
1396 .with_known_md5_hash(ck.md5_hash.clone())
1397 .precompute_checksums()
1398 .await?;
1399 // Note that the checksums do not match the data. This is intentional,
1400 // we are trying to verify that whatever is provided in with_crc32c()
1401 // and with_md5() is respected.
1402 assert_eq!(
1403 upload.request.spec.resource.and_then(|r| r.checksums),
1404 Some(ck)
1405 );
1406
1407 Ok(())
1408 }
1409
1410 #[tokio::test]
1411 async fn checksum_crc32c_known_md5_computed() -> Result {
1412 let mut engine = Checksum {
1413 crc32c: Some(Crc32c::default()),
1414 md5_hash: Some(Md5::default()),
1415 };
1416 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1417 let ck = engine.finalize();
1418
1419 let client = test_builder().build().await?;
1420 let upload = client
1421 .write_object("my-bucket", "my-object", QUICK)
1422 .compute_md5()
1423 .with_known_crc32c(ck.crc32c.unwrap())
1424 .precompute_checksums()
1425 .await?;
1426 // Note that the checksums do not match the data. This is intentional,
1427 // we are trying to verify that whatever is provided in with_known*()
1428 // is respected.
1429 let want = quick_checksum(Checksum {
1430 crc32c: None,
1431 md5_hash: Some(Md5::default()),
1432 })
1433 .set_crc32c(ck.crc32c.unwrap());
1434 assert_eq!(
1435 upload.request.spec.resource.and_then(|r| r.checksums),
1436 Some(want)
1437 );
1438
1439 Ok(())
1440 }
1441
1442 #[tokio::test]
1443 async fn checksum_mixed_then_precomputed() -> Result {
1444 let mut engine = Checksum {
1445 crc32c: Some(Crc32c::default()),
1446 md5_hash: Some(Md5::default()),
1447 };
1448 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1449 let ck = engine.finalize();
1450
1451 let client = test_builder().build().await?;
1452 let upload = client
1453 .write_object("my-bucket", "my-object", QUICK)
1454 .with_known_md5_hash(ck.md5_hash.clone())
1455 .with_known_crc32c(ck.crc32c.unwrap())
1456 .precompute_checksums()
1457 .await?;
1458 // Note that the checksums do not match the data. This is intentional,
1459 // we are trying to verify that whatever is provided in with_known*()
1460 // is respected.
1461 let want = ck.clone();
1462 assert_eq!(
1463 upload.request.spec.resource.and_then(|r| r.checksums),
1464 Some(want)
1465 );
1466
1467 Ok(())
1468 }
1469
1470 #[tokio::test]
1471 async fn checksum_full_computed_then_md5_precomputed() -> Result {
1472 let mut engine = Checksum {
1473 crc32c: Some(Crc32c::default()),
1474 md5_hash: Some(Md5::default()),
1475 };
1476 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1477 let ck = engine.finalize();
1478
1479 let client = test_builder().build().await?;
1480 let upload = client
1481 .write_object("my-bucket", "my-object", QUICK)
1482 .compute_md5()
1483 .with_known_md5_hash(ck.md5_hash.clone())
1484 .precompute_checksums()
1485 .await?;
1486 // Note that the checksums do not match the data. This is intentional,
1487 // we are trying to verify that whatever is provided in with_known*()
1488 // is respected.
1489 let want = quick_checksum(Checksum {
1490 crc32c: Some(Crc32c::default()),
1491 md5_hash: None,
1492 })
1493 .set_md5_hash(ck.md5_hash.clone());
1494 assert_eq!(
1495 upload.request.spec.resource.and_then(|r| r.checksums),
1496 Some(want)
1497 );
1498
1499 Ok(())
1500 }
1501
1502 #[tokio::test]
1503 async fn checksum_known_crc32_then_computed_md5() -> Result {
1504 let mut engine = Checksum {
1505 crc32c: Some(Crc32c::default()),
1506 md5_hash: Some(Md5::default()),
1507 };
1508 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1509 let ck = engine.finalize();
1510
1511 let client = test_builder().build().await?;
1512 let upload = client
1513 .write_object("my-bucket", "my-object", QUICK)
1514 .with_known_crc32c(ck.crc32c.unwrap())
1515 .compute_md5()
1516 .with_known_md5_hash(ck.md5_hash.clone())
1517 .precompute_checksums()
1518 .await?;
1519 // Note that the checksums do not match the data. This is intentional,
1520 // we are trying to verify that whatever is provided in with_known*()
1521 // is respected.
1522 let want = ck.clone();
1523 assert_eq!(
1524 upload.request.spec.resource.and_then(|r| r.checksums),
1525 Some(want)
1526 );
1527
1528 Ok(())
1529 }
1530
1531 #[tokio::test]
1532 async fn checksum_known_crc32_then_known_md5() -> Result {
1533 let mut engine = Checksum {
1534 crc32c: Some(Crc32c::default()),
1535 md5_hash: Some(Md5::default()),
1536 };
1537 engine.update(0, &bytes::Bytes::from_static(VEXING.as_bytes()));
1538 let ck = engine.finalize();
1539
1540 let client = test_builder().build().await?;
1541 let upload = client
1542 .write_object("my-bucket", "my-object", QUICK)
1543 .with_known_crc32c(ck.crc32c.unwrap())
1544 .with_known_md5_hash(ck.md5_hash.clone())
1545 .precompute_checksums()
1546 .await?;
1547 // Note that the checksums do not match the data. This is intentional,
1548 // we are trying to verify that whatever is provided in with_known*()
1549 // is respected.
1550 let want = ck.clone();
1551 assert_eq!(
1552 upload.request.spec.resource.and_then(|r| r.checksums),
1553 Some(want)
1554 );
1555
1556 Ok(())
1557 }
1558
1559 #[tokio::test]
1560 async fn precompute_checksums_seek_error() -> Result {
1561 let mut source = MockSeekSource::new();
1562 source
1563 .expect_seek()
1564 .once()
1565 .returning(|_| Err(IoError::new(ErrorKind::Deadlock, "test-only")));
1566
1567 let client = test_builder().build().await?;
1568 let err = client
1569 .write_object("my-bucket", "my-object", source)
1570 .precompute_checksums()
1571 .await
1572 .expect_err("seek() returns an error");
1573 assert!(err.is_serialization(), "{err:?}");
1574 assert!(
1575 err.source()
1576 .and_then(|e| e.downcast_ref::<IoError>())
1577 .is_some(),
1578 "{err:?}"
1579 );
1580
1581 Ok(())
1582 }
1583
1584 #[tokio::test]
1585 async fn precompute_checksums_next_error() -> Result {
1586 let mut source = MockSeekSource::new();
1587 source.expect_seek().returning(|_| Ok(()));
1588 let mut seq = mockall::Sequence::new();
1589 source
1590 .expect_next()
1591 .times(3)
1592 .in_sequence(&mut seq)
1593 .returning(|| Some(Ok(bytes::Bytes::new())));
1594 source
1595 .expect_next()
1596 .once()
1597 .in_sequence(&mut seq)
1598 .returning(|| Some(Err(IoError::new(ErrorKind::BrokenPipe, "test-only"))));
1599
1600 let client = test_builder().build().await?;
1601 let err = client
1602 .write_object("my-bucket", "my-object", source)
1603 .precompute_checksums()
1604 .await
1605 .expect_err("seek() returns an error");
1606 assert!(err.is_serialization(), "{err:?}");
1607 assert!(
1608 err.source()
1609 .and_then(|e| e.downcast_ref::<IoError>())
1610 .is_some(),
1611 "{err:?}"
1612 );
1613
1614 Ok(())
1615 }
1616
1617 #[tokio::test]
1618 async fn write_object_with_user_agent() -> Result {
1619 use http::header::USER_AGENT;
1620
1621 let user_agent = "quicker_foxes_lazier_dogs/1.2.3";
1622 let server = Server::run();
1623 server.expect(
1624 Expectation::matching(all_of![
1625 request::method_path("POST", "/upload/storage/v1/b/test-bucket/o"),
1626 request::headers(contains((USER_AGENT.as_str(), user_agent))),
1627 request::query(url_decoded(contains(("uploadType", "multipart")))),
1628 ])
1629 .times(1)
1630 .respond_with(status_code(200).body("{}")),
1631 );
1632
1633 let client = Storage::builder()
1634 .with_endpoint(format!("http://{}", server.addr()))
1635 .with_credentials(Anonymous::new().build())
1636 .build()
1637 .await?;
1638 let _ = client
1639 .write_object(
1640 "projects/_/buckets/test-bucket",
1641 "test-object",
1642 "hello world",
1643 )
1644 .with_user_agent(user_agent)
1645 .send_unbuffered()
1646 .await?;
1647
1648 Ok(())
1649 }
1650
1651 #[tokio::test]
1652 async fn debug() -> Result {
1653 let client = test_builder().build().await?;
1654 let upload = client
1655 .write_object("my-bucket", "my-object", "")
1656 .precompute_checksums()
1657 .await;
1658
1659 let fmt = format!("{upload:?}");
1660 ["WriteObject", "inner", "spec", "options", "checksum"]
1661 .into_iter()
1662 .for_each(|text| {
1663 assert!(fmt.contains(text), "expected {text} in {fmt}");
1664 });
1665 Ok(())
1666 }
1667}