1#![expect(missing_docs)]
16
17use std::fmt::Debug;
18use std::fs;
19use std::fs::File;
20use std::io::Cursor;
21use std::io::Read as _;
22use std::io::Write as _;
23use std::path::Path;
24use std::path::PathBuf;
25use std::pin::Pin;
26use std::time::SystemTime;
27
28use async_trait::async_trait;
29use blake2::Blake2b512;
30use blake2::Digest as _;
31use futures::stream;
32use futures::stream::BoxStream;
33use pollster::FutureExt as _;
34use prost::Message as _;
35use tempfile::NamedTempFile;
36use tokio::io::AsyncRead;
37use tokio::io::AsyncReadExt as _;
38
39use crate::backend::Backend;
40use crate::backend::BackendError;
41use crate::backend::BackendResult;
42use crate::backend::ChangeId;
43use crate::backend::Commit;
44use crate::backend::CommitId;
45use crate::backend::CopyHistory;
46use crate::backend::CopyId;
47use crate::backend::CopyRecord;
48use crate::backend::FileId;
49use crate::backend::MergedTreeId;
50use crate::backend::MillisSinceEpoch;
51use crate::backend::SecureSig;
52use crate::backend::Signature;
53use crate::backend::SigningFn;
54use crate::backend::SymlinkId;
55use crate::backend::Timestamp;
56use crate::backend::Tree;
57use crate::backend::TreeId;
58use crate::backend::TreeValue;
59use crate::backend::make_root_commit;
60use crate::content_hash::blake2b_hash;
61use crate::file_util::persist_content_addressed_temp_file;
62use crate::index::Index;
63use crate::merge::MergeBuilder;
64use crate::object_id::ObjectId;
65use crate::repo_path::RepoPath;
66use crate::repo_path::RepoPathBuf;
67use crate::repo_path::RepoPathComponentBuf;
68
69const COMMIT_ID_LENGTH: usize = 64;
70const CHANGE_ID_LENGTH: usize = 16;
71
72fn map_not_found_err(err: std::io::Error, id: &impl ObjectId) -> BackendError {
73 if err.kind() == std::io::ErrorKind::NotFound {
74 BackendError::ObjectNotFound {
75 object_type: id.object_type(),
76 hash: id.hex(),
77 source: Box::new(err),
78 }
79 } else {
80 BackendError::ReadObject {
81 object_type: id.object_type(),
82 hash: id.hex(),
83 source: Box::new(err),
84 }
85 }
86}
87
88fn to_other_err(err: impl Into<Box<dyn std::error::Error + Send + Sync>>) -> BackendError {
89 BackendError::Other(err.into())
90}
91
92#[derive(Debug)]
93pub struct SimpleBackend {
94 path: PathBuf,
95 root_commit_id: CommitId,
96 root_change_id: ChangeId,
97 empty_tree_id: TreeId,
98}
99
100impl SimpleBackend {
101 pub fn name() -> &'static str {
102 "Simple"
103 }
104
105 pub fn init(store_path: &Path) -> Self {
106 fs::create_dir(store_path.join("commits")).unwrap();
107 fs::create_dir(store_path.join("trees")).unwrap();
108 fs::create_dir(store_path.join("files")).unwrap();
109 fs::create_dir(store_path.join("symlinks")).unwrap();
110 fs::create_dir(store_path.join("conflicts")).unwrap();
111 let backend = Self::load(store_path);
112 let empty_tree_id = backend
113 .write_tree(RepoPath::root(), &Tree::default())
114 .block_on()
115 .unwrap();
116 assert_eq!(empty_tree_id, backend.empty_tree_id);
117 backend
118 }
119
120 pub fn load(store_path: &Path) -> Self {
121 let root_commit_id = CommitId::from_bytes(&[0; COMMIT_ID_LENGTH]);
122 let root_change_id = ChangeId::from_bytes(&[0; CHANGE_ID_LENGTH]);
123 let empty_tree_id = TreeId::from_hex(
124 "482ae5a29fbe856c7272f2071b8b0f0359ee2d89ff392b8a900643fbd0836eccd067b8bf41909e206c90d45d6e7d8b6686b93ecaee5fe1a9060d87b672101310",
125 );
126 Self {
127 path: store_path.to_path_buf(),
128 root_commit_id,
129 root_change_id,
130 empty_tree_id,
131 }
132 }
133
134 fn file_path(&self, id: &FileId) -> PathBuf {
135 self.path.join("files").join(id.hex())
136 }
137
138 fn symlink_path(&self, id: &SymlinkId) -> PathBuf {
139 self.path.join("symlinks").join(id.hex())
140 }
141
142 fn tree_path(&self, id: &TreeId) -> PathBuf {
143 self.path.join("trees").join(id.hex())
144 }
145
146 fn commit_path(&self, id: &CommitId) -> PathBuf {
147 self.path.join("commits").join(id.hex())
148 }
149}
150
151#[async_trait]
152impl Backend for SimpleBackend {
153 fn name(&self) -> &str {
154 Self::name()
155 }
156
157 fn commit_id_length(&self) -> usize {
158 COMMIT_ID_LENGTH
159 }
160
161 fn change_id_length(&self) -> usize {
162 CHANGE_ID_LENGTH
163 }
164
165 fn root_commit_id(&self) -> &CommitId {
166 &self.root_commit_id
167 }
168
169 fn root_change_id(&self) -> &ChangeId {
170 &self.root_change_id
171 }
172
173 fn empty_tree_id(&self) -> &TreeId {
174 &self.empty_tree_id
175 }
176
177 fn concurrency(&self) -> usize {
178 1
179 }
180
181 async fn read_file(
182 &self,
183 path: &RepoPath,
184 id: &FileId,
185 ) -> BackendResult<Pin<Box<dyn AsyncRead + Send>>> {
186 let disk_path = self.file_path(id);
187 let mut file = File::open(disk_path).map_err(|err| map_not_found_err(err, id))?;
188 let mut buf = vec![];
189 file.read_to_end(&mut buf)
190 .map_err(|err| BackendError::ReadFile {
191 path: path.to_owned(),
192 id: id.clone(),
193 source: err.into(),
194 })?;
195 Ok(Box::pin(Cursor::new(buf)))
196 }
197
198 async fn write_file(
199 &self,
200 _path: &RepoPath,
201 contents: &mut (dyn AsyncRead + Send + Unpin),
202 ) -> BackendResult<FileId> {
203 let temp_file = NamedTempFile::new_in(&self.path).map_err(to_other_err)?;
205 let mut file = temp_file.as_file();
206 let mut hasher = Blake2b512::new();
207 let mut buff: Vec<u8> = vec![0; 1 << 14];
208 loop {
209 let bytes_read = contents.read(&mut buff).await.map_err(to_other_err)?;
210 if bytes_read == 0 {
211 break;
212 }
213 let bytes = &buff[..bytes_read];
214 file.write_all(bytes).map_err(to_other_err)?;
215 hasher.update(bytes);
216 }
217 file.flush().map_err(to_other_err)?;
218 let id = FileId::new(hasher.finalize().to_vec());
219
220 persist_content_addressed_temp_file(temp_file, self.file_path(&id))
221 .map_err(to_other_err)?;
222 Ok(id)
223 }
224
225 async fn read_symlink(&self, _path: &RepoPath, id: &SymlinkId) -> BackendResult<String> {
226 let path = self.symlink_path(id);
227 let target = fs::read_to_string(path).map_err(|err| map_not_found_err(err, id))?;
228 Ok(target)
229 }
230
231 async fn write_symlink(&self, _path: &RepoPath, target: &str) -> BackendResult<SymlinkId> {
232 let mut temp_file = NamedTempFile::new_in(&self.path).map_err(to_other_err)?;
234 temp_file
235 .write_all(target.as_bytes())
236 .map_err(to_other_err)?;
237 let mut hasher = Blake2b512::new();
238 hasher.update(target.as_bytes());
239 let id = SymlinkId::new(hasher.finalize().to_vec());
240
241 persist_content_addressed_temp_file(temp_file, self.symlink_path(&id))
242 .map_err(to_other_err)?;
243 Ok(id)
244 }
245
246 async fn read_copy(&self, _id: &CopyId) -> BackendResult<CopyHistory> {
247 Err(BackendError::Unsupported(
248 "The simple backend doesn't support copies".to_string(),
249 ))
250 }
251
252 async fn write_copy(&self, _contents: &CopyHistory) -> BackendResult<CopyId> {
253 Err(BackendError::Unsupported(
254 "The simple backend doesn't support copies".to_string(),
255 ))
256 }
257
258 async fn get_related_copies(&self, _copy_id: &CopyId) -> BackendResult<Vec<CopyHistory>> {
259 Err(BackendError::Unsupported(
260 "The simple backend doesn't support copies".to_string(),
261 ))
262 }
263
264 async fn read_tree(&self, _path: &RepoPath, id: &TreeId) -> BackendResult<Tree> {
265 let path = self.tree_path(id);
266 let buf = fs::read(path).map_err(|err| map_not_found_err(err, id))?;
267
268 let proto = crate::protos::simple_store::Tree::decode(&*buf).map_err(to_other_err)?;
269 Ok(tree_from_proto(proto))
270 }
271
272 async fn write_tree(&self, _path: &RepoPath, tree: &Tree) -> BackendResult<TreeId> {
273 let temp_file = NamedTempFile::new_in(&self.path).map_err(to_other_err)?;
275
276 let proto = tree_to_proto(tree);
277 temp_file
278 .as_file()
279 .write_all(&proto.encode_to_vec())
280 .map_err(to_other_err)?;
281
282 let id = TreeId::new(blake2b_hash(tree).to_vec());
283
284 persist_content_addressed_temp_file(temp_file, self.tree_path(&id))
285 .map_err(to_other_err)?;
286 Ok(id)
287 }
288
289 async fn read_commit(&self, id: &CommitId) -> BackendResult<Commit> {
290 if *id == self.root_commit_id {
291 return Ok(make_root_commit(
292 self.root_change_id().clone(),
293 self.empty_tree_id.clone(),
294 ));
295 }
296
297 let path = self.commit_path(id);
298 let buf = fs::read(path).map_err(|err| map_not_found_err(err, id))?;
299
300 let proto = crate::protos::simple_store::Commit::decode(&*buf).map_err(to_other_err)?;
301 Ok(commit_from_proto(proto))
302 }
303
304 async fn write_commit(
305 &self,
306 mut commit: Commit,
307 sign_with: Option<&mut SigningFn>,
308 ) -> BackendResult<(CommitId, Commit)> {
309 assert!(commit.secure_sig.is_none(), "commit.secure_sig was set");
310
311 if commit.parents.is_empty() {
312 return Err(BackendError::Other(
313 "Cannot write a commit with no parents".into(),
314 ));
315 }
316 let temp_file = NamedTempFile::new_in(&self.path).map_err(to_other_err)?;
318
319 let mut proto = commit_to_proto(&commit);
320 if let Some(sign) = sign_with {
321 let data = proto.encode_to_vec();
322 let sig = sign(&data).map_err(to_other_err)?;
323 proto.secure_sig = Some(sig.clone());
324 commit.secure_sig = Some(SecureSig { data, sig });
325 }
326
327 temp_file
328 .as_file()
329 .write_all(&proto.encode_to_vec())
330 .map_err(to_other_err)?;
331
332 let id = CommitId::new(blake2b_hash(&commit).to_vec());
333
334 persist_content_addressed_temp_file(temp_file, self.commit_path(&id))
335 .map_err(to_other_err)?;
336 Ok((id, commit))
337 }
338
339 fn get_copy_records(
340 &self,
341 _paths: Option<&[RepoPathBuf]>,
342 _root: &CommitId,
343 _head: &CommitId,
344 ) -> BackendResult<BoxStream<'_, BackendResult<CopyRecord>>> {
345 Ok(Box::pin(stream::empty()))
346 }
347
348 fn gc(&self, _index: &dyn Index, _keep_newer: SystemTime) -> BackendResult<()> {
349 Ok(())
350 }
351}
352
353#[expect(clippy::assigning_clones)]
354pub fn commit_to_proto(commit: &Commit) -> crate::protos::simple_store::Commit {
355 let mut proto = crate::protos::simple_store::Commit::default();
356 for parent in &commit.parents {
357 proto.parents.push(parent.to_bytes());
358 }
359 for predecessor in &commit.predecessors {
360 proto.predecessors.push(predecessor.to_bytes());
361 }
362 proto.root_tree = commit
363 .root_tree
364 .as_merge()
365 .iter()
366 .map(|id| id.to_bytes())
367 .collect();
368 proto.change_id = commit.change_id.to_bytes();
369 proto.description = commit.description.clone();
370 proto.author = Some(signature_to_proto(&commit.author));
371 proto.committer = Some(signature_to_proto(&commit.committer));
372 proto
373}
374
375fn commit_from_proto(mut proto: crate::protos::simple_store::Commit) -> Commit {
376 let secure_sig = proto.secure_sig.take().map(|sig| SecureSig {
379 data: proto.encode_to_vec(),
380 sig,
381 });
382
383 let parents = proto.parents.into_iter().map(CommitId::new).collect();
384 let predecessors = proto.predecessors.into_iter().map(CommitId::new).collect();
385 let merge_builder: MergeBuilder<_> = proto.root_tree.into_iter().map(TreeId::new).collect();
386 let root_tree = MergedTreeId::new(merge_builder.build());
387 let change_id = ChangeId::new(proto.change_id);
388 Commit {
389 parents,
390 predecessors,
391 root_tree,
392 change_id,
393 description: proto.description,
394 author: signature_from_proto(proto.author.unwrap_or_default()),
395 committer: signature_from_proto(proto.committer.unwrap_or_default()),
396 secure_sig,
397 }
398}
399
400fn tree_to_proto(tree: &Tree) -> crate::protos::simple_store::Tree {
401 let mut proto = crate::protos::simple_store::Tree::default();
402 for entry in tree.entries() {
403 proto
404 .entries
405 .push(crate::protos::simple_store::tree::Entry {
406 name: entry.name().as_internal_str().to_owned(),
407 value: Some(tree_value_to_proto(entry.value())),
408 });
409 }
410 proto
411}
412
413fn tree_from_proto(proto: crate::protos::simple_store::Tree) -> Tree {
414 let entries = proto
416 .entries
417 .into_iter()
418 .map(|proto_entry| {
419 let value = tree_value_from_proto(proto_entry.value.unwrap());
420 (RepoPathComponentBuf::new(proto_entry.name).unwrap(), value)
421 })
422 .collect();
423 Tree::from_sorted_entries(entries)
424}
425
426fn tree_value_to_proto(value: &TreeValue) -> crate::protos::simple_store::TreeValue {
427 let mut proto = crate::protos::simple_store::TreeValue::default();
428 match value {
429 TreeValue::File {
430 id,
431 executable,
432 copy_id,
433 } => {
434 proto.value = Some(crate::protos::simple_store::tree_value::Value::File(
435 crate::protos::simple_store::tree_value::File {
436 id: id.to_bytes(),
437 executable: *executable,
438 copy_id: copy_id.to_bytes(),
439 },
440 ));
441 }
442 TreeValue::Symlink(id) => {
443 proto.value = Some(crate::protos::simple_store::tree_value::Value::SymlinkId(
444 id.to_bytes(),
445 ));
446 }
447 TreeValue::GitSubmodule(_id) => {
448 panic!("cannot store git submodules");
449 }
450 TreeValue::Tree(id) => {
451 proto.value = Some(crate::protos::simple_store::tree_value::Value::TreeId(
452 id.to_bytes(),
453 ));
454 }
455 }
456 proto
457}
458
459fn tree_value_from_proto(proto: crate::protos::simple_store::TreeValue) -> TreeValue {
460 match proto.value.unwrap() {
461 crate::protos::simple_store::tree_value::Value::TreeId(id) => {
462 TreeValue::Tree(TreeId::new(id))
463 }
464 crate::protos::simple_store::tree_value::Value::File(
465 crate::protos::simple_store::tree_value::File {
466 id,
467 executable,
468 copy_id,
469 },
470 ) => TreeValue::File {
471 id: FileId::new(id),
472 executable,
473 copy_id: CopyId::new(copy_id),
474 },
475 crate::protos::simple_store::tree_value::Value::SymlinkId(id) => {
476 TreeValue::Symlink(SymlinkId::new(id))
477 }
478 }
479}
480
481fn signature_to_proto(signature: &Signature) -> crate::protos::simple_store::commit::Signature {
482 crate::protos::simple_store::commit::Signature {
483 name: signature.name.clone(),
484 email: signature.email.clone(),
485 timestamp: Some(crate::protos::simple_store::commit::Timestamp {
486 millis_since_epoch: signature.timestamp.timestamp.0,
487 tz_offset: signature.timestamp.tz_offset,
488 }),
489 }
490}
491
492fn signature_from_proto(proto: crate::protos::simple_store::commit::Signature) -> Signature {
493 let timestamp = proto.timestamp.unwrap_or_default();
494 Signature {
495 name: proto.name,
496 email: proto.email,
497 timestamp: Timestamp {
498 timestamp: MillisSinceEpoch(timestamp.millis_since_epoch),
499 tz_offset: timestamp.tz_offset,
500 },
501 }
502}
503
504#[cfg(test)]
505mod tests {
506 use assert_matches::assert_matches;
507 use pollster::FutureExt as _;
508
509 use super::*;
510 use crate::tests::new_temp_dir;
511
512 #[test]
514 fn write_commit_parents() {
515 let temp_dir = new_temp_dir();
516 let store_path = temp_dir.path();
517
518 let backend = SimpleBackend::init(store_path);
519 let mut commit = Commit {
520 parents: vec![],
521 predecessors: vec![],
522 root_tree: MergedTreeId::resolved(backend.empty_tree_id().clone()),
523 change_id: ChangeId::from_hex("abc123"),
524 description: "".to_string(),
525 author: create_signature(),
526 committer: create_signature(),
527 secure_sig: None,
528 };
529
530 let write_commit = |commit: Commit| -> BackendResult<(CommitId, Commit)> {
531 backend.write_commit(commit, None).block_on()
532 };
533
534 commit.parents = vec![];
536 assert_matches!(
537 write_commit(commit.clone()),
538 Err(BackendError::Other(err)) if err.to_string().contains("no parents")
539 );
540
541 commit.parents = vec![backend.root_commit_id().clone()];
543 let first_id = write_commit(commit.clone()).unwrap().0;
544 let first_commit = backend.read_commit(&first_id).block_on().unwrap();
545 assert_eq!(first_commit, commit);
546
547 commit.parents = vec![first_id.clone()];
549 let second_id = write_commit(commit.clone()).unwrap().0;
550 let second_commit = backend.read_commit(&second_id).block_on().unwrap();
551 assert_eq!(second_commit, commit);
552
553 commit.parents = vec![first_id.clone(), second_id.clone()];
555 let merge_id = write_commit(commit.clone()).unwrap().0;
556 let merge_commit = backend.read_commit(&merge_id).block_on().unwrap();
557 assert_eq!(merge_commit, commit);
558
559 commit.parents = vec![first_id, backend.root_commit_id().clone()];
561 let root_merge_id = write_commit(commit.clone()).unwrap().0;
562 let root_merge_commit = backend.read_commit(&root_merge_id).block_on().unwrap();
563 assert_eq!(root_merge_commit, commit);
564 }
565
566 fn create_signature() -> Signature {
567 Signature {
568 name: "Someone".to_string(),
569 email: "someone@example.com".to_string(),
570 timestamp: Timestamp {
571 timestamp: MillisSinceEpoch(0),
572 tz_offset: 0,
573 },
574 }
575 }
576}