1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
use super::CrateVersion;
use serde_json;
use std::path::Path;
use git2::{
build::RepoBuilder, Delta, DiffFormat, Error as GitError, ErrorClass, Object, ObjectType, Oid,
Reference, Repository, Tree,
};
use std::str;
static INDEX_GIT_URL: &str = "https://github.com/rust-lang/crates.io-index";
static LAST_SEEN_REFNAME: &str = "refs/heads/crates-index-diff_last-seen";
static EMPTY_TREE_HASH: &str = "4b825dc642cb6eb9a060e54bf8d69288fbee4904";
static LINE_ADDED_INDICATOR: char = '+';
pub struct Index {
pub seen_ref_name: &'static str,
repo: Repository,
}
impl Index {
pub fn repository(&self) -> &Repository {
&self.repo
}
pub fn last_seen_reference(&self) -> Result<Reference, GitError> {
self.repo.find_reference(self.seen_ref_name)
}
pub fn from_path_or_cloned(path: impl AsRef<Path>) -> Result<Index, GitError> {
let repo = Repository::open(path.as_ref()).or_else(|err| {
if err.class() == ErrorClass::Repository {
RepoBuilder::new()
.bare(true)
.clone(INDEX_GIT_URL, path.as_ref())
} else {
Err(err)
}
})?;
Ok(Index {
repo,
seen_ref_name: LAST_SEEN_REFNAME,
})
}
pub fn fetch_changes(&self) -> Result<Vec<CrateVersion>, GitError> {
let from = self
.last_seen_reference()
.and_then(|r| {
r.target().ok_or_else(|| {
GitError::from_str("last-seen reference did not have a valid target")
})
})
.or_else(|_| Oid::from_str(EMPTY_TREE_HASH))?;
let to = {
self.repo
.find_remote("origin")
.and_then(|mut r| r.fetch(&["refs/heads/*:refs/remotes/origin/*"], None, None))?;
let latest_fetched_commit_oid =
self.repo.refname_to_id("refs/remotes/origin/master")?;
self.last_seen_reference()
.and_then(|mut seen_ref| {
seen_ref.set_target(
latest_fetched_commit_oid,
"updating seen-ref head to latest fetched commit",
)
})
.or_else(|_err| {
self.repo.reference(
self.seen_ref_name,
latest_fetched_commit_oid,
true,
"creating seen-ref at latest fetched commit",
)
})?;
latest_fetched_commit_oid
};
self.changes_from_objects(
&self.repo.find_object(from, None)?,
&self.repo.find_object(to, None)?,
)
}
pub fn changes(
&self,
from: impl AsRef<str>,
to: impl AsRef<str>,
) -> Result<Vec<CrateVersion>, GitError> {
self.changes_from_objects(
&self.repo.revparse_single(from.as_ref())?,
&self.repo.revparse_single(to.as_ref())?,
)
}
pub fn changes_from_objects(
&self,
from: &Object,
to: &Object,
) -> Result<Vec<CrateVersion>, GitError> {
fn into_tree<'a>(repo: &'a Repository, obj: &Object) -> Result<Tree<'a>, GitError> {
repo.find_tree(match obj.kind() {
Some(ObjectType::Commit) => obj
.as_commit()
.expect("object of kind commit yields commit")
.tree_id(),
_ =>
{
obj.id()
}
})
}
let diff = self.repo.diff_tree_to_tree(
Some(&into_tree(&self.repo, from)?),
Some(&into_tree(&self.repo, to)?),
None,
)?;
let mut res: Vec<CrateVersion> = Vec::new();
diff.print(DiffFormat::Patch, |delta, _, diffline| {
if diffline.origin() != LINE_ADDED_INDICATOR {
return true;
}
if !match delta.status() {
Delta::Added | Delta::Modified => true,
_ => false,
} {
return true;
}
let content = match str::from_utf8(diffline.content()) {
Ok(c) => c,
Err(_) => return true,
};
if let Ok(c) = serde_json::from_str(content) {
res.push(c)
}
true
})
.map(|_| res)
}
}