Skip to content

Optimize the reverse dependencies endpoint #623

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions migrations/20170312165531_index_dependencies/down.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
-- Reverts the matching up.sql by dropping the (crate_id, version_id) index on
-- the dependencies table.
-- NOTE(review): up.sql creates the index without an explicit name, so this
-- relies on the database's auto-generated name matching — confirm.
DROP INDEX dependencies_crate_id_version_id_idx;
1 change: 1 addition & 0 deletions migrations/20170312165531_index_dependencies/up.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
-- Composite index on dependencies (crate_id, version_id). The reverse
-- dependencies query filters on dependencies.crate_id and joins on
-- dependencies.version_id.
-- No index name is given here; down.sql drops
-- dependencies_crate_id_version_id_idx.
CREATE INDEX ON dependencies (crate_id, version_id);
38 changes: 9 additions & 29 deletions src/krate.rs
Original file line number Diff line number Diff line change
Expand Up @@ -576,38 +576,18 @@ impl Crate {
offset: i64,
limit: i64)
-> CargoResult<(Vec<(Dependency, String, i32)>, i64)> {
let select_sql = "
FROM dependencies
INNER JOIN (
SELECT versions.*,
row_number() OVER (PARTITION BY crate_id ORDER BY to_semver_no_prerelease(num) DESC NULLS LAST) rn
FROM versions
WHERE NOT yanked
) versions
ON versions.id = dependencies.version_id
INNER JOIN crates
ON crates.id = versions.crate_id
WHERE dependencies.crate_id = $1
AND rn = 1
";
let fetch_sql = format!("SELECT DISTINCT ON (crate_downloads, crate_name)
dependencies.*,
crates.downloads AS crate_downloads,
crates.name AS crate_name
{}
ORDER BY crate_downloads DESC
OFFSET $2
LIMIT $3",
select_sql);
let count_sql = format!("SELECT COUNT(DISTINCT(crates.id)) {}", select_sql);

let stmt = conn.prepare(&fetch_sql)?;
let vec: Vec<_> = stmt.query(&[&self.id, &offset, &limit])?
let stmt = conn.prepare(include_str!("krate_reverse_dependencies.sql"))?;

let rows = stmt.query(&[&self.id, &offset, &limit])?;
let cnt = if rows.is_empty() {
0i64
} else {
rows.get(0).get("total")
};
let vec: Vec<_> = rows
.iter()
.map(|r| (Model::from_row(&r), r.get("crate_name"), r.get("crate_downloads")))
.collect();
let stmt = conn.prepare(&count_sql)?;
let cnt: i64 = stmt.query(&[&self.id])?.iter().next().unwrap().get(0);

Ok((vec, cnt))
}
Expand Down
37 changes: 37 additions & 0 deletions src/krate_reverse_dependencies.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
-- Reverse dependencies of one crate: at most one row per dependent crate,
-- restricted to crates whose top-ranked non-yanked version has the dependency.
--
-- Parameters:
--   $1  id of the crate being depended upon (matched against dependencies.crate_id)
--   $2  number of rows to skip (OFFSET)
--   $3  maximum number of rows to return (LIMIT)
--
-- Every returned row carries the dependencies columns plus crate_downloads,
-- crate_name and total. total is the row count of the inner query before
-- OFFSET/LIMIT are applied, so a page with no rows carries no total at all.
--
-- Apply pagination to the whole thing
SELECT *, COUNT(*) OVER () as total FROM (
-- Multiple dependency rows can exist for the same dependent crate; keep only
-- one row per (crate_downloads, crate_name) pair
SELECT DISTINCT ON (crate_downloads, crate_name)
dependencies.*,
crates.downloads AS crate_downloads,
crates.name AS crate_name
FROM dependencies
-- We only want the crates whose *max* version is dependent, so we join on a
-- subselect that includes the versions with their ordinal position
INNER JOIN (
SELECT versions.*,
-- rn = 1 marks the top-ranked non-yanked version of each crate.
-- NOTE(review): presumably to_semver_no_prerelease returns NULL for
-- prerelease versions so that NULLS LAST ranks them below releases — confirm
-- against the function's definition.
row_number() OVER (
PARTITION BY crate_id
ORDER BY to_semver_no_prerelease(num) DESC NULLS LAST
) rn
FROM versions
WHERE NOT yanked
-- This is completely redundant, but it's faster to filter the versions
-- early even if this subselect is done via an index scan.
AND crate_id = ANY(
-- Ids of every crate that has at least one version depending on $1
SELECT versions.crate_id
FROM versions
INNER JOIN dependencies
ON dependencies.version_id = versions.id
WHERE dependencies.crate_id = $1
)
) versions
ON versions.id = dependencies.version_id
INNER JOIN crates
ON crates.id = versions.crate_id
WHERE dependencies.crate_id = $1
AND rn = 1
-- Most-downloaded dependent crates first
ORDER BY crate_downloads DESC
) t
-- NOTE(review): the outer query has no ORDER BY of its own, so the page order
-- relies on the subselect's ordering carrying through — confirm.
OFFSET $2
LIMIT $3