Skip to content

Fetch readme from source archive if available for crate details page #2146

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 2 commits into from
Aug 2, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions src/storage/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@ use crate::web::metrics::RenderingTimesRecorder;
use crate::{db::Pool, Config, InstanceMetrics};
use anyhow::{anyhow, ensure};
use chrono::{DateTime, Utc};
use fn_error_context::context;
use path_slash::PathExt;
use std::io::BufReader;
use std::num::NonZeroU64;
Expand Down Expand Up @@ -199,6 +200,7 @@ impl Storage {
})
}

#[context("fetching {path} from {name} {version} (archive: {archive_storage})")]
pub(crate) fn fetch_source_file(
&self,
name: &str,
Expand Down
23 changes: 23 additions & 0 deletions src/test/fakes.rs
Original file line number Diff line number Diff line change
Expand Up @@ -214,6 +214,12 @@ impl<'a> FakeRelease<'a> {
self.source_file("README.md", content.as_bytes())
}

/// Sets this fake release's `readme` field to `content` and returns the builder.
///
/// Only the `readme` field is written here; no source file is registered by this method.
/// NOTE(review): judging by the name, the field is presumably what ends up in the database
/// record for the release — confirm against the code that consumes `self.readme`.
///
/// NOTE: this should be markdown. It will be rendered as HTML when served.
pub(crate) fn readme_only_database(mut self, content: &'a str) -> Self {
// Store the borrowed text as-is; the builder is handed back so calls can be chained.
self.readme = Some(content);
self
}

pub(crate) fn add_owner(mut self, owner: CrateOwner) -> Self {
self.registry_crate_data.owners.push(owner);
self
Expand Down Expand Up @@ -347,6 +353,23 @@ impl<'a> FakeRelease<'a> {
debug!("before upload source");
let source_tmp = create_temp_dir();
store_files_into(&self.source_files, source_tmp.path())?;

if !self
.source_files
.iter()
.any(|&(path, _)| path == "Cargo.toml")
{
let MetadataPackage { name, version, .. } = &package;
let content = format!(
r#"
[package]
name = "{name}"
version = "{version}"
"#
);
store_files_into(&[("Cargo.toml", content.as_bytes())], source_tmp.path())?;
}

let (source_meta, algs) = upload_files(FileKind::Sources, source_tmp.path())?;
debug!("added source files {}", source_meta);

Expand Down
111 changes: 101 additions & 10 deletions src/web/crate_details.rs
Original file line number Diff line number Diff line change
Expand Up @@ -4,13 +4,15 @@ use crate::{
db::Pool,
impl_axum_webpage,
repositories::RepositoryStatsUpdater,
storage::PathNotFoundError,
web::{
cache::CachePolicy,
encode_url_path,
error::{AxumNope, AxumResult},
},
Storage,
};
use anyhow::anyhow;
use anyhow::{Context, Result};
use axum::{
extract::{Extension, Path},
response::{IntoResponse, Response as AxumResponse},
Expand Down Expand Up @@ -237,6 +239,42 @@ impl CrateDetails {
Ok(Some(crate_details))
}

/// Looks up the readme text for this release among its stored source files.
///
/// `Cargo.toml` is fetched and parsed first; its `package.readme` key decides which paths
/// are tried, in order:
///
/// * `true`: only `README.md`
/// * `false`: nothing is tried and the result is `Ok(None)`
/// * a string: only that path
/// * anything else, including a missing key: `README.md`, `README.txt`, `README`
///
/// Returns the content of the first candidate that exists, or `Ok(None)` when none does.
///
/// # Errors
///
/// Fails when `Cargo.toml` cannot be fetched or parsed, when fetching a candidate fails for
/// any reason other than [`PathNotFoundError`], or when the readme found is not valid UTF-8.
#[fn_error_context::context("fetching readme for {} {}", self.name, self.version)]
fn fetch_readme(&self, storage: &Storage) -> anyhow::Result<Option<String>> {
    // Every lookup targets the same release; only the path differs.
    let fetch = |path: &str| {
        storage.fetch_source_file(&self.name, &self.version, path, self.archive_storage)
    };

    let cargo_toml = fetch("Cargo.toml")?;
    let cargo_toml = String::from_utf8(cargo_toml.content).context("parsing Cargo.toml")?;
    let cargo_toml = cargo_toml
        .parse::<toml::Value>()
        .context("parsing Cargo.toml")?;

    let readme_key = cargo_toml
        .get("package")
        .and_then(|package| package.get("readme"));
    let candidates = match readme_key {
        Some(toml::Value::String(custom)) => vec![custom.as_str()],
        Some(toml::Value::Boolean(false)) => Vec::new(),
        Some(toml::Value::Boolean(true)) => vec!["README.md"],
        // Key absent (or of an unexpected type): fall back to the default file names.
        _ => vec!["README.md", "README.txt", "README"],
    };

    for path in candidates {
        let blob = match fetch(path) {
            Ok(blob) => blob,
            // A missing file is expected; move on to the next candidate.
            Err(err) if err.is::<PathNotFoundError>() => continue,
            Err(err) => return Err(err),
        };
        let text = String::from_utf8(blob.content)
            .with_context(|| format!("parsing {path} content"))?;
        return Ok(Some(text));
    }

    Ok(None)
}

/// Returns the latest non-yanked, non-prerelease release of this crate (or latest
/// yanked/prereleased if that is all that exist).
pub fn latest_release(&self) -> &Release {
Expand Down Expand Up @@ -270,7 +308,9 @@ pub(crate) fn releases_for_crate(
.into_iter()
.filter_map(|row| {
let version: String = row.get("version");
match semver::Version::parse(&version) {
match semver::Version::parse(&version).with_context(|| {
format!("invalid semver in database for crate {crate_id}: {version}")
}) {
Ok(semversion) => Some(Release {
id: row.get("id"),
version: semversion,
Expand All @@ -281,9 +321,7 @@ pub(crate) fn releases_for_crate(
target_name: row.get("target_name"),
}),
Err(err) => {
report_error(&anyhow!(err).context(format!(
"invalid semver in database for crate {crate_id}: {version}"
)));
report_error(&err);
None
}
}
Expand All @@ -310,9 +348,10 @@ pub(crate) struct CrateDetailHandlerParams {
version: Option<String>,
}

#[tracing::instrument]
#[tracing::instrument(skip(pool, storage))]
pub(crate) async fn crate_details_handler(
Path(params): Path<CrateDetailHandlerParams>,
Extension(storage): Extension<Arc<Storage>>,
Extension(pool): Extension<Pool>,
Extension(repository_stats_updater): Extension<Arc<RepositoryStatsUpdater>>,
) -> AxumResult<AxumResponse> {
Expand Down Expand Up @@ -352,16 +391,23 @@ pub(crate) async fn crate_details_handler(

let details = spawn_blocking(move || {
let mut conn = pool.get()?;
CrateDetails::new(
let mut details = CrateDetails::new(
&mut *conn,
&params.name,
&version,
&version_or_latest,
Some(&repository_stats_updater),
)
)?
.ok_or(AxumNope::VersionNotFound)?;

match details.fetch_readme(&storage) {
Ok(readme) => details.readme = readme.or(details.readme),
Err(e) => report_error(&e),
}

Ok(details)
})
.await?
.ok_or(AxumNope::VersionNotFound)?;
.await?;

let mut res = CrateDetailsPage { details }.into_response();
res.extensions_mut()
Expand Down Expand Up @@ -1111,4 +1157,49 @@ mod tests {
Ok(())
});
}

/// Checks which readme text the crate details page shows, depending on whether a readme
/// exists on the release record, in the uploaded source files, or both.
#[test]
fn readme() {
    wrapper(|env| {
        // 0.1.0: readme set on the release only, no readme file among the sources.
        env.fake_release()
            .name("dummy")
            .version("0.1.0")
            .readme_only_database("database readme")
            .create()?;

        // 0.2.0: both are present; the page is expected to show the one from the sources.
        env.fake_release()
            .name("dummy")
            .version("0.2.0")
            .readme_only_database("database readme")
            .source_file("README.md", b"storage readme")
            .create()?;

        // 0.3.0: readme file among the sources only.
        env.fake_release()
            .name("dummy")
            .version("0.3.0")
            .source_file("README.md", b"storage readme")
            .create()?;

        // 0.4.0: the manifest points `package.readme` at a non-default file name.
        env.fake_release()
            .name("dummy")
            .version("0.4.0")
            .readme_only_database("database readme")
            .source_file("MEREAD", b"storage meread")
            .source_file("Cargo.toml", br#"package.readme = "MEREAD""#)
            .create()?;

        let expectations = [
            ("/crate/dummy/0.1.0", "database readme"),
            ("/crate/dummy/0.2.0", "storage readme"),
            ("/crate/dummy/0.3.0", "storage readme"),
            ("/crate/dummy/0.4.0", "storage meread"),
        ];

        for (path, expected) in expectations {
            let resp = env.frontend().get(path).send().unwrap();
            let body = String::from_utf8(resp.bytes().unwrap().to_vec()).unwrap();
            // Name the failing case; the page body itself is too large to print usefully.
            assert!(
                body.contains(expected),
                "{path}: expected the rendered page to contain {expected:?}"
            );
        }

        Ok(())
    });
}
}
14 changes: 12 additions & 2 deletions src/web/source.rs
Original file line number Diff line number Diff line change
Expand Up @@ -619,6 +619,7 @@ mod tests {
env.fake_release()
.name("fake")
.version("0.1.0")
.source_file("Cargo.toml", b"")
.source_file("config.json", b"{}")
.create()?;

Expand All @@ -637,7 +638,10 @@ mod tests {
assert!(text.starts_with(r#"<!DOCTYPE html>"#));

// file list doesn't show "../"
assert_eq!(get_file_list_links(&text), vec!["./config.json"]);
assert_eq!(
get_file_list_links(&text),
vec!["./Cargo.toml", "./config.json"]
);

Ok(())
});
Expand All @@ -649,6 +653,7 @@ mod tests {
env.fake_release()
.name("fake")
.version("0.1.0")
.source_file("Cargo.toml", b"some_random_content")
.source_file("folder1/some_filename.rs", b"some_random_content")
.source_file("folder2/another_filename.rs", b"some_random_content")
.source_file("root_filename.rs", b"some_random_content")
Expand All @@ -665,7 +670,12 @@ mod tests {

assert_eq!(
get_file_list_links(&response.text()?),
vec!["./folder1/", "./folder2/", "./root_filename.rs"]
vec![
"./folder1/",
"./folder2/",
"./Cargo.toml",
"./root_filename.rs"
]
);
Ok(())
});
Expand Down