src/generate.rs
/*
* Copyright 2023 Trevor Bentley
*
* Author: Trevor Bentley
* Contact: gitsy@@trevorbentley.com
* Source: https://github.com/mrmekon/itsy-gitsy
*
* This file is part of Itsy-Gitsy.
*
* Itsy-Gitsy is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Itsy-Gitsy is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Itsy-Gitsy. If not, see <http://www.gnu.org/licenses/>.
*/
use crate::{
error,
git::{dir_listing, parse_repo, GitFile, GitObject, GitRepo, GitsyMetadata},
loud, louder, loudest, normal, normal_noln,
settings::{GitsyCli, GitsyRepoDescriptions, GitsySettings, GitsySettingsRepo},
template::{
DirFilter, FileFilter, HexFilter, MaskFilter, OctFilter, Pagination, TsDateFn, TsTimestampFn, UrlStringFilter,
},
util::{GitsyError, GitsyErrorKind, VERBOSITY},
};
use chrono::{DateTime, Local};
use git2::{Error, Repository};
use rayon::prelude::*;
use std::cmp;
use std::collections::BTreeMap;
use std::fs::File;
use std::io::Write;
use std::path::{Path, PathBuf};
use std::sync::atomic::{AtomicUsize, Ordering};
use std::time::Instant;
use tera::{Context, Tera};
#[cfg(feature = "markdown")]
use pulldown_cmark::{html, Options, Parser as MdParser};
#[cfg(any(feature = "highlight", feature = "highlight_fast"))]
use syntect::{
highlighting::ThemeSet,
html::{css_for_theme_with_class_style, ClassStyle, ClassedHTMLGenerator},
parsing::SyntaxSet,
util::LinesWithEndings,
};
macro_rules! size_check {
($settings:expr, $cur:expr, $total:expr, $action:expr) => {
let cur: usize = $cur;
if cur > $settings.limit_repo_size.unwrap_or(usize::MAX) {
$action;
}
let total: usize = $total;
if total.saturating_add($cur) > $settings.limit_total_size.unwrap_or(usize::MAX) {
$action;
}
};
}
macro_rules! size_check_atomic {
($settings:expr, $cur:expr, $total:expr, $action:expr) => {
let cur: usize = $cur.load(Ordering::SeqCst);
if cur > $settings.limit_repo_size.unwrap_or(usize::MAX) {
$action;
}
let total: usize = $total.load(Ordering::SeqCst);
if total.saturating_add(cur) > $settings.limit_total_size.unwrap_or(usize::MAX) {
$action;
}
};
}
pub struct GitsyGenerator {
cli: GitsyCli,
settings: GitsySettings,
repo_descriptions: GitsyRepoDescriptions,
tera: Option<Tera>,
total_bytes: AtomicUsize,
generated_dt: DateTime<Local>,
}
impl GitsyGenerator {
pub fn new(cli: GitsyCli, settings: GitsySettings, repo_descriptions: GitsyRepoDescriptions) -> GitsyGenerator {
GitsyGenerator {
cli,
settings,
repo_descriptions,
tera: None,
total_bytes: AtomicUsize::new(0),
generated_dt: chrono::offset::Local::now(),
}
}
fn new_context(&self, repo: Option<&GitRepo>) -> Result<Context, GitsyError> {
let mut ctx = match repo {
Some(repo) => Context::from_serialize(repo)?,
_ => Context::new(),
};
if let Some(extra) = &self.settings.extra {
ctx.try_insert("extra", extra)
.expect("Failed to add extra settings to template engine.");
}
if let Some(site_name) = &self.settings.site_name {
ctx.insert("site_name", site_name);
}
if let Some(site_url) = &self.settings.site_url {
let site_url = match site_url.chars().last() {
Some('/') => &site_url[0..site_url.len() - 1],
_ => site_url,
};
ctx.insert("site_url", site_url);
}
if let Some(site_description) = &self.settings.site_description {
ctx.insert("site_description", site_description);
}
ctx.insert("site_dir", &self.settings.outputs.output_dir());
if self.settings.outputs.global_assets.is_some() {
ctx.insert(
"site_assets",
&self
.settings
.outputs
.to_relative(&self.settings.outputs.global_assets::<GitFile>(None, None)),
);
}
ctx.insert("site_generated_ts", &self.generated_dt.timestamp());
ctx.insert("site_generated_offset", &self.generated_dt.offset().local_minus_utc());
Ok(ctx)
}
fn find_repo(&self, name: &str, repo_desc: &GitsySettingsRepo) -> Result<String, GitsyError> {
let repo_path = match &repo_desc.path {
url if url.starts_with("https://") || url.to_str().unwrap_or_default().contains("@") => {
if self.settings.outputs.cloned_repos.is_none() {
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some(&format!(
"ERROR: Found remote repo [{}], but `cloned_repos` directory not configured.",
name
)),
));
};
let clone_path: PathBuf = [self.settings.outputs.cloned_repos.as_deref().unwrap(), name]
.iter()
.collect();
match Repository::open(&clone_path) {
Ok(r) => {
match self.settings.fetch_remote {
Some(false) => {}
_ => { // explicitly true, or unspecified (default)
// Repo already cloned, so update all refs
let refs: Vec<String> = r
.references()
.expect(&format!("Unable to enumerate references for repo [{}]", name))
.map(|x| {
x.expect(&format!("Found invalid reference in repo [{}]", name))
.name()
.expect(&format!("Found unnamed reference in repo: [{}]", name))
.to_string()
})
.collect();
r.find_remote("origin")
.expect(&format!("Clone of repo [{}] missing `origin` remote.", name))
.fetch(&refs, None, None)
.expect(&format!("Failed to fetch updates from remote repo [{}]", name));
},
}
clone_path.to_string_lossy().to_string()
}
Err(_) => {
let mut builder = git2::build::RepoBuilder::new();
// TODO: git2-rs's ssh support just doesn't seem to
// work. It finds the repo, but fails to either
// decrypt or use the private key.
//
//if !url.starts_with("https://") {
// use secrecy::ExposeSecret;
// // this must be SSH, which needs credentials.
// let mut callbacks = git2::RemoteCallbacks::new();
// callbacks.credentials(|_url, username_from_url, _allowed_types| {
// //git2::Cred::ssh_key_from_agent(username_from_url.unwrap())
//
// let keyfile = format!("{}/.ssh/id_rsa", std::env::var("HOME").unwrap());
// let passphrase = pinentry::PassphraseInput::with_default_binary().unwrap()
// .with_description(&format!("Enter passphrase for SSH key {} (repo: {})",
// keyfile, url.display()))
// .with_prompt("Passphrase:")
// .interact().unwrap();
// git2::Cred::ssh_key(
// username_from_url.unwrap(),
// None,
// Path::new(&keyfile),
// Some(passphrase.expose_secret()),
// )
// });
// let mut options = git2::FetchOptions::new();
// options.remote_callbacks(callbacks);
// builder.fetch_options(options);
//}
builder
.bare(true)
.clone(&url.to_string_lossy().to_string(), &clone_path)
.expect(&format!("Failed to clone remote repo [{}]", name));
clone_path.to_string_lossy().to_string()
}
}
}
dir => {
match dir.metadata() {
Ok(m) if m.is_dir() => {}
_ => {
error!(
"ERROR: local repository [{}]: directory not found: {}",
name,
dir.display()
);
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some(&format!("ERROR: Local repository not found: {}", name)),
));
}
}
dir.to_string_lossy().to_string()
}
};
Ok(repo_path)
}
#[cfg(feature = "markdown")]
fn parse_markdown(contents: &str) -> String {
let mut options = Options::empty();
options.insert(Options::ENABLE_STRIKETHROUGH);
options.insert(Options::ENABLE_TABLES);
let parser = MdParser::new_ext(contents, options);
let mut html_output: String = String::with_capacity(contents.len() * 3 / 2);
html::push_html(&mut html_output, parser);
html_output
}
#[cfg(any(feature = "highlight", feature = "highlight_fast"))]
fn syntax_highlight(contents: &str, extension: &str) -> String {
let syntax_set = SyntaxSet::load_defaults_newlines();
let syntax = match syntax_set.find_syntax_by_extension(extension) {
Some(s) => s,
_ => {
return contents.to_string();
}
};
let mut html_generator = ClassedHTMLGenerator::new_with_class_style(syntax, &syntax_set, ClassStyle::Spaced);
for line in LinesWithEndings::from(contents) {
match html_generator.parse_html_for_line_which_includes_newline(line) {
Ok(_) => {}
Err(_) => {
error!("Warning: failed to apply syntax highlighting.");
return contents.to_string();
}
}
}
html_generator.finalize()
}
fn fill_file_contents(repo: &Repository, file: &GitFile, settings: &GitsySettingsRepo) -> Result<GitFile, Error> {
let mut file = file.clone();
if file.kind == "file" {
let blob = repo.find_blob(git2::Oid::from_str(&file.id)?)?;
file.contents = match blob.is_binary() {
false => {
let path = Path::new(&file.path);
let cstr = String::from_utf8_lossy(blob.content()).to_string();
let (content, rendered, pre) = match path.extension() {
#[cfg(feature = "markdown")]
Some(x) if settings.render_markdown.unwrap_or(false) && x == "md" => {
loudest!(" - rendering Markdown in {}", path.display());
let (cstr, rendered, pre) = (GitsyGenerator::parse_markdown(&cstr), true, false);
(cstr, rendered, pre)
}
#[cfg(any(feature = "highlight", feature = "highlight_fast"))]
Some(x) if settings.syntax_highlight.unwrap_or(false) => {
loudest!(" - syntax highlighting {}", path.display());
(
GitsyGenerator::syntax_highlight(&cstr, x.to_string_lossy().to_string().as_str()),
true,
true,
)
}
_ => (cstr, false, true),
};
file.contents_safe = rendered;
file.contents_preformatted = pre;
Some(content)
}
true => Some(format!("[Binary data ({} bytes)]", blob.content().len())),
};
}
Ok(file)
}
fn write_rendered<P: AsRef<Path>>(&self, path: &P, rendered: &str) -> usize {
let path: &Path = path.as_ref();
assert!(
self.settings.outputs.assert_valid(&path),
"ERROR: attempted to write invalid path: {}",
path.display()
);
// Write the file to disk
let mut file = File::create(path).expect(&format!("Unable to write to output path: {}", path.display()));
file.write(rendered.as_bytes())
.expect(&format!("Failed to save rendered html to path: {}", path.display()));
louder!(" - wrote file: {}", path.display());
rendered.as_bytes().len()
}
fn tera_init(&self) -> Result<Tera, GitsyError> {
let mut template_path = self.settings.outputs.template_dir();
template_path.push("**");
template_path.push("*.html");
let mut tera = Tera::new(&template_path.to_string_lossy().to_string())?;
tera.register_filter("only_files", FileFilter {});
tera.register_filter("only_dirs", DirFilter {});
tera.register_filter("hex", HexFilter {});
tera.register_filter("oct", OctFilter {});
tera.register_filter("mask", MaskFilter {});
tera.register_filter("url_string", UrlStringFilter {});
tera.register_function("ts_to_date", TsDateFn {});
tera.register_function("ts_to_git_timestamp", TsTimestampFn {});
Ok(tera)
}
pub fn gen_repo_list(&self, ctx: &Context) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut global_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.repo_list::<GitRepo>(None, None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
let rendered = tera.render(templ_path, &ctx)?;
global_bytes += self.write_rendered(&out_path, &rendered);
}
Ok(global_bytes)
}
pub fn gen_error(&self, ctx: &Context) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut global_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.error::<GitRepo>(None, None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
global_bytes += self.write_rendered(&out_path, &rendered);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
Ok(global_bytes)
}
pub fn gen_summary(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.summary::<GitRepo>(Some(parsed_repo), None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_history(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let repo_bytes = AtomicUsize::new(0);
for (templ_path, out_path) in self.settings.outputs.history::<GitRepo>(Some(parsed_repo), None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
let pages = parsed_repo.history.chunks(self.settings.paginate_history());
let page_count = pages.len();
parsed_repo
.history
.par_chunks(self.settings.paginate_history())
.enumerate()
.try_for_each(|(idx, page)| {
let mut paged_ctx = ctx.clone();
let pagination = Pagination::new(idx + 1, page_count, &out_path);
// make sure the 'commits' map contains the same
// commits as the current page.
let commits: BTreeMap<String, GitObject> = page
.iter()
.map(|entry| match parsed_repo.commits.get(&entry.full_hash) {
Some(com) => Some((entry.full_hash.clone(), com.clone())),
_ => None,
})
.map_while(|x| x)
.collect();
if repo_desc.limit_commit_ids_to_related == Some(true) {
let parent_ids: Vec<String> = commits.keys().cloned().collect();
paged_ctx.insert("commit_ids", &parent_ids);
}
paged_ctx.insert("page", &pagination.with_relative_paths());
paged_ctx.insert("history", &page);
paged_ctx.insert("commits", &commits);
let rendered = tera.render(templ_path, &paged_ctx)?;
let bytes = self.write_rendered(&pagination.cur_page, &rendered);
repo_bytes.fetch_add(bytes, Ordering::SeqCst);
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
paged_ctx.remove("page");
paged_ctx.remove("history");
paged_ctx.remove("commits");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
Ok::<(), GitsyError>(())
})?;
}
Ok(repo_bytes.load(Ordering::SeqCst))
}
pub fn gen_commit(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let mut ctx = ctx.clone();
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for (_id, commit) in &parsed_repo.commits {
ctx.try_insert("commit", &commit)
.expect("Failed to add commit to template engine.");
if repo_desc.limit_commit_ids_to_related == Some(true) {
let parent_ids: Vec<String> = commit
.parents
.iter()
.filter(|x| parsed_repo.commits.contains_key(*x))
.cloned()
.collect();
ctx.insert("commit_ids", &parent_ids);
}
for (templ_path, out_path) in self.settings.outputs.commit(Some(parsed_repo), Some(commit)) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
ctx.remove("commit");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_branches(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.branches::<GitRepo>(Some(parsed_repo), None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
let mut paged_ctx = ctx.clone();
paged_ctx.remove("branches");
let pages = parsed_repo.branches.chunks(self.settings.paginate_branches());
let page_count = pages.len();
for (idx, page) in pages.enumerate() {
let pagination = Pagination::new(idx + 1, page_count, &out_path);
paged_ctx.insert("page", &pagination.with_relative_paths());
paged_ctx.insert("branches", &page);
match tera.render(templ_path, &paged_ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&pagination.cur_page, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
paged_ctx.remove("page");
paged_ctx.remove("branches");
}
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_branch(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let mut ctx = ctx.clone();
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for branch in &parsed_repo.branches {
ctx.insert("branch", branch);
if repo_desc.limit_commit_ids_to_related == Some(true) {
let parent_ids: Vec<String> = [&branch.full_hash]
.iter()
.filter(|x| parsed_repo.commits.contains_key(**x))
.map(|x| (**x).clone())
.collect();
ctx.insert("commit_ids", &parent_ids);
}
for (templ_path, out_path) in self.settings.outputs.branch(Some(parsed_repo), Some(branch)) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
ctx.remove("branch");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_tags(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.tags::<GitRepo>(Some(parsed_repo), None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
let mut paged_ctx = ctx.clone();
paged_ctx.remove("tags");
let pages = parsed_repo.tags.chunks(self.settings.paginate_tags());
let page_count = pages.len();
for (idx, page) in pages.enumerate() {
let pagination = Pagination::new(idx + 1, page_count, &out_path);
paged_ctx.insert("page", &pagination.with_relative_paths());
paged_ctx.insert("tags", &page);
match tera.render(templ_path, &paged_ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&pagination.cur_page, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
paged_ctx.remove("page");
paged_ctx.remove("tags");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
}
Ok(repo_bytes)
}
pub fn gen_tag(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let mut ctx = ctx.clone();
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for tag in &parsed_repo.tags {
ctx.insert("tag", tag);
if repo_desc.limit_commit_ids_to_related == Some(true) {
let parent_ids: Vec<String> = [tag.tagged_id.as_deref()]
.iter()
.map_while(|x| *x)
.filter(|x| parsed_repo.commits.contains_key(*x))
.map(|x| x.to_string())
.collect();
ctx.insert("commit_ids", &parent_ids);
}
if let Some(tagged_id) = tag.tagged_id.as_ref() {
if let Some(commit) = parsed_repo.commits.get(tagged_id) {
ctx.insert("commit", &commit);
}
}
for (templ_path, out_path) in self.settings.outputs.tag(Some(parsed_repo), Some(tag)) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
ctx.remove("tag");
ctx.remove("commit");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_files(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
_repo: &Repository,
) -> Result<usize, GitsyError> {
let mut ctx = ctx.clone();
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for (templ_path, out_path) in self.settings.outputs.files::<GitRepo>(Some(parsed_repo), None) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
ctx.insert("root_files", &parsed_repo.root_files);
ctx.insert("all_files", &parsed_repo.all_files);
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
pub fn gen_file(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
repo: &Repository,
) -> Result<usize, GitsyError> {
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
#[cfg(any(feature = "highlight", feature = "highlight_fast"))]
if self.settings.outputs.has_files() {
let ts = ThemeSet::load_defaults();
let theme = ts
.themes
.get(
repo_desc
.syntax_highlight_theme
.as_deref()
.unwrap_or("base16-ocean.dark"),
)
.expect("Invalid syntax highlighting theme specified.");
let css: String = css_for_theme_with_class_style(theme, syntect::html::ClassStyle::Spaced)
.expect("Invalid syntax highlighting theme specified.");
let bytes = self.write_rendered(
&self.settings.outputs.syntax_css::<GitFile>(Some(&parsed_repo), None),
css.as_str(),
);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
let files: Vec<&GitFile> = parsed_repo.all_files.iter().filter(|x| x.kind == "file").collect();
let atomic_repo_bytes: AtomicUsize = AtomicUsize::new(repo_bytes);
let repo_path = repo
.path()
.to_str()
.expect("ERROR: unable to determine path to local repository");
let _ = files
.par_iter()
.fold(
|| Some(0),
|acc, file| {
// These two have to be recreated. Cloning the Tera context is expensive.
let repo = Repository::open(&repo_path).expect("Unable to find git repository.");
let mut ctx = ctx.clone();
let mut local_bytes = 0;
let cur_repo_bytes = atomic_repo_bytes.load(Ordering::SeqCst);
size_check!(
repo_desc,
cur_repo_bytes,
self.total_bytes.load(Ordering::SeqCst),
return None
);
let file = match file.size < repo_desc.limit_file_size.unwrap_or(usize::MAX) {
true => {
GitsyGenerator::fill_file_contents(&repo, &file, &repo_desc).expect("Failed to parse file.")
}
false => (*file).clone(),
};
ctx.try_insert("file", &file)
.expect("Failed to add file to template engine.");
for (templ_path, out_path) in self.settings.outputs.file(Some(parsed_repo), Some(&file)) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
local_bytes = self.write_rendered(&out_path, &rendered);
atomic_repo_bytes.fetch_add(local_bytes, Ordering::SeqCst);
atomic_bytes.fetch_add(local_bytes, Ordering::SeqCst);
// Copy readme files to their real filename, so links to readme files remain valid
// across file changes.
if let Some(readmes) = &repo_desc.readme_files {
for readme in readmes {
if &file.path == readme {
let mut pretty_path = PathBuf::from(out_path);
pretty_path.pop();
pretty_path.push(&file.path);
match std::fs::copy(&out_path, &pretty_path) {
Ok(_) => louder!(" - wrote readme file: {}", pretty_path.to_string_lossy()),
Err(e) => error!("ERROR: {:?}", e),
}
}
}
};
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
ctx.remove("file");
if atomic_repo_bytes.load(Ordering::SeqCst) >= repo_desc.limit_repo_size.unwrap_or(usize::MAX) {
return None;
}
Some(acc.unwrap() + local_bytes)
},
)
.while_some() // allow short-circuiting if size limit is reached
.sum::<usize>();
repo_bytes = atomic_repo_bytes.load(Ordering::SeqCst);
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
Ok(repo_bytes)
}
pub fn gen_dir(
&self,
ctx: &Context,
atomic_bytes: &AtomicUsize,
parsed_repo: &GitRepo,
repo_desc: &GitsySettingsRepo,
repo: &Repository,
) -> Result<usize, GitsyError> {
let mut ctx = ctx.clone();
let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
let mut repo_bytes = 0;
for dir in parsed_repo.all_files.iter().filter(|x| x.kind == "dir") {
let listing = dir_listing(&repo, &dir).expect("Failed to parse file.");
ctx.insert("dir", dir);
ctx.try_insert("files", &listing)
.expect("Failed to add dir to template engine.");
for (templ_path, out_path) in self.settings.outputs.dir(Some(parsed_repo), Some(dir)) {
let templ_path = templ_path.to_str().expect(&format!(
"ERROR: a summary template path is invalid: {}",
templ_path.display()
));
let out_path = out_path.to_str().expect(&format!(
"ERROR: a summary output path is invalid: {}",
out_path.display()
));
match tera.render(templ_path, &ctx) {
Ok(rendered) => {
let bytes = self.write_rendered(&out_path, &rendered);
repo_bytes += bytes;
atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
}
Err(x) => match x.kind {
_ => error!("ERROR: {:?}", x),
},
}
}
ctx.remove("files");
ctx.remove("dir");
size_check_atomic!(
repo_desc,
atomic_bytes,
self.total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
}
Ok(repo_bytes)
}
fn copy_assets(
&self,
repo_desc: Option<&GitsySettingsRepo>,
parsed_repo: Option<&GitRepo>,
repo: Option<&Repository>,
) -> Result<usize, GitsyError> {
let mut bytes = 0;
match repo_desc {
Some(repo_desc) => {
let parsed_repo = parsed_repo.expect("ERROR: attempted to fill repo assets without a repository");
let repo = repo.expect("ERROR: attempted to fill repo assets without a repository");
if repo_desc.asset_files.is_some() {
let target_dir = self.settings.outputs.repo_assets::<GitFile>(Some(&parsed_repo), None);
for src_file in repo_desc.asset_files.as_ref().unwrap() {
// Read the asset file contents from the git repo
let src_file = PathBuf::from(src_file);
let src_contents = self.settings.outputs
.asset_contents(&src_file, Some(parsed_repo), Some(repo))?;
// Determine the output path
let mut dst_file = PathBuf::from(&target_dir);
let basename = src_file.file_name()
.ok_or(GitsyError::kind(
GitsyErrorKind::Settings,
Some(&format!(
"ERROR: repo asset file missing filename: {}",
src_file.display()
))))?;
dst_file.push(basename);
// Open destination file for writing
let mut file = File::create(&dst_file)
.map_err(|e| GitsyError::sourced_kind(
GitsyErrorKind::Settings,
Some(&format!(
"ERROR: unable to open repo asset file for writing: {}",
dst_file.display()
)),
e))?;
// Write to disk
file.write(&src_contents)
.map_err(|e| GitsyError::sourced_kind(
GitsyErrorKind::Settings,
Some(&format!(
"ERROR: unable to write repo asset file: {}",
dst_file.display()
)),
e))?;
if let Ok(meta) = std::fs::metadata(dst_file) {
bytes += meta.len() as usize;
}
loud!(" - copied repo asset: {}", src_file.display());
}
}
}
_ => {
if self.settings.asset_files.is_some() {
let target_dir = self.settings.outputs.global_assets::<GitFile>(None, None);
for src_file in self.settings.asset_files.as_ref().unwrap() {
let src_file = self.settings.outputs.asset_path(src_file, None, None);
let mut dst_file = PathBuf::from(&target_dir);
dst_file.push(
src_file
.file_name()
.expect(&format!("Failed to copy asset file: {}", src_file.display())),
);
std::fs::copy(&src_file, &dst_file)
.expect(&format!("Failed to copy asset file: {}", src_file.display()));
if let Ok(meta) = std::fs::metadata(dst_file) {
bytes += meta.len() as usize;
}
loud!(" - copied global asset: {}", src_file.display());
}
}
}
}
Ok(bytes)
}
pub fn generate_repo(
&self,
repo_desc: &GitsySettingsRepo,
pad_name_len: usize,
) -> Result<(GitRepo, usize), GitsyError> {
loudest!("Repo settings:\n{:#?}", &repo_desc);
let start_repo = Instant::now();
let name = repo_desc.name.as_deref().expect("A configured repository has no name!");
if self.settings.threads.unwrap_or(0) == 1 || VERBOSITY.load(Ordering::SeqCst) > 1 {
normal_noln!("[{}{}]... ", name, " ".repeat(pad_name_len - name.len()));
}
let repo_path = self.find_repo(&name, &repo_desc)?;
let repo = Repository::open(&repo_path).expect("Unable to find git repository.");
let metadata = GitsyMetadata {
full_name: repo_desc.name.clone(),
description: repo_desc.description.clone(),
website: repo_desc.website.clone(),
clone: repo_desc.clone_url.clone(),
attributes: repo_desc.attributes.clone().unwrap_or_default(),
};
let parsed_repo = parse_repo(&repo, &name, &repo_desc, metadata).expect("Failed to analyze repo HEAD.");
let minimized_repo = parsed_repo.minimal_clone(self.settings.limit_context.unwrap_or(usize::MAX));
let atomic_bytes = AtomicUsize::new(0);
let mut local_ctx = self.new_context(Some(&minimized_repo))?;
// Add README file to context, if specified and found
if let Some(readmes) = &repo_desc.readme_files {
for readme in readmes {
if let Some(file) = parsed_repo.root_files.iter().filter(|x| &x.name == readme).next() {
louder!(" - found readme file: {}", file.name);
let _ =
GitsyGenerator::fill_file_contents(&repo, &file, &repo_desc).expect("Failed to parse file.");
local_ctx.insert("readme", &file);
break;
}
}
};
let fns = &[
GitsyGenerator::gen_summary,
GitsyGenerator::gen_branches,
GitsyGenerator::gen_branch,
GitsyGenerator::gen_tags,
GitsyGenerator::gen_tag,
GitsyGenerator::gen_history,
GitsyGenerator::gen_commit,
GitsyGenerator::gen_file,
GitsyGenerator::gen_dir,
GitsyGenerator::gen_files,
];
let repo_bytes: usize = fns
.par_iter()
.try_fold(
|| 0,
|acc, x| {
let repo = Repository::open(&repo_path).expect("Unable to find git repository.");
let bytes = x(&self, &local_ctx, &atomic_bytes, &parsed_repo, repo_desc, &repo)?;
// remove these bytes from the current repo bytes and move them to the total bytes.
atomic_bytes.fetch_sub(bytes, Ordering::SeqCst);
self.total_bytes.fetch_add(bytes, Ordering::SeqCst);
Ok::<usize, GitsyError>(acc + bytes)
},
)
.try_reduce(|| 0, |acc, x| Ok(acc + x))?;
size_check!(
repo_desc,
0,
self.total_bytes.load(Ordering::SeqCst),
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: size limit exceeded")
))
);
self.copy_assets(Some(&repo_desc), Some(&parsed_repo), Some(&repo))?;
normal!(
"{}{}done in {:.2}s ({} bytes)",
match self.settings.threads.unwrap_or(0) == 1 && VERBOSITY.load(Ordering::SeqCst) <= 1 {
true => "".into(),
false => format!("[{}{}]... ", name, " ".repeat(pad_name_len - name.len())),
},
match VERBOSITY.load(Ordering::SeqCst) > 1 {
true => " - ",
_ => "",
},
start_repo.elapsed().as_secs_f32(),
repo_bytes
);
Ok((minimized_repo, repo_bytes))
}
pub fn generate(&mut self) -> Result<(), GitsyError> {
let start_all = Instant::now();
self.tera = Some(self.tera_init()?);
self.generated_dt = chrono::offset::Local::now();
if self.cli.should_clean {
self.settings.outputs.clean();
}
if self.repo_descriptions.len() == 0 {
panic!(
"No Git repositories defined! Please check your configuration file ({})",
self.cli.path.display()
);
}
self.settings.outputs.create();
// Sort the repositories by name
let mut repo_vec: Vec<GitsySettingsRepo> = self.repo_descriptions.iter().cloned().collect();
repo_vec.sort_by(|x, y| {
x.name
.as_deref()
.map(|n| n.cmp(&y.name.as_deref().unwrap_or_default()))
.unwrap_or(cmp::Ordering::Equal)
});
// Find the one with the longest name, for pretty printing
let global_name = "repo list";
let longest_repo_name = repo_vec
.iter()
.fold(0, |acc, x| {
cmp::max(acc, x.name.as_deref().map(|n| n.len()).unwrap_or(0))
})
.max(global_name.len());
loudest!("Global settings:\n{:#?}", &self.settings);
let shared_repos = std::sync::Mutex::new(Vec::<GitRepo>::new());
// Iterate over each repository, generating outputs
let mut total_bytes = match self.settings.threads.unwrap_or(0) {
n if n == 1 => {
let mut tb = 0;
for repo_desc in &repo_vec {
let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
size_check!(
repo_desc,
0,
tb,
return Err(GitsyError::kind(
GitsyErrorKind::Settings,
Some("ERROR: site size limit exceeded")
))
);
shared_repos.lock().unwrap().push(minimized_repo);
tb += repo_bytes;
}
tb
}
n if n == 0 => {
let total_bytes: usize = repo_vec
.par_iter()
.try_fold(
|| 0,
|acc, repo_desc| {
let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
size_check!(
repo_desc,
0,
acc + repo_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Unknown,
Some("ERROR: site size limit exceeded")
))
);
shared_repos.lock().unwrap().push(minimized_repo);
Ok::<usize, GitsyError>(repo_bytes)
},
)
.try_reduce(|| 0, |acc, x| Ok(acc + x))?;
total_bytes
}
n => {
let pool = rayon::ThreadPoolBuilder::new().num_threads(n).build().unwrap();
let total_bytes = pool.install(|| {
let total_bytes: usize = repo_vec
.par_iter()
.try_fold(
|| 0,
|acc, repo_desc| {
let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
size_check!(
repo_desc,
0,
acc + repo_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Unknown,
Some("ERROR: site size limit exceeded")
))
);
shared_repos.lock().unwrap().push(minimized_repo);
Ok::<usize, GitsyError>(repo_bytes)
},
)
.try_reduce(|| 0, |acc, x| Ok(acc + x))?;
Ok::<usize, GitsyError>(total_bytes)
})?;
total_bytes
}
};
size_check!(
self.settings,
0,
total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Unknown,
Some("ERROR: site size limit exceeded")
))
);
let repos = shared_repos;
let start_global = Instant::now();
normal_noln!(
"[{}{}]... ",
global_name,
" ".repeat(longest_repo_name - global_name.len())
);
let mut global_ctx = self.new_context(None)?;
global_ctx.try_insert("repos", &repos)?;
let mut global_bytes = 0;
global_bytes += self.gen_repo_list(&global_ctx)?;
global_bytes += self.gen_error(&global_ctx)?;
self.copy_assets(None, None, None)?;
total_bytes += global_bytes;
size_check!(
self.settings,
0,
total_bytes,
return Err(GitsyError::kind(
GitsyErrorKind::Unknown,
Some("ERROR: site size limit exceeded")
))
);
normal!(
"done in {:.2}s ({} bytes)",
start_global.elapsed().as_secs_f32(),
global_bytes
);
loud!(
"Wrote {} bytes in {:.2}s",
total_bytes,
start_all.elapsed().as_secs_f32()
);
if self.cli.should_open {
if let Some((_templ, out)) = self.settings.outputs.repo_list::<GitFile>(None, None).first() {
let _ = open::that(&format!("file://{}", out.display()));
}
}
Ok(())
}
}