summary history branches tags files
src/generate.rs
/*
 * Copyright 2023 Trevor Bentley
 *
 * Author: Trevor Bentley
 * Contact: gitsy@@trevorbentley.com
 * Source: https://github.com/mrmekon/itsy-gitsy
 *
 * This file is part of Itsy-Gitsy.
 *
 * Itsy-Gitsy is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * Itsy-Gitsy is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with Itsy-Gitsy.  If not, see <http://www.gnu.org/licenses/>.
 */
use crate::{
    error,
    git::{dir_listing, parse_repo, GitFile, GitObject, GitRepo, GitsyMetadata},
    loud, louder, loudest, normal, normal_noln,
    settings::{GitsyCli, GitsyRepoDescriptions, GitsySettings, GitsySettingsRepo},
    template::{
        DirFilter, FileFilter, HexFilter, MaskFilter, OctFilter, Pagination, TsDateFn, TsTimestampFn, UrlStringFilter,
    },
    util::{GitsyError, GitsyErrorKind, VERBOSITY},
};
use chrono::{DateTime, Local};
use git2::{Error, Repository};
use rayon::prelude::*;
use std::cmp;
use std::collections::BTreeMap;
use std::fs::File;
use std::io::Write;
use std::path::{Path, PathBuf};
use std::sync::atomic::{AtomicUsize, Ordering};
use std::time::Instant;
use tera::{Context, Tera};

#[cfg(feature = "markdown")]
use pulldown_cmark::{html, Options, Parser as MdParser};

#[cfg(any(feature = "highlight", feature = "highlight_fast"))]
use syntect::{
    highlighting::ThemeSet,
    html::{css_for_theme_with_class_style, ClassStyle, ClassedHTMLGenerator},
    parsing::SyntaxSet,
    util::LinesWithEndings,
};

macro_rules! size_check {
    ($settings:expr, $cur:expr, $total:expr, $action:expr) => {
        let cur: usize = $cur;
        if cur > $settings.limit_repo_size.unwrap_or(usize::MAX) {
            $action;
        }
        let total: usize = $total;
        if total.saturating_add($cur) > $settings.limit_total_size.unwrap_or(usize::MAX) {
            $action;
        }
    };
}

macro_rules! size_check_atomic {
    ($settings:expr, $cur:expr, $total:expr, $action:expr) => {
        let cur: usize = $cur.load(Ordering::SeqCst);
        if cur > $settings.limit_repo_size.unwrap_or(usize::MAX) {
            $action;
        }
        let total: usize = $total.load(Ordering::SeqCst);
        if total.saturating_add(cur) > $settings.limit_total_size.unwrap_or(usize::MAX) {
            $action;
        }
    };
}

pub struct GitsyGenerator {
    cli: GitsyCli,
    settings: GitsySettings,
    repo_descriptions: GitsyRepoDescriptions,
    tera: Option<Tera>,
    total_bytes: AtomicUsize,
    generated_dt: DateTime<Local>,
}

impl GitsyGenerator {
    pub fn new(cli: GitsyCli, settings: GitsySettings, repo_descriptions: GitsyRepoDescriptions) -> GitsyGenerator {
        GitsyGenerator {
            cli,
            settings,
            repo_descriptions,
            tera: None,
            total_bytes: AtomicUsize::new(0),
            generated_dt: chrono::offset::Local::now(),
        }
    }
    fn new_context(&self, repo: Option<&GitRepo>) -> Result<Context, GitsyError> {
        let mut ctx = match repo {
            Some(repo) => Context::from_serialize(repo)?,
            _ => Context::new(),
        };
        if let Some(extra) = &self.settings.extra {
            ctx.try_insert("extra", extra)
                .expect("Failed to add extra settings to template engine.");
        }
        if let Some(site_name) = &self.settings.site_name {
            ctx.insert("site_name", site_name);
        }
        if let Some(site_url) = &self.settings.site_url {
            let site_url = match site_url.chars().last() {
                Some('/') => &site_url[0..site_url.len() - 1],
                _ => site_url,
            };
            ctx.insert("site_url", site_url);
        }
        if let Some(site_description) = &self.settings.site_description {
            ctx.insert("site_description", site_description);
        }
        ctx.insert("site_dir", &self.settings.outputs.output_dir());
        if self.settings.outputs.global_assets.is_some() {
            ctx.insert(
                "site_assets",
                &self
                    .settings
                    .outputs
                    .to_relative(&self.settings.outputs.global_assets::<GitFile>(None, None)),
            );
        }
        ctx.insert("site_generated_ts", &self.generated_dt.timestamp());
        ctx.insert("site_generated_offset", &self.generated_dt.offset().local_minus_utc());
        Ok(ctx)
    }

    fn find_repo(&self, name: &str, repo_desc: &GitsySettingsRepo) -> Result<String, GitsyError> {
        let repo_path = match &repo_desc.path {
            url if url.starts_with("https://") || url.to_str().unwrap_or_default().contains("@") => {
                if self.settings.outputs.cloned_repos.is_none() {
                    return Err(GitsyError::kind(
                        GitsyErrorKind::Settings,
                        Some(&format!(
                            "ERROR: Found remote repo [{}], but `cloned_repos` directory not configured.",
                            name
                        )),
                    ));
                };
                let clone_path: PathBuf = [self.settings.outputs.cloned_repos.as_deref().unwrap(), name]
                    .iter()
                    .collect();
                match Repository::open(&clone_path) {
                    Ok(r) => {
                        match self.settings.fetch_remote {
                            Some(false) => {}
                            _ => { // explicitly true, or unspecified (default)
                                // Repo already cloned, so update all refs
                                let refs: Vec<String> = r
                                    .references()
                                    .expect(&format!("Unable to enumerate references for repo [{}]", name))
                                    .map(|x| {
                                        x.expect(&format!("Found invalid reference in repo [{}]", name))
                                            .name()
                                            .expect(&format!("Found unnamed reference in repo: [{}]", name))
                                            .to_string()
                                    })
                                    .collect();
                                r.find_remote("origin")
                                    .expect(&format!("Clone of repo [{}] missing `origin` remote.", name))
                                    .fetch(&refs, None, None)
                                    .expect(&format!("Failed to fetch updates from remote repo [{}]", name));
                            },
                        }
                        clone_path.to_string_lossy().to_string()
                    }
                    Err(_) => {
                        let mut builder = git2::build::RepoBuilder::new();

                        // TODO: git2-rs's ssh support just doesn't seem to
                        // work.  It finds the repo, but fails to either
                        // decrypt or use the private key.
                        //
                        //if !url.starts_with("https://") {
                        //    use secrecy::ExposeSecret;
                        //    // this must be SSH, which needs credentials.
                        //    let mut callbacks = git2::RemoteCallbacks::new();
                        //    callbacks.credentials(|_url, username_from_url, _allowed_types| {
                        //        //git2::Cred::ssh_key_from_agent(username_from_url.unwrap())
                        //
                        //        let keyfile = format!("{}/.ssh/id_rsa", std::env::var("HOME").unwrap());
                        //        let passphrase = pinentry::PassphraseInput::with_default_binary().unwrap()
                        //            .with_description(&format!("Enter passphrase for SSH key {} (repo: {})",
                        //                                       keyfile, url.display()))
                        //            .with_prompt("Passphrase:")
                        //            .interact().unwrap();
                        //        git2::Cred::ssh_key(
                        //            username_from_url.unwrap(),
                        //            None,
                        //            Path::new(&keyfile),
                        //            Some(passphrase.expose_secret()),
                        //        )
                        //    });
                        //    let mut options = git2::FetchOptions::new();
                        //    options.remote_callbacks(callbacks);
                        //    builder.fetch_options(options);
                        //}
                        builder
                            .bare(true)
                            .clone(&url.to_string_lossy().to_string(), &clone_path)
                            .expect(&format!("Failed to clone remote repo [{}]", name));
                        clone_path.to_string_lossy().to_string()
                    }
                }
            }
            dir => {
                match dir.metadata() {
                    Ok(m) if m.is_dir() => {}
                    _ => {
                        error!(
                            "ERROR: local repository [{}]: directory not found: {}",
                            name,
                            dir.display()
                        );
                        return Err(GitsyError::kind(
                            GitsyErrorKind::Settings,
                            Some(&format!("ERROR: Local repository not found: {}", name)),
                        ));
                    }
                }
                dir.to_string_lossy().to_string()
            }
        };
        Ok(repo_path)
    }

    #[cfg(feature = "markdown")]
    fn parse_markdown(contents: &str) -> String {
        let mut options = Options::empty();
        options.insert(Options::ENABLE_STRIKETHROUGH);
        options.insert(Options::ENABLE_TABLES);
        let parser = MdParser::new_ext(contents, options);
        let mut html_output: String = String::with_capacity(contents.len() * 3 / 2);
        html::push_html(&mut html_output, parser);
        html_output
    }

    #[cfg(any(feature = "highlight", feature = "highlight_fast"))]
    fn syntax_highlight(contents: &str, extension: &str) -> String {
        let syntax_set = SyntaxSet::load_defaults_newlines();
        let syntax = match syntax_set.find_syntax_by_extension(extension) {
            Some(s) => s,
            _ => {
                return contents.to_string();
            }
        };
        let mut html_generator = ClassedHTMLGenerator::new_with_class_style(syntax, &syntax_set, ClassStyle::Spaced);
        for line in LinesWithEndings::from(contents) {
            match html_generator.parse_html_for_line_which_includes_newline(line) {
                Ok(_) => {}
                Err(_) => {
                    error!("Warning: failed to apply syntax highlighting.");
                    return contents.to_string();
                }
            }
        }
        html_generator.finalize()
    }

    fn fill_file_contents(repo: &Repository, file: &GitFile, settings: &GitsySettingsRepo) -> Result<GitFile, Error> {
        let mut file = file.clone();
        if file.kind == "file" {
            let blob = repo.find_blob(git2::Oid::from_str(&file.id)?)?;
            file.contents = match blob.is_binary() {
                false => {
                    let path = Path::new(&file.path);
                    let cstr = String::from_utf8_lossy(blob.content()).to_string();
                    let (content, rendered, pre) = match path.extension() {
                        #[cfg(feature = "markdown")]
                        Some(x) if settings.render_markdown.unwrap_or(false) && x == "md" => {
                            loudest!(" - rendering Markdown in {}", path.display());
                            let (cstr, rendered, pre) = (GitsyGenerator::parse_markdown(&cstr), true, false);
                            (cstr, rendered, pre)
                        }
                        #[cfg(any(feature = "highlight", feature = "highlight_fast"))]
                        Some(x) if settings.syntax_highlight.unwrap_or(false) => {
                            loudest!(" - syntax highlighting {}", path.display());
                            (
                                GitsyGenerator::syntax_highlight(&cstr, x.to_string_lossy().to_string().as_str()),
                                true,
                                true,
                            )
                        }
                        _ => (cstr, false, true),
                    };
                    file.contents_safe = rendered;
                    file.contents_preformatted = pre;
                    Some(content)
                }
                true => Some(format!("[Binary data ({} bytes)]", blob.content().len())),
            };
        }
        Ok(file)
    }

    fn write_rendered<P: AsRef<Path>>(&self, path: &P, rendered: &str) -> usize {
        let path: &Path = path.as_ref();
        assert!(
            self.settings.outputs.assert_valid(&path),
            "ERROR: attempted to write invalid path: {}",
            path.display()
        );
        // Write the file to disk
        let mut file = File::create(path).expect(&format!("Unable to write to output path: {}", path.display()));
        file.write(rendered.as_bytes())
            .expect(&format!("Failed to save rendered html to path: {}", path.display()));
        louder!(" - wrote file: {}", path.display());
        rendered.as_bytes().len()
    }

    fn tera_init(&self) -> Result<Tera, GitsyError> {
        let mut template_path = self.settings.outputs.template_dir();
        template_path.push("**");
        template_path.push("*.html");
        let mut tera = Tera::new(&template_path.to_string_lossy().to_string())?;
        tera.register_filter("only_files", FileFilter {});
        tera.register_filter("only_dirs", DirFilter {});
        tera.register_filter("hex", HexFilter {});
        tera.register_filter("oct", OctFilter {});
        tera.register_filter("mask", MaskFilter {});
        tera.register_filter("url_string", UrlStringFilter {});
        tera.register_function("ts_to_date", TsDateFn {});
        tera.register_function("ts_to_git_timestamp", TsTimestampFn {});
        Ok(tera)
    }

    pub fn gen_repo_list(&self, ctx: &Context) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut global_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.repo_list::<GitRepo>(None, None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            let rendered = tera.render(templ_path, &ctx)?;
            global_bytes += self.write_rendered(&out_path, &rendered);
        }
        Ok(global_bytes)
    }

    pub fn gen_error(&self, ctx: &Context) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut global_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.error::<GitRepo>(None, None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            match tera.render(templ_path, &ctx) {
                Ok(rendered) => {
                    global_bytes += self.write_rendered(&out_path, &rendered);
                }
                Err(x) => match x.kind {
                    _ => error!("ERROR: {:?}", x),
                },
            }
        }
        Ok(global_bytes)
    }

    pub fn gen_summary(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.summary::<GitRepo>(Some(parsed_repo), None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            match tera.render(templ_path, &ctx) {
                Ok(rendered) => {
                    let bytes = self.write_rendered(&out_path, &rendered);
                    repo_bytes += bytes;
                    atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                }
                Err(x) => match x.kind {
                    _ => error!("ERROR: {:?}", x),
                },
            }
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_history(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let repo_bytes = AtomicUsize::new(0);
        for (templ_path, out_path) in self.settings.outputs.history::<GitRepo>(Some(parsed_repo), None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            let pages = parsed_repo.history.chunks(self.settings.paginate_history());
            let page_count = pages.len();
            parsed_repo
                .history
                .par_chunks(self.settings.paginate_history())
                .enumerate()
                .try_for_each(|(idx, page)| {
                    let mut paged_ctx = ctx.clone();
                    let pagination = Pagination::new(idx + 1, page_count, &out_path);
                    // make sure the 'commits' map contains the same
                    // commits as the current page.
                    let commits: BTreeMap<String, GitObject> = page
                        .iter()
                        .map(|entry| match parsed_repo.commits.get(&entry.full_hash) {
                            Some(com) => Some((entry.full_hash.clone(), com.clone())),
                            _ => None,
                        })
                        .map_while(|x| x)
                        .collect();
                    if repo_desc.limit_commit_ids_to_related == Some(true) {
                        let parent_ids: Vec<String> = commits.keys().cloned().collect();
                        paged_ctx.insert("commit_ids", &parent_ids);
                    }
                    paged_ctx.insert("page", &pagination.with_relative_paths());
                    paged_ctx.insert("history", &page);
                    paged_ctx.insert("commits", &commits);
                    let rendered = tera.render(templ_path, &paged_ctx)?;
                    let bytes = self.write_rendered(&pagination.cur_page, &rendered);
                    repo_bytes.fetch_add(bytes, Ordering::SeqCst);
                    atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    paged_ctx.remove("page");
                    paged_ctx.remove("history");
                    paged_ctx.remove("commits");
                    size_check_atomic!(
                        repo_desc,
                        atomic_bytes,
                        self.total_bytes,
                        return Err(GitsyError::kind(
                            GitsyErrorKind::Settings,
                            Some("ERROR: size limit exceeded")
                        ))
                    );
                    Ok::<(), GitsyError>(())
                })?;
        }
        Ok(repo_bytes.load(Ordering::SeqCst))
    }

    pub fn gen_commit(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let mut ctx = ctx.clone();
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for (_id, commit) in &parsed_repo.commits {
            ctx.try_insert("commit", &commit)
                .expect("Failed to add commit to template engine.");
            if repo_desc.limit_commit_ids_to_related == Some(true) {
                let parent_ids: Vec<String> = commit
                    .parents
                    .iter()
                    .filter(|x| parsed_repo.commits.contains_key(*x))
                    .cloned()
                    .collect();
                ctx.insert("commit_ids", &parent_ids);
            }
            for (templ_path, out_path) in self.settings.outputs.commit(Some(parsed_repo), Some(commit)) {
                let templ_path = templ_path.to_str().expect(&format!(
                    "ERROR: a summary template path is invalid: {}",
                    templ_path.display()
                ));
                let out_path = out_path.to_str().expect(&format!(
                    "ERROR: a summary output path is invalid: {}",
                    out_path.display()
                ));
                match tera.render(templ_path, &ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&out_path, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
            }
            ctx.remove("commit");
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_branches(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.branches::<GitRepo>(Some(parsed_repo), None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            let mut paged_ctx = ctx.clone();
            paged_ctx.remove("branches");
            let pages = parsed_repo.branches.chunks(self.settings.paginate_branches());
            let page_count = pages.len();
            for (idx, page) in pages.enumerate() {
                let pagination = Pagination::new(idx + 1, page_count, &out_path);
                paged_ctx.insert("page", &pagination.with_relative_paths());
                paged_ctx.insert("branches", &page);
                match tera.render(templ_path, &paged_ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&pagination.cur_page, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
                paged_ctx.remove("page");
                paged_ctx.remove("branches");
            }
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_branch(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let mut ctx = ctx.clone();
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for branch in &parsed_repo.branches {
            ctx.insert("branch", branch);
            if repo_desc.limit_commit_ids_to_related == Some(true) {
                let parent_ids: Vec<String> = [&branch.full_hash]
                    .iter()
                    .filter(|x| parsed_repo.commits.contains_key(**x))
                    .map(|x| (**x).clone())
                    .collect();
                ctx.insert("commit_ids", &parent_ids);
            }
            for (templ_path, out_path) in self.settings.outputs.branch(Some(parsed_repo), Some(branch)) {
                let templ_path = templ_path.to_str().expect(&format!(
                    "ERROR: a summary template path is invalid: {}",
                    templ_path.display()
                ));
                let out_path = out_path.to_str().expect(&format!(
                    "ERROR: a summary output path is invalid: {}",
                    out_path.display()
                ));
                match tera.render(templ_path, &ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&out_path, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
            }
            ctx.remove("branch");
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_tags(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.tags::<GitRepo>(Some(parsed_repo), None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            let mut paged_ctx = ctx.clone();
            paged_ctx.remove("tags");
            let pages = parsed_repo.tags.chunks(self.settings.paginate_tags());
            let page_count = pages.len();
            for (idx, page) in pages.enumerate() {
                let pagination = Pagination::new(idx + 1, page_count, &out_path);
                paged_ctx.insert("page", &pagination.with_relative_paths());
                paged_ctx.insert("tags", &page);
                match tera.render(templ_path, &paged_ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&pagination.cur_page, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
                paged_ctx.remove("page");
                paged_ctx.remove("tags");
                size_check_atomic!(
                    repo_desc,
                    atomic_bytes,
                    self.total_bytes,
                    return Err(GitsyError::kind(
                        GitsyErrorKind::Settings,
                        Some("ERROR: size limit exceeded")
                    ))
                );
            }
        }
        Ok(repo_bytes)
    }

    pub fn gen_tag(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let mut ctx = ctx.clone();
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for tag in &parsed_repo.tags {
            ctx.insert("tag", tag);
            if repo_desc.limit_commit_ids_to_related == Some(true) {
                let parent_ids: Vec<String> = [tag.tagged_id.as_deref()]
                    .iter()
                    .map_while(|x| *x)
                    .filter(|x| parsed_repo.commits.contains_key(*x))
                    .map(|x| x.to_string())
                    .collect();
                ctx.insert("commit_ids", &parent_ids);
            }
            if let Some(tagged_id) = tag.tagged_id.as_ref() {
                if let Some(commit) = parsed_repo.commits.get(tagged_id) {
                    ctx.insert("commit", &commit);
                }
            }
            for (templ_path, out_path) in self.settings.outputs.tag(Some(parsed_repo), Some(tag)) {
                let templ_path = templ_path.to_str().expect(&format!(
                    "ERROR: a summary template path is invalid: {}",
                    templ_path.display()
                ));
                let out_path = out_path.to_str().expect(&format!(
                    "ERROR: a summary output path is invalid: {}",
                    out_path.display()
                ));
                match tera.render(templ_path, &ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&out_path, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
            }
            ctx.remove("tag");
            ctx.remove("commit");
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_files(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        _repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let mut ctx = ctx.clone();
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for (templ_path, out_path) in self.settings.outputs.files::<GitRepo>(Some(parsed_repo), None) {
            let templ_path = templ_path.to_str().expect(&format!(
                "ERROR: a summary template path is invalid: {}",
                templ_path.display()
            ));
            let out_path = out_path.to_str().expect(&format!(
                "ERROR: a summary output path is invalid: {}",
                out_path.display()
            ));
            ctx.insert("root_files", &parsed_repo.root_files);
            ctx.insert("all_files", &parsed_repo.all_files);
            match tera.render(templ_path, &ctx) {
                Ok(rendered) => {
                    let bytes = self.write_rendered(&out_path, &rendered);
                    repo_bytes += bytes;
                    atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                }
                Err(x) => match x.kind {
                    _ => error!("ERROR: {:?}", x),
                },
            }
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    pub fn gen_file(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;

        #[cfg(any(feature = "highlight", feature = "highlight_fast"))]
        if self.settings.outputs.has_files() {
            let ts = ThemeSet::load_defaults();
            let theme = ts
                .themes
                .get(
                    repo_desc
                        .syntax_highlight_theme
                        .as_deref()
                        .unwrap_or("base16-ocean.dark"),
                )
                .expect("Invalid syntax highlighting theme specified.");
            let css: String = css_for_theme_with_class_style(theme, syntect::html::ClassStyle::Spaced)
                .expect("Invalid syntax highlighting theme specified.");
            let bytes = self.write_rendered(
                &self.settings.outputs.syntax_css::<GitFile>(Some(&parsed_repo), None),
                css.as_str(),
            );
            repo_bytes += bytes;
            atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
        }

        let files: Vec<&GitFile> = parsed_repo.all_files.iter().filter(|x| x.kind == "file").collect();
        let atomic_repo_bytes: AtomicUsize = AtomicUsize::new(repo_bytes);
        let repo_path = repo
            .path()
            .to_str()
            .expect("ERROR: unable to determine path to local repository");
        let _ = files
            .par_iter()
            .fold(
                || Some(0),
                |acc, file| {
                    // These two have to be recreated.  Cloning the Tera context is expensive.
                    let repo = Repository::open(&repo_path).expect("Unable to find git repository.");
                    let mut ctx = ctx.clone();

                    let mut local_bytes = 0;
                    let cur_repo_bytes = atomic_repo_bytes.load(Ordering::SeqCst);
                    size_check!(
                        repo_desc,
                        cur_repo_bytes,
                        self.total_bytes.load(Ordering::SeqCst),
                        return None
                    );
                    let file = match file.size < repo_desc.limit_file_size.unwrap_or(usize::MAX) {
                        true => {
                            GitsyGenerator::fill_file_contents(&repo, &file, &repo_desc).expect("Failed to parse file.")
                        }
                        false => (*file).clone(),
                    };
                    ctx.try_insert("file", &file)
                        .expect("Failed to add file to template engine.");
                    for (templ_path, out_path) in self.settings.outputs.file(Some(parsed_repo), Some(&file)) {
                        let templ_path = templ_path.to_str().expect(&format!(
                            "ERROR: a summary template path is invalid: {}",
                            templ_path.display()
                        ));
                        let out_path = out_path.to_str().expect(&format!(
                            "ERROR: a summary output path is invalid: {}",
                            out_path.display()
                        ));
                        match tera.render(templ_path, &ctx) {
                            Ok(rendered) => {
                                local_bytes = self.write_rendered(&out_path, &rendered);
                                atomic_repo_bytes.fetch_add(local_bytes, Ordering::SeqCst);
                                atomic_bytes.fetch_add(local_bytes, Ordering::SeqCst);

                                // Copy readme files to their real filename, so links to readme files remain valid
                                // across file changes.
                                if let Some(readmes) = &repo_desc.readme_files {
                                    for readme in readmes {
                                        if &file.path == readme {
                                            let mut pretty_path = PathBuf::from(out_path);
                                            pretty_path.pop();
                                            pretty_path.push(&file.path);
                                            match std::fs::copy(&out_path, &pretty_path) {
                                                Ok(_) => louder!(" - wrote readme file: {}", pretty_path.to_string_lossy()),
                                                Err(e) => error!("ERROR: {:?}", e),
                                            }
                                        }
                                    }
                                };

                            }
                            Err(x) => match x.kind {
                                _ => error!("ERROR: {:?}", x),
                            },
                        }
                    }
                    ctx.remove("file");
                    if atomic_repo_bytes.load(Ordering::SeqCst) >= repo_desc.limit_repo_size.unwrap_or(usize::MAX) {
                        return None;
                    }
                    Some(acc.unwrap() + local_bytes)
                },
            )
            .while_some() // allow short-circuiting if size limit is reached
            .sum::<usize>();
        repo_bytes = atomic_repo_bytes.load(Ordering::SeqCst);
        size_check_atomic!(
            repo_desc,
            atomic_bytes,
            self.total_bytes,
            return Err(GitsyError::kind(
                GitsyErrorKind::Settings,
                Some("ERROR: size limit exceeded")
            ))
        );
        Ok(repo_bytes)
    }

    pub fn gen_dir(
        &self,
        ctx: &Context,
        atomic_bytes: &AtomicUsize,
        parsed_repo: &GitRepo,
        repo_desc: &GitsySettingsRepo,
        repo: &Repository,
    ) -> Result<usize, GitsyError> {
        let mut ctx = ctx.clone();
        let tera = self.tera.as_ref().expect("ERROR: generate called without a context!?");
        let mut repo_bytes = 0;
        for dir in parsed_repo.all_files.iter().filter(|x| x.kind == "dir") {
            let listing = dir_listing(&repo, &dir).expect("Failed to parse file.");
            ctx.insert("dir", dir);
            ctx.try_insert("files", &listing)
                .expect("Failed to add dir to template engine.");
            for (templ_path, out_path) in self.settings.outputs.dir(Some(parsed_repo), Some(dir)) {
                let templ_path = templ_path.to_str().expect(&format!(
                    "ERROR: a summary template path is invalid: {}",
                    templ_path.display()
                ));
                let out_path = out_path.to_str().expect(&format!(
                    "ERROR: a summary output path is invalid: {}",
                    out_path.display()
                ));
                match tera.render(templ_path, &ctx) {
                    Ok(rendered) => {
                        let bytes = self.write_rendered(&out_path, &rendered);
                        repo_bytes += bytes;
                        atomic_bytes.fetch_add(bytes, Ordering::SeqCst);
                    }
                    Err(x) => match x.kind {
                        _ => error!("ERROR: {:?}", x),
                    },
                }
            }
            ctx.remove("files");
            ctx.remove("dir");
            size_check_atomic!(
                repo_desc,
                atomic_bytes,
                self.total_bytes,
                return Err(GitsyError::kind(
                    GitsyErrorKind::Settings,
                    Some("ERROR: size limit exceeded")
                ))
            );
        }
        Ok(repo_bytes)
    }

    fn copy_assets(
        &self,
        repo_desc: Option<&GitsySettingsRepo>,
        parsed_repo: Option<&GitRepo>,
        repo: Option<&Repository>,
    ) -> Result<usize, GitsyError> {
        let mut bytes = 0;
        match repo_desc {
            Some(repo_desc) => {
                let parsed_repo = parsed_repo.expect("ERROR: attempted to fill repo assets without a repository");
                let repo = repo.expect("ERROR: attempted to fill repo assets without a repository");
                if repo_desc.asset_files.is_some() {
                    let target_dir = self.settings.outputs.repo_assets::<GitFile>(Some(&parsed_repo), None);
                    for src_file in repo_desc.asset_files.as_ref().unwrap() {
                        // Read the asset file contents from the git repo
                        let src_file = PathBuf::from(src_file);
                        let src_contents = self.settings.outputs
                            .asset_contents(&src_file, Some(parsed_repo), Some(repo))?;

                        // Determine the output path
                        let mut dst_file = PathBuf::from(&target_dir);
                        let basename = src_file.file_name()
                            .ok_or(GitsyError::kind(
                                GitsyErrorKind::Settings,
                                Some(&format!(
                                    "ERROR: repo asset file missing filename: {}",
                                    src_file.display()
                                ))))?;
                        dst_file.push(basename);

                        // Open destination file for writing
                        let mut file = File::create(&dst_file)
                            .map_err(|e| GitsyError::sourced_kind(
                                GitsyErrorKind::Settings,
                                Some(&format!(
                                    "ERROR: unable to open repo asset file for writing: {}",
                                    dst_file.display()
                                )),
                                e))?;

                        // Write to disk
                        file.write(&src_contents)
                            .map_err(|e| GitsyError::sourced_kind(
                                GitsyErrorKind::Settings,
                                Some(&format!(
                                    "ERROR: unable to write repo asset file: {}",
                                    dst_file.display()
                                )),
                                e))?;

                        if let Ok(meta) = std::fs::metadata(dst_file) {
                            bytes += meta.len() as usize;
                        }
                        loud!(" - copied repo asset: {}", src_file.display());
                    }
                }
            }
            _ => {
                if self.settings.asset_files.is_some() {
                    let target_dir = self.settings.outputs.global_assets::<GitFile>(None, None);
                    for src_file in self.settings.asset_files.as_ref().unwrap() {
                        let src_file = self.settings.outputs.asset_path(src_file, None, None);
                        let mut dst_file = PathBuf::from(&target_dir);
                        dst_file.push(
                            src_file
                                .file_name()
                                .expect(&format!("Failed to copy asset file: {}", src_file.display())),
                        );
                        std::fs::copy(&src_file, &dst_file)
                            .expect(&format!("Failed to copy asset file: {}", src_file.display()));
                        if let Ok(meta) = std::fs::metadata(dst_file) {
                            bytes += meta.len() as usize;
                        }
                        loud!(" - copied global asset: {}", src_file.display());
                    }
                }
            }
        }
        Ok(bytes)
    }

    pub fn generate_repo(
        &self,
        repo_desc: &GitsySettingsRepo,
        pad_name_len: usize,
    ) -> Result<(GitRepo, usize), GitsyError> {
        loudest!("Repo settings:\n{:#?}", &repo_desc);
        let start_repo = Instant::now();

        let name = repo_desc.name.as_deref().expect("A configured repository has no name!");
        if self.settings.threads.unwrap_or(0) == 1 || VERBOSITY.load(Ordering::SeqCst) > 1 {
            normal_noln!("[{}{}]... ", name, " ".repeat(pad_name_len - name.len()));
        }
        let repo_path = self.find_repo(&name, &repo_desc)?;
        let repo = Repository::open(&repo_path).expect("Unable to find git repository.");

        let metadata = GitsyMetadata {
            full_name: repo_desc.name.clone(),
            description: repo_desc.description.clone(),
            website: repo_desc.website.clone(),
            clone: repo_desc.clone_url.clone(),
            attributes: repo_desc.attributes.clone().unwrap_or_default(),
        };
        let parsed_repo = parse_repo(&repo, &name, &repo_desc, metadata).expect("Failed to analyze repo HEAD.");
        let minimized_repo = parsed_repo.minimal_clone(self.settings.limit_context.unwrap_or(usize::MAX));
        let atomic_bytes = AtomicUsize::new(0);

        let mut local_ctx = self.new_context(Some(&minimized_repo))?;

        // Add README file to context, if specified and found
        if let Some(readmes) = &repo_desc.readme_files {
            for readme in readmes {
                if let Some(file) = parsed_repo.root_files.iter().filter(|x| &x.name == readme).next() {
                    louder!(" - found readme file: {}", file.name);
                    let _ =
                        GitsyGenerator::fill_file_contents(&repo, &file, &repo_desc).expect("Failed to parse file.");
                    local_ctx.insert("readme", &file);
                    break;
                }
            }
        };

        let fns = &[
            GitsyGenerator::gen_summary,
            GitsyGenerator::gen_branches,
            GitsyGenerator::gen_branch,
            GitsyGenerator::gen_tags,
            GitsyGenerator::gen_tag,
            GitsyGenerator::gen_history,
            GitsyGenerator::gen_commit,
            GitsyGenerator::gen_file,
            GitsyGenerator::gen_dir,
            GitsyGenerator::gen_files,
        ];

        let repo_bytes: usize = fns
            .par_iter()
            .try_fold(
                || 0,
                |acc, x| {
                    let repo = Repository::open(&repo_path).expect("Unable to find git repository.");
                    let bytes = x(&self, &local_ctx, &atomic_bytes, &parsed_repo, repo_desc, &repo)?;
                    // remove these bytes from the current repo bytes and move them to the total bytes.
                    atomic_bytes.fetch_sub(bytes, Ordering::SeqCst);
                    self.total_bytes.fetch_add(bytes, Ordering::SeqCst);
                    Ok::<usize, GitsyError>(acc + bytes)
                },
            )
            .try_reduce(|| 0, |acc, x| Ok(acc + x))?;

        size_check!(
            repo_desc,
            0,
            self.total_bytes.load(Ordering::SeqCst),
            return Err(GitsyError::kind(
                GitsyErrorKind::Settings,
                Some("ERROR: size limit exceeded")
            ))
        );

        self.copy_assets(Some(&repo_desc), Some(&parsed_repo), Some(&repo))?;

        normal!(
            "{}{}done in {:.2}s ({} bytes)",
            match self.settings.threads.unwrap_or(0) == 1 && VERBOSITY.load(Ordering::SeqCst) <= 1 {
                true => "".into(),
                false => format!("[{}{}]... ", name, " ".repeat(pad_name_len - name.len())),
            },
            match VERBOSITY.load(Ordering::SeqCst) > 1 {
                true => " - ",
                _ => "",
            },
            start_repo.elapsed().as_secs_f32(),
            repo_bytes
        );
        Ok((minimized_repo, repo_bytes))
    }

    pub fn generate(&mut self) -> Result<(), GitsyError> {
        let start_all = Instant::now();
        self.tera = Some(self.tera_init()?);
        self.generated_dt = chrono::offset::Local::now();

        if self.cli.should_clean {
            self.settings.outputs.clean();
        }

        if self.repo_descriptions.len() == 0 {
            panic!(
                "No Git repositories defined!  Please check your configuration file ({})",
                self.cli.path.display()
            );
        }

        self.settings.outputs.create();

        // Sort the repositories by name
        let mut repo_vec: Vec<GitsySettingsRepo> = self.repo_descriptions.iter().cloned().collect();
        repo_vec.sort_by(|x, y| {
            x.name
                .as_deref()
                .map(|n| n.cmp(&y.name.as_deref().unwrap_or_default()))
                .unwrap_or(cmp::Ordering::Equal)
        });

        // Find the one with the longest name, for pretty printing
        let global_name = "repo list";
        let longest_repo_name = repo_vec
            .iter()
            .fold(0, |acc, x| {
                cmp::max(acc, x.name.as_deref().map(|n| n.len()).unwrap_or(0))
            })
            .max(global_name.len());

        loudest!("Global settings:\n{:#?}", &self.settings);

        let shared_repos = std::sync::Mutex::new(Vec::<GitRepo>::new());

        // Iterate over each repository, generating outputs
        let mut total_bytes = match self.settings.threads.unwrap_or(0) {
            n if n == 1 => {
                let mut tb = 0;
                for repo_desc in &repo_vec {
                    let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
                    size_check!(
                        repo_desc,
                        0,
                        tb,
                        return Err(GitsyError::kind(
                            GitsyErrorKind::Settings,
                            Some("ERROR: site size limit exceeded")
                        ))
                    );
                    shared_repos.lock().unwrap().push(minimized_repo);
                    tb += repo_bytes;
                }
                tb
            }
            n if n == 0 => {
                let total_bytes: usize = repo_vec
                    .par_iter()
                    .try_fold(
                        || 0,
                        |acc, repo_desc| {
                            let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
                            size_check!(
                                repo_desc,
                                0,
                                acc + repo_bytes,
                                return Err(GitsyError::kind(
                                    GitsyErrorKind::Unknown,
                                    Some("ERROR: site size limit exceeded")
                                ))
                            );
                            shared_repos.lock().unwrap().push(minimized_repo);
                            Ok::<usize, GitsyError>(repo_bytes)
                        },
                    )
                    .try_reduce(|| 0, |acc, x| Ok(acc + x))?;
                total_bytes
            }
            n => {
                let pool = rayon::ThreadPoolBuilder::new().num_threads(n).build().unwrap();

                let total_bytes = pool.install(|| {
                    let total_bytes: usize = repo_vec
                        .par_iter()
                        .try_fold(
                            || 0,
                            |acc, repo_desc| {
                                let (minimized_repo, repo_bytes) = self.generate_repo(repo_desc, longest_repo_name)?;
                                size_check!(
                                    repo_desc,
                                    0,
                                    acc + repo_bytes,
                                    return Err(GitsyError::kind(
                                        GitsyErrorKind::Unknown,
                                        Some("ERROR: site size limit exceeded")
                                    ))
                                );
                                shared_repos.lock().unwrap().push(minimized_repo);
                                Ok::<usize, GitsyError>(repo_bytes)
                            },
                        )
                        .try_reduce(|| 0, |acc, x| Ok(acc + x))?;
                    Ok::<usize, GitsyError>(total_bytes)
                })?;
                total_bytes
            }
        };
        size_check!(
            self.settings,
            0,
            total_bytes,
            return Err(GitsyError::kind(
                GitsyErrorKind::Unknown,
                Some("ERROR: site size limit exceeded")
            ))
        );

        let repos = shared_repos;

        let start_global = Instant::now();
        normal_noln!(
            "[{}{}]... ",
            global_name,
            " ".repeat(longest_repo_name - global_name.len())
        );
        let mut global_ctx = self.new_context(None)?;
        global_ctx.try_insert("repos", &repos)?;

        let mut global_bytes = 0;
        global_bytes += self.gen_repo_list(&global_ctx)?;
        global_bytes += self.gen_error(&global_ctx)?;

        self.copy_assets(None, None, None)?;

        total_bytes += global_bytes;
        size_check!(
            self.settings,
            0,
            total_bytes,
            return Err(GitsyError::kind(
                GitsyErrorKind::Unknown,
                Some("ERROR: site size limit exceeded")
            ))
        );
        normal!(
            "done in {:.2}s ({} bytes)",
            start_global.elapsed().as_secs_f32(),
            global_bytes
        );
        loud!(
            "Wrote {} bytes in {:.2}s",
            total_bytes,
            start_all.elapsed().as_secs_f32()
        );

        if self.cli.should_open {
            if let Some((_templ, out)) = self.settings.outputs.repo_list::<GitFile>(None, None).first() {
                let _ = open::that(&format!("file://{}", out.display()));
            }
        }

        Ok(())
    }
}