natter/src/intermediate/blog_post.rs

use std::path::Path;
use std::path::PathBuf;
use std::sync::Arc;
use std::sync::Mutex;

use tokio::task::JoinHandle;
use walkdir::WalkDir;

use crate::error::CustomError;
use crate::intermediate::registry::Registry;

use super::BlogPostPage;

/// A blog post loaded from a single post directory.
///
/// Built by [`BlogPost::load_blog_post`], which turns each org-mode file it
/// loads from the post directory into one [`BlogPostPage`].
#[derive(Debug)]
pub(crate) struct BlogPost {
    /// Identifier of the post, taken from the final component of the post
    /// directory's path (converted lossily to UTF-8).
    pub(crate) id: String,
    /// One page per org-mode file loaded for this post.
    pub(crate) pages: Vec<BlogPostPage>,
}

impl BlogPost {
    /// Load the blog post stored in `post_dir`.
    ///
    /// Every file handed back by `get_org_files(post_dir)` is read, parsed as
    /// an org-mode document, and converted into a [`BlogPostPage`] whose path
    /// is relative to `post_dir`. The post id is the final component of
    /// `post_dir`.
    ///
    /// `root_dir` is accepted but not currently used.
    ///
    /// # Errors
    ///
    /// Returns an error when:
    /// - `post_dir` has no final path component (for example `..` or `/`),
    /// - walking the directory, joining a read task, or reading a file fails,
    /// - a file cannot be parsed as an org-mode document,
    /// - a file's path is not located under `post_dir`,
    /// - [`BlogPostPage::new`] fails.
    pub(crate) async fn load_blog_post<P: AsRef<Path>, R: AsRef<Path>>(
        root_dir: R,
        post_dir: P,
    ) -> Result<BlogPost, CustomError> {
        // The generic wrapper only converts its arguments to `&Path` and
        // delegates to this non-generic function.
        async fn inner(_root_dir: &Path, post_dir: &Path) -> Result<BlogPost, CustomError> {
            // The directory comes from the caller, so a path without a final
            // component is reported as an error rather than a panic.
            let post_id = post_dir
                .file_name()
                .ok_or(CustomError::Static("The post directory should have a name."))?;

            // Wait for every read task. The first `?` handles a failed join,
            // the second handles the I/O error from reading the file.
            let mut org_files = Vec::new();
            for read_task in get_org_files(post_dir)? {
                org_files.push(read_task.await??);
            }

            // The parsed documents borrow from the file contents, so
            // `org_files` has to outlive `parsed_org_files`.
            let mut parsed_org_files = Vec::with_capacity(org_files.len());
            for (path, contents) in org_files.iter() {
                let parsed = organic::parser::parse_file(contents.as_str(), Some(path))
                    .map_err(|_| CustomError::Static("Failed to parse org-mode document."))?;
                parsed_org_files.push((path, parsed));
            }

            let mut pages = Vec::with_capacity(parsed_org_files.len());
            for (real_path, parsed_document) in parsed_org_files.iter() {
                let mut registry = Registry::new();

                // Assign IDs to the targets
                organic::types::AstNode::from(parsed_document)
                    .iter_all_ast_nodes()
                    .for_each(|node| {
                        if let organic::types::AstNode::Target(target) = node {
                            registry.get_target(target.value);
                        }
                    });

                let registry = Arc::new(Mutex::new(registry));
                let relative_to_post_dir_path = real_path.strip_prefix(post_dir)?;
                pages.push(
                    BlogPostPage::new(relative_to_post_dir_path, registry, parsed_document)
                        .await?,
                );
            }

            Ok(BlogPost {
                id: post_id.to_string_lossy().into_owned(),
                pages,
            })
        }
        inner(root_dir.as_ref(), post_dir.as_ref()).await
    }

    /// Get the date for a blog post.
    ///
    /// The date is set by the "#+date" export setting. The intended
    /// behavior is to first attempt to read the date from an index.org
    /// if such a file exists. If that file does not exist or that file
    /// does not contain a date export setting, then iterate through all
    /// the pages under the blog post looking for any page that contains
    /// a date export setting, and return the first date found.
    ///
    /// NOTE: this is not implemented yet. The function currently only
    /// prints the index page (if there is one) to stdout and returns
    /// `()`; no date is extracted or returned.
    pub(crate) fn get_date(&self) -> Result<(), CustomError> {
        if let Some(index_page) = self.get_index_page()? {
            println!("{:?}", index_page);
        }
        Ok(())
    }

    /// Get the blog post page for index.org
    ///
    /// Returns `Ok(None)` when no page has the path `index.org` (relative
    /// to the post directory). This function never returns `Err` today.
    fn get_index_page(&self) -> Result<Option<&BlogPostPage>, CustomError> {
        Ok(self
            .pages
            .iter()
            .find(|page| page.path == Path::new("index.org")))
    }
}

/// Read the file at `path` into a `String`.
///
/// On success the path is handed back together with the contents, so a
/// caller that moved the path into this call still knows which file the
/// text came from. Any I/O error from the read is returned unchanged.
async fn read_file(path: PathBuf) -> std::io::Result<(PathBuf, String)> {
    let read_result = tokio::fs::read_to_string(&path).await;
    read_result.map(|text| (path, text))
}

/// Find every org-mode file under `root_dir` and start reading each one.
///
/// The directory tree is walked with [`WalkDir`]. Every regular file whose
/// extension is `org` (compared ASCII case-insensitively) gets its own tokio
/// task running `read_file`. The returned iterator yields the join handles of
/// those tasks.
///
/// All tasks are spawned before this function returns, so the reads are
/// already in flight while the caller awaits the handles one by one.
///
/// # Errors
///
/// Returns the first [`walkdir::Error`] hit while walking the tree. No task
/// is spawned in that case.
///
/// # Panics
///
/// `tokio::spawn` panics when called outside a Tokio runtime, so this must be
/// called from within one.
fn get_org_files<P: AsRef<Path>>(
    root_dir: P,
) -> Result<impl Iterator<Item = JoinHandle<std::io::Result<(PathBuf, String)>>>, walkdir::Error> {
    let org_files = WalkDir::new(root_dir)
        .into_iter()
        .filter(|entry| match entry {
            Ok(dir_entry) => {
                dir_entry.file_type().is_file()
                    && Path::new(dir_entry.file_name())
                        .extension()
                        // Compare in place; no lowercase copy is allocated.
                        .map(|ext| ext.eq_ignore_ascii_case("org"))
                        .unwrap_or(false)
            }
            // Keep errors so the `collect` below reports the first one.
            Err(_) => true,
        })
        .collect::<Result<Vec<_>, _>>()?;

    // Iterator adaptors are lazy: without this `collect`, each task would be
    // spawned only when the caller advances the iterator, which serializes
    // the reads whenever the caller awaits a handle before asking for the
    // next one. Collecting here is deliberate.
    let read_tasks: Vec<_> = org_files
        .into_iter()
        .map(walkdir::DirEntry::into_path)
        .map(|path| tokio::spawn(read_file(path)))
        .collect();
    Ok(read_tasks.into_iter())
}
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00			`use std::path::Path;`
			`use std::path::PathBuf;`
Fix build by making the registry guarded by an ArcMutex. 2023-10-30 01:19:30 +00:00			`use std::sync::Arc;`
			`use std::sync::Mutex;`
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00
			`use tokio::task::JoinHandle;`
			`use walkdir::WalkDir;`

			`use crate::error::CustomError;`
Introduce a registry into the conversion to intermediate format. 2023-10-27 18:43:06 +00:00			`use crate::intermediate::registry::Registry;`
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00
Starting to introduce a BlogPostPage struct. Blog posts are going to be constructed of multiple documents each forming their own page. This will allow me to link to supporting documents without having to promote them to their own pages. 2023-10-23 20:03:37 +00:00			`use super::BlogPostPage;`

Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`#[derive(Debug)]`
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00			`pub(crate) struct BlogPost {`
Serialize the RenderBlogPost to JSON. This struct still does not contain anything, but I'm just setting up the skeleton for this code. 2023-10-22 20:01:42 +00:00			`pub(crate) id: String,`
Switch to rendering blog post pages instead of blog posts. 2023-10-24 00:30:43 +00:00			`pub(crate) pages: Vec<BlogPostPage>,`
Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`}`

			`impl BlogPost {`
			`pub(crate) async fn load_blog_post<P: AsRef<Path>, R: AsRef<Path>>(`
			`root_dir: R,`
			`post_dir: P,`
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00			`) -> Result<BlogPost, CustomError> {`
Move the logic into convert_blog_post_page_to_render_context. I was writing it in the build command's rust files for convenience, but now it's getting long enough to warrant moving it into its final location. 2023-10-24 02:10:26 +00:00			`async fn inner(_root_dir: &Path, post_dir: &Path) -> Result<BlogPost, CustomError> {`
Setting the post id based on the folder name. 2023-10-22 17:50:11 +00:00			`let post_id = post_dir`
			`.file_name()`
			`.expect("The post directory should have a name.");`

Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`let org_files = {`
			`let mut ret = Vec::new();`
			`let org_files_iter = get_org_files(post_dir)?;`
			`for entry in org_files_iter {`
			`ret.push(entry.await??);`
			`}`
			`ret`
			`};`
			`let parsed_org_files = {`
			`let mut ret = Vec::new();`
			`for (path, contents) in org_files.iter() {`
Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00			`let parsed = organic::parser::parse_file(contents.as_str(), Some(path))`
			`.map_err(\|_\| CustomError::Static("Failed to parse org-mode document."))?;`
Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`ret.push((path, contents, parsed));`
			`}`
			`ret`
			`};`

Starting to introduce a BlogPostPage struct. Blog posts are going to be constructed of multiple documents each forming their own page. This will allow me to link to supporting documents without having to promote them to their own pages. 2023-10-23 20:03:37 +00:00			`let pages = {`
			`let mut ret = Vec::new();`
Introduce a registry into the conversion to intermediate format. 2023-10-27 18:43:06 +00:00			`for (real_path, _contents, parsed_document) in parsed_org_files.iter() {`
Create an intermediate ast node type. 2023-10-29 17:51:32 +00:00			`let mut registry = Registry::new();`

			`// Assign IDs to the targets`
			`organic::types::AstNode::from(parsed_document)`
			`.iter_all_ast_nodes()`
			`.for_each(\|node\| match node {`
			`organic::types::AstNode::Target(target) => {`
			`registry.get_target(target.value);`
			`}`
			`_ => {}`
			`});`

Fix build by making the registry guarded by an ArcMutex. 2023-10-30 01:19:30 +00:00			`let registry = Arc::new(Mutex::new(registry));`
Starting to introduce a BlogPostPage struct. Blog posts are going to be constructed of multiple documents each forming their own page. This will allow me to link to supporting documents without having to promote them to their own pages. 2023-10-23 20:03:37 +00:00			`let relative_to_post_dir_path = real_path.strip_prefix(post_dir)?;`
Make conversion to intermediate state async. We are going to need to do things like call external tools for syntax highlighting so we are going to need async in there eventually. 2023-10-27 19:55:19 +00:00			`ret.push(`
Fix build by making the registry guarded by an ArcMutex. 2023-10-30 01:19:30 +00:00			`BlogPostPage::new(relative_to_post_dir_path, registry, parsed_document)`
			`.await?,`
Make conversion to intermediate state async. We are going to need to do things like call external tools for syntax highlighting so we are going to need async in there eventually. 2023-10-27 19:55:19 +00:00			`);`
Starting to introduce a BlogPostPage struct. Blog posts are going to be constructed of multiple documents each forming their own page. This will allow me to link to supporting documents without having to promote them to their own pages. 2023-10-23 20:03:37 +00:00			`}`
			`ret`
			`};`

Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`Ok(BlogPost {`
Setting the post id based on the folder name. 2023-10-22 17:50:11 +00:00			`id: post_id.to_string_lossy().into_owned(),`
Starting to introduce a BlogPostPage struct. Blog posts are going to be constructed of multiple documents each forming their own page. This will allow me to link to supporting documents without having to promote them to their own pages. 2023-10-23 20:03:37 +00:00			`pages,`
Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`})`
			`}`
			`inner(root_dir.as_ref(), post_dir.as_ref()).await`
			`}`
Finding the index page. 2023-12-17 20:45:50 +00:00
			`/// Get the date for a blog post.`
			`///`
			`/// The date is set by the "#+date" export setting. This will`
			`/// first attempt to read the date from an index.org if such a`
			`/// file exists. If that file does not exist or that file does not`
			`/// contain a date export setting, then this will iterate through`
			`/// all the pages under the blog post looking for any page that`
			`/// contains a date export setting. It will return the first date`
			`/// found.`
			`pub(crate) fn get_date(&self) -> Result<(), CustomError> {`
			`if let Some(index_page) = self.get_index_page()? {`
			`println!("{:?}", index_page);`
			`}`
			`Ok(())`
			`}`

			`/// Get the blog post page for index.org`
			`fn get_index_page(&self) -> Result<Option<&BlogPostPage>, CustomError> {`
			`Ok(self`
			`.pages`
			`.iter()`
			`.find(\|page\| page.path == Path::new("index.org")))`
			`}`
Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`}`

Switch to using CustomError because a boxed StdError is not Send. 2023-10-22 17:44:03 +00:00			`async fn read_file(path: PathBuf) -> std::io::Result<(PathBuf, String)> {`
			`let contents = tokio::fs::read_to_string(&path).await?;`
			`Ok((path, contents))`
			`}`

Moving into a load_blog_post function to create a BlogPost struct. 2023-10-22 16:04:09 +00:00			`fn get_org_files<P: AsRef<Path>>(`
			`root_dir: P,`
			`) -> Result<impl Iterator<Item = JoinHandle<std::io::Result<(PathBuf, String)>>>, walkdir::Error> {`
			`let org_files = WalkDir::new(root_dir)`
			`.into_iter()`
			`.filter(\|e\| match e {`
			`Ok(dir_entry) => {`
			`dir_entry.file_type().is_file()`
			`&& Path::new(dir_entry.file_name())`
			`.extension()`
			`.map(\|ext\| ext.to_ascii_lowercase() == "org")`
			`.unwrap_or(false)`
			`}`
			`Err(_) => true,`
			`})`
			`.collect::<Result<Vec<_>, _>>()?;`
			`let org_files = org_files`
			`.into_iter()`
			`.map(walkdir::DirEntry::into_path)`
			`.map(\|path\| tokio::spawn(read_file(path)));`
			`Ok(org_files)`
			`}`