Files
sukr/src/content.rs
Timothy DeHerrera 244b0ce85b feat(content): add Section struct and discover_sections()
Enable generic section processing by adding:
- Section struct with index, name, section_type, path
- Section::collect_items() to gather content in a section
- discover_sections() to find all directories with _index.md

Section type is determined from frontmatter `section_type` field,
falling back to directory name. Includes 5 unit tests.
2026-01-31 15:02:20 -07:00

561 lines
18 KiB
Rust

//! Content discovery and frontmatter parsing.
use crate::error::{Error, Result};
use gray_matter::{engine::YAML, Matter};
use serde::Serialize;
use std::fs;
use std::path::{Path, PathBuf};
/// The type of content being processed.
#[derive(Debug, Clone, PartialEq)]
pub enum ContentKind {
/// Blog post with full metadata (date, tags, etc.)
Post,
/// Standalone page (about, collab)
Page,
/// Section index (_index.md)
Section,
/// Project card with external link
Project,
}
/// A navigation menu item discovered from the filesystem.
#[derive(Debug, Clone, Serialize)]
pub struct NavItem {
/// Display label (from nav_label or title)
pub label: String,
/// URL path (e.g., "/blog/index.html" or "/about.html")
pub path: String,
/// Sort order (lower = first, default 50)
pub weight: i64,
}
/// Parsed frontmatter from a content file.
#[derive(Debug)]
pub struct Frontmatter {
pub title: String,
pub description: Option<String>,
pub date: Option<String>,
pub tags: Vec<String>,
/// Sort order for nav and listings
pub weight: Option<i64>,
/// For project cards: external link
pub link_to: Option<String>,
/// Custom navigation label (defaults to title)
pub nav_label: Option<String>,
/// Section type for template dispatch (e.g., "blog", "projects")
pub section_type: Option<String>,
/// Override template for this content item
pub template: Option<String>,
}
/// A content item ready for rendering.
#[derive(Debug)]
pub struct Content {
pub kind: ContentKind,
pub frontmatter: Frontmatter,
pub body: String,
pub source_path: PathBuf,
pub slug: String,
}
impl Content {
/// Load and parse a markdown file with YAML frontmatter.
pub fn from_path(path: impl AsRef<Path>, kind: ContentKind) -> Result<Self> {
Self::from_path_inner(path.as_ref(), kind)
}
fn from_path_inner(path: &Path, kind: ContentKind) -> Result<Self> {
let raw = fs::read_to_string(path).map_err(|e| Error::ReadFile {
path: path.to_path_buf(),
source: e,
})?;
let matter = Matter::<YAML>::new();
let parsed = matter.parse(&raw);
let frontmatter = parse_frontmatter(path, &parsed)?;
// Derive slug from filename (without extension)
let slug = path
.file_stem()
.and_then(|s| s.to_str())
.unwrap_or("untitled")
.to_string();
Ok(Content {
kind,
frontmatter,
body: parsed.content,
source_path: path.to_path_buf(),
slug,
})
}
/// Compute the output path relative to the output directory.
/// e.g., content/blog/foo.md → blog/foo.html
pub fn output_path(&self, content_root: &Path) -> PathBuf {
let relative = self
.source_path
.strip_prefix(content_root)
.unwrap_or(&self.source_path);
match self.kind {
ContentKind::Section => {
// _index.md → parent/index.html (listing pages stay as index.html)
let parent = relative.parent().unwrap_or(Path::new(""));
parent.join("index.html")
}
_ => {
// Regular content → parent/slug.html (flat structure)
let parent = relative.parent().unwrap_or(Path::new(""));
parent.join(format!("{}.html", self.slug))
}
}
}
}
fn parse_frontmatter(path: &Path, parsed: &gray_matter::ParsedEntity) -> Result<Frontmatter> {
let data = parsed.data.as_ref().ok_or_else(|| Error::Frontmatter {
path: path.to_path_buf(),
message: "missing frontmatter".to_string(),
})?;
let pod = data.as_hashmap().map_err(|_| Error::Frontmatter {
path: path.to_path_buf(),
message: "frontmatter is not a valid map".to_string(),
})?;
let title = pod
.get("title")
.and_then(|v| v.as_string().ok())
.ok_or_else(|| Error::Frontmatter {
path: path.to_path_buf(),
message: "missing required 'title' field".to_string(),
})?;
let description = pod.get("description").and_then(|v| v.as_string().ok());
let date = pod.get("date").and_then(|v| v.as_string().ok());
let weight = pod.get("weight").and_then(|v| v.as_i64().ok());
let link_to = pod.get("link_to").and_then(|v| v.as_string().ok());
let nav_label = pod.get("nav_label").and_then(|v| v.as_string().ok());
let section_type = pod.get("section_type").and_then(|v| v.as_string().ok());
let template = pod.get("template").and_then(|v| v.as_string().ok());
// Handle nested taxonomies.tags structure
let tags = if let Some(taxonomies) = pod.get("taxonomies") {
if let Ok(tax_map) = taxonomies.as_hashmap() {
if let Some(tags_pod) = tax_map.get("tags") {
if let Ok(tags_vec) = tags_pod.as_vec() {
tags_vec.iter().filter_map(|v| v.as_string().ok()).collect()
} else {
Vec::new()
}
} else {
Vec::new()
}
} else {
Vec::new()
}
} else {
Vec::new()
};
Ok(Frontmatter {
title,
description,
date,
tags,
weight,
link_to,
nav_label,
section_type,
template,
})
}
/// Discover navigation items from the content directory structure.
///
/// Rules:
/// - Top-level `.md` files (except `_index.md`) become nav items (pages)
/// - Directories containing `_index.md` become nav items (sections)
/// - Items are sorted by weight (lower first), then alphabetically by label
pub fn discover_nav(content_dir: &Path) -> Result<Vec<NavItem>> {
let mut nav_items = Vec::new();
// Read top-level entries in content directory
let entries = fs::read_dir(content_dir).map_err(|e| Error::ReadFile {
path: content_dir.to_path_buf(),
source: e,
})?;
for entry in entries.filter_map(|e| e.ok()) {
let path = entry.path();
if path.is_file() {
// Top-level .md file (except _index.md) → page nav item
if path.extension().is_some_and(|ext| ext == "md") {
let file_name = path.file_name().and_then(|n| n.to_str()).unwrap_or("");
if file_name != "_index.md" {
let content = Content::from_path(&path, ContentKind::Page)?;
let slug = path.file_stem().and_then(|s| s.to_str()).unwrap_or("page");
nav_items.push(NavItem {
label: content
.frontmatter
.nav_label
.unwrap_or(content.frontmatter.title),
path: format!("/{}.html", slug),
weight: content.frontmatter.weight.unwrap_or(50),
});
}
}
} else if path.is_dir() {
// Directory with _index.md → section nav item
let index_path = path.join("_index.md");
if index_path.exists() {
let content = Content::from_path(&index_path, ContentKind::Section)?;
let dir_name = path
.file_name()
.and_then(|n| n.to_str())
.unwrap_or("section");
nav_items.push(NavItem {
label: content
.frontmatter
.nav_label
.unwrap_or(content.frontmatter.title),
path: format!("/{}/index.html", dir_name),
weight: content.frontmatter.weight.unwrap_or(50),
});
}
}
}
// Sort by weight, then alphabetically by label
nav_items.sort_by(|a, b| a.weight.cmp(&b.weight).then_with(|| a.label.cmp(&b.label)));
Ok(nav_items)
}
/// A discovered section from the content directory.
#[derive(Debug)]
pub struct Section {
/// The section's index content (_index.md)
pub index: Content,
/// Directory name (e.g., "blog", "projects")
pub name: String,
/// Section type for template dispatch (from frontmatter or directory name)
pub section_type: String,
/// Path to section directory
pub path: PathBuf,
}
impl Section {
/// Collect all content items in this section (excluding _index.md).
pub fn collect_items(&self) -> Result<Vec<Content>> {
let mut items = Vec::new();
for entry in fs::read_dir(&self.path)
.map_err(|e| Error::ReadFile {
path: self.path.clone(),
source: e,
})?
.filter_map(|e| e.ok())
{
let path = entry.path();
if path.is_file()
&& path.extension().is_some_and(|ext| ext == "md")
&& path.file_name().is_some_and(|n| n != "_index.md")
{
// Determine content kind based on section type
let kind = match self.section_type.as_str() {
"blog" => ContentKind::Post,
"projects" => ContentKind::Project,
_ => ContentKind::Page,
};
items.push(Content::from_path(&path, kind)?);
}
}
Ok(items)
}
}
/// Discover all sections (directories with _index.md) in the content directory.
pub fn discover_sections(content_dir: &Path) -> Result<Vec<Section>> {
let mut sections = Vec::new();
let entries = fs::read_dir(content_dir).map_err(|e| Error::ReadFile {
path: content_dir.to_path_buf(),
source: e,
})?;
for entry in entries.filter_map(|e| e.ok()) {
let path = entry.path();
if path.is_dir() {
let index_path = path.join("_index.md");
if index_path.exists() {
let index = Content::from_path(&index_path, ContentKind::Section)?;
let name = path
.file_name()
.and_then(|n| n.to_str())
.unwrap_or("section")
.to_string();
// Section type from frontmatter, or fall back to directory name
let section_type = index
.frontmatter
.section_type
.clone()
.unwrap_or_else(|| name.clone());
sections.push(Section {
index,
name,
section_type,
path,
});
}
}
}
// Sort by weight
sections.sort_by(|a, b| {
let wa = a.index.frontmatter.weight.unwrap_or(50);
let wb = b.index.frontmatter.weight.unwrap_or(50);
wa.cmp(&wb)
});
Ok(sections)
}
#[cfg(test)]
mod tests {
use super::*;
use std::fs;
fn create_test_dir() -> tempfile::TempDir {
tempfile::tempdir().expect("failed to create temp dir")
}
fn write_frontmatter(path: &Path, title: &str, weight: Option<i64>, nav_label: Option<&str>) {
let mut content = format!("---\ntitle: \"{}\"\n", title);
if let Some(w) = weight {
content.push_str(&format!("weight: {}\n", w));
}
if let Some(label) = nav_label {
content.push_str(&format!("nav_label: \"{}\"\n", label));
}
content.push_str("---\n\nBody content.");
fs::write(path, content).expect("failed to write test file");
}
#[test]
fn test_discover_nav_finds_pages() {
let dir = create_test_dir();
let content_dir = dir.path();
// Create top-level page
write_frontmatter(&content_dir.join("about.md"), "About Me", None, None);
let nav = discover_nav(content_dir).expect("discover_nav failed");
assert_eq!(nav.len(), 1);
assert_eq!(nav[0].label, "About Me");
assert_eq!(nav[0].path, "/about.html");
}
#[test]
fn test_discover_nav_finds_sections() {
let dir = create_test_dir();
let content_dir = dir.path();
// Create section directory with _index.md
let blog_dir = content_dir.join("blog");
fs::create_dir(&blog_dir).expect("failed to create blog dir");
write_frontmatter(&blog_dir.join("_index.md"), "Blog", None, None);
let nav = discover_nav(content_dir).expect("discover_nav failed");
assert_eq!(nav.len(), 1);
assert_eq!(nav[0].label, "Blog");
assert_eq!(nav[0].path, "/blog/index.html");
}
#[test]
fn test_discover_nav_excludes_root_index() {
let dir = create_test_dir();
let content_dir = dir.path();
// Create _index.md at root (should be excluded from nav)
write_frontmatter(&content_dir.join("_index.md"), "Home", None, None);
write_frontmatter(&content_dir.join("about.md"), "About", None, None);
let nav = discover_nav(content_dir).expect("discover_nav failed");
assert_eq!(nav.len(), 1);
assert_eq!(nav[0].label, "About");
}
#[test]
fn test_discover_nav_sorts_by_weight() {
let dir = create_test_dir();
let content_dir = dir.path();
write_frontmatter(&content_dir.join("about.md"), "About", Some(30), None);
write_frontmatter(&content_dir.join("contact.md"), "Contact", Some(10), None);
write_frontmatter(&content_dir.join("blog.md"), "Blog", Some(20), None);
let nav = discover_nav(content_dir).expect("discover_nav failed");
assert_eq!(nav.len(), 3);
assert_eq!(nav[0].label, "Contact"); // weight 10
assert_eq!(nav[1].label, "Blog"); // weight 20
assert_eq!(nav[2].label, "About"); // weight 30
}
#[test]
fn test_discover_nav_uses_nav_label() {
let dir = create_test_dir();
let content_dir = dir.path();
write_frontmatter(
&content_dir.join("about.md"),
"About The Author",
None,
Some("About"),
);
let nav = discover_nav(content_dir).expect("discover_nav failed");
assert_eq!(nav.len(), 1);
assert_eq!(nav[0].label, "About"); // Uses nav_label, not title
}
// =========================================================================
// discover_sections tests
// =========================================================================
fn write_section_index(
path: &Path,
title: &str,
section_type: Option<&str>,
weight: Option<i64>,
) {
let mut content = format!("---\ntitle: \"{}\"\n", title);
if let Some(st) = section_type {
content.push_str(&format!("section_type: \"{}\"\n", st));
}
if let Some(w) = weight {
content.push_str(&format!("weight: {}\n", w));
}
content.push_str("---\nSection content.\n");
fs::write(path, content).expect("failed to write section index");
}
#[test]
fn test_discover_sections_finds_directories() {
let dir = create_test_dir();
let content_dir = dir.path();
// Create two sections
fs::create_dir(content_dir.join("blog")).unwrap();
write_section_index(&content_dir.join("blog/_index.md"), "Blog", None, None);
fs::create_dir(content_dir.join("projects")).unwrap();
write_section_index(
&content_dir.join("projects/_index.md"),
"Projects",
None,
None,
);
let sections = discover_sections(content_dir).expect("discover_sections failed");
assert_eq!(sections.len(), 2);
let names: Vec<_> = sections.iter().map(|s| s.name.as_str()).collect();
assert!(names.contains(&"blog"));
assert!(names.contains(&"projects"));
}
#[test]
fn test_discover_sections_uses_section_type_from_frontmatter() {
let dir = create_test_dir();
let content_dir = dir.path();
fs::create_dir(content_dir.join("writings")).unwrap();
write_section_index(
&content_dir.join("writings/_index.md"),
"My Writings",
Some("blog"),
None,
);
let sections = discover_sections(content_dir).expect("discover_sections failed");
assert_eq!(sections.len(), 1);
assert_eq!(sections[0].name, "writings");
assert_eq!(sections[0].section_type, "blog"); // From frontmatter, not dir name
}
#[test]
fn test_discover_sections_falls_back_to_dir_name() {
let dir = create_test_dir();
let content_dir = dir.path();
fs::create_dir(content_dir.join("gallery")).unwrap();
write_section_index(
&content_dir.join("gallery/_index.md"),
"Gallery",
None,
None,
);
let sections = discover_sections(content_dir).expect("discover_sections failed");
assert_eq!(sections.len(), 1);
assert_eq!(sections[0].section_type, "gallery"); // Falls back to dir name
}
#[test]
fn test_discover_sections_sorts_by_weight() {
let dir = create_test_dir();
let content_dir = dir.path();
fs::create_dir(content_dir.join("blog")).unwrap();
write_section_index(&content_dir.join("blog/_index.md"), "Blog", None, Some(20));
fs::create_dir(content_dir.join("projects")).unwrap();
write_section_index(
&content_dir.join("projects/_index.md"),
"Projects",
None,
Some(10),
);
let sections = discover_sections(content_dir).expect("discover_sections failed");
assert_eq!(sections.len(), 2);
assert_eq!(sections[0].name, "projects"); // weight 10
assert_eq!(sections[1].name, "blog"); // weight 20
}
#[test]
fn test_section_collect_items() {
let dir = create_test_dir();
let content_dir = dir.path();
fs::create_dir(content_dir.join("blog")).unwrap();
write_section_index(
&content_dir.join("blog/_index.md"),
"Blog",
Some("blog"),
None,
);
write_frontmatter(&content_dir.join("blog/post1.md"), "Post 1", None, None);
write_frontmatter(&content_dir.join("blog/post2.md"), "Post 2", None, None);
let sections = discover_sections(content_dir).expect("discover_sections failed");
assert_eq!(sections.len(), 1);
let items = sections[0].collect_items().expect("collect_items failed");
assert_eq!(items.len(), 2);
let titles: Vec<_> = items.iter().map(|c| c.frontmatter.title.as_str()).collect();
assert!(titles.contains(&"Post 1"));
assert!(titles.contains(&"Post 2"));
}
}