diff options
Diffstat (limited to 'src/collect_files.rs')
-rw-r--r-- | src/collect_files.rs | 188 |
1 files changed, 188 insertions, 0 deletions
diff --git a/src/collect_files.rs b/src/collect_files.rs new file mode 100644 index 0000000..88d065f --- /dev/null +++ b/src/collect_files.rs @@ -0,0 +1,188 @@ +use crate::*; + +use vagabond::*; + + +pub struct Website { + pub name: String, + pub pages: Vec<Page>, + pub static_files: Vec<StaticItem>, + pub static_dirs: Vec<StaticItem>, +} + +pub struct Page { + pub name: String, // Display name + pub parent_url: String, // URL base for relative links + pub file_url: String, // Safe file name, no extension + pub full_url: String, // Safe full URL, no extension + pub source_path: PathBuf, // Absolute path to source file + pub document: MarkdownDocument, // File content parsed as markdown + pub headings: Vec<String>, // Safe name of each document heading +} + +pub struct StaticItem { + pub full_url: String, // Safe full URL, with extension + pub source_path: PathBuf, // Absolute path to source file +} + + + +impl Page { + pub fn back_string(&self) -> String { + let mut back = String::new(); + for c in self.full_url.chars() { + if c == '/' { + back.push_str("../"); + } + } + return back; + } +} + + + +impl Website { + pub fn from_path(path: &Path) -> Self { + let mut new = Self { + pages: Vec::new(), + static_files: Vec::new(), + static_dirs: Vec::new(), + name: match Entry::from_path(path) { + Ok(entry) => entry.name, + Err(err) => error!("Couldn't open {:?}: {:?}", &path, err), + }, + }; + new.collect_entry(path, path); + return new; + } + + fn collect_entry(&mut self, path: &Path, prefix: &Path) { + let entry = Entry::from_path(path).unwrap(); + // Ignore dotted entries. + if entry.name.starts_with('.') { + return; + } + // Get name and extension. + let (mut name, extension) = entry.split_name(); + if let Some((prefix, suffix)) = name.split_once(' ') { + if prefix.chars().all(|c| "0123456789-".contains(c)) { + name = suffix.to_string(); + } + } + let file_url = make_url_safe(&name); + // Generate parent URL, used only for files. + let source_path = entry.original_path.clone(); + let relative_path = source_path.strip_prefix(prefix).unwrap_or_else( + |_| error!("Path doesn't start with {:?}: {:?}", prefix, source_path)); + let mut parent_url = String::new(); + let mut components: Vec<_> = relative_path.components().collect(); + components.pop(); // Remove file segment. + for c in &components { + let segment = &make_url_safe(&c.as_os_str().to_string_lossy()); + parent_url.push_str(segment); parent_url.push('/') + }; + + // Process each entry. + if entry.is_directory() { + if let Some(stripped) = entry.name.strip_prefix("!") { + let full_url = make_url_safe(stripped); + self.static_dirs.push(StaticItem { full_url, source_path }); + } else { + for child in list_directory(entry.original_path).unwrap() { + self.collect_entry(&child.original_path, prefix); + } + } + } else { + match extension.as_str() { + "md" => { + let markdown = std::fs::read_to_string(&source_path).unwrap(); + let document = MarkdownDocument::from_str(&markdown); + let headings = document.blocks.iter() + .filter_map(|block| if let Block::Heading { line, .. } = block { + Some(make_url_safe(&line.to_string())) + } else { + None + }).collect(); + // Change name and path if this is an index file. + let mut name = name; + let mut file_url = file_url; + let mut full_url = format!("{parent_url}{file_url}"); + if file_url == "+index" { + if components.is_empty() { + // This is the index file for the whole site. + name = String::from("Home"); + file_url = String::from("index"); + full_url = String::from("index"); + } else { + // This is an index file for a directory. + name = components[components.len()-1] + .as_os_str().to_string_lossy().to_string(); + file_url = make_url_safe(&name); + full_url = parent_url.strip_suffix('/').unwrap_or(&parent_url).to_string(); + } + } + self.pages.push( + Page { name, parent_url, file_url, full_url, source_path, document, headings }); + }, + _ => { + let full_url = format!("{parent_url}{file_url}.{extension}"); + self.static_files.push(StaticItem { full_url, source_path }); + }, + } + } + } + + // Ext is extension without a dot. + // Checks if a relative link to an internal page name can be reached from + // the current page, and returns a resolved absolute link to the page with extension. + pub fn has_page(&self, from: &Page, path: &str, ext: &str) -> Option<String> { + // Remove heading fragment and file extension. + let (path, heading) = match path.rsplit_once('#') { + Some((path, heading)) => match heading.is_empty() { + true => (path, None), + false => (path, Some(heading)), + } + None => (path, None), + }; + let path = path.strip_suffix(&format!(".{ext}")).unwrap_or(path); + + // Attach parent of current page to given path. + let directory = match from.parent_url.rsplit_once('/') { + Some((parent, _)) => parent, + None => &from.parent_url, + }; + let full_path = match path.starts_with("/") { + true => path.to_string(), + false => format!("{directory}/{path}"), + }; + + // Remove relative portions of path. + let segments: Vec<&str> = full_path.split("/") + .filter(|seg| !seg.is_empty() && *seg != ".") + .collect(); + let mut reduced_segments: Vec<&str> = segments.windows(2) + .filter(|w| w[1] != "..") + .map(|w| w[1]) + .collect(); + // The first segment is always skipped by the previous step. + if !segments.is_empty() && segments.get(1) != Some(&"..") { + if segments[0] != ".." { + reduced_segments.insert(0, segments[0]); + } + } + let path = reduced_segments.join("/"); + + for page in &self.pages { + if page.full_url == path { + if let Some(heading) = heading { + if !page.headings.contains(&make_url_safe(heading)) { + warn!("Page {:?} contains link to nonexistent heading {heading:?} on page {path:?}", from.name); + } + } + return Some(format!("{path}.{ext}")); + } + } + return None; + } +} + |