You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

693 lines
25KB

  1. use std::collections::{HashMap};
  2. use std::iter::FromIterator;
  3. use std::fs::{remove_dir_all, copy, create_dir_all};
  4. use std::path::{Path, PathBuf};
  5. use glob::glob;
  6. use tera::{Tera, Context};
  7. use slug::slugify;
  8. use walkdir::WalkDir;
  9. use errors::{Result, ResultExt};
  10. use config::{Config, get_config};
  11. use page::{Page, populate_previous_and_next_pages, sort_pages};
  12. use pagination::Paginator;
  13. use utils::{create_file, create_directory};
  14. use section::{Section};
  15. use front_matter::{SortBy};
  16. use filters;
  17. use global_fns;
  18. lazy_static! {
  19. pub static ref GUTENBERG_TERA: Tera = {
  20. let mut tera = Tera::default();
  21. tera.add_raw_templates(vec![
  22. ("rss.xml", include_str!("templates/rss.xml")),
  23. ("sitemap.xml", include_str!("templates/sitemap.xml")),
  24. ("robots.txt", include_str!("templates/robots.txt")),
  25. ("anchor-link.html", include_str!("templates/anchor-link.html")),
  26. ("shortcodes/youtube.html", include_str!("templates/shortcodes/youtube.html")),
  27. ("shortcodes/vimeo.html", include_str!("templates/shortcodes/vimeo.html")),
  28. ("shortcodes/gist.html", include_str!("templates/shortcodes/gist.html")),
  29. ("internal/alias.html", include_str!("templates/internal/alias.html")),
  30. ]).unwrap();
  31. tera
  32. };
  33. }
  34. /// Renders the `internal/alias.html` template that will redirect
  35. /// via refresh to the url given
  36. fn render_alias(url: &str, tera: &Tera) -> Result<String> {
  37. let mut context = Context::new();
  38. context.add("url", &url);
  39. tera.render("internal/alias.html", &context)
  40. .chain_err(|| format!("Failed to render alias for '{}'", url))
  41. }
  /// Selects which kind of listing `render_categories_and_tags` should render.
  #[derive(Debug, PartialEq)]
  enum RenderList {
      /// Render the tags listing and one page per tag
      Tags,
      /// Render the categories listing and one page per category
      Categories,
  }
  /// A tag or category, as exposed to the listing templates
  #[derive(Debug, Serialize, PartialEq)]
  struct ListItem {
      /// Name of the tag/category as given to `ListItem::new`
      name: String,
      /// Slugified version of `name`
      slug: String,
      /// Count given to `ListItem::new`
      count: usize,
  }
  54. impl ListItem {
  55. pub fn new(name: &str, count: usize) -> ListItem {
  56. ListItem {
  57. name: name.to_string(),
  58. slug: slugify(name),
  59. count: count,
  60. }
  61. }
  62. }
  /// In-memory representation of a whole site: its configuration, content,
  /// templates and the lookup tables built from the content.
  #[derive(Debug)]
  pub struct Site {
      /// Root directory of the site, as passed to `Site::new`
      pub base_path: PathBuf,
      /// Configuration returned by `get_config`
      pub config: Config,
      /// All pages, keyed by their `file_path`
      pub pages: HashMap<PathBuf, Page>,
      /// All sections, keyed by their `file_path`
      pub sections: HashMap<PathBuf, Section>,
      /// Template engine: the site templates extended with `GUTENBERG_TERA`
      pub tera: Tera,
      /// Whether the livereload script tag is injected into rendered HTML
      live_reload: bool,
      /// Where the site is rendered; `<base_path>/public` unless overridden
      output_path: PathBuf,
      /// Directory of the static files; `<base_path>/static`
      static_path: PathBuf,
      /// Tag name -> `file_path` of every page carrying that tag
      pub tags: HashMap<String, Vec<PathBuf>>,
      /// Category name -> `file_path` of every page in that category
      pub categories: HashMap<String, Vec<PathBuf>>,
      /// `relative_path` of every page/section -> its permalink
      pub permalinks: HashMap<String, String>,
  }
  77. impl Site {
  78. /// Parse a site at the given path. Defaults to the current dir
  79. /// Passing in a path is only used in tests
  80. pub fn new<P: AsRef<Path>>(path: P, config_file: &str) -> Result<Site> {
  81. let path = path.as_ref();
  82. let tpl_glob = format!("{}/{}", path.to_string_lossy().replace("\\", "/"), "templates/**/*.*ml");
  83. let mut tera = Tera::new(&tpl_glob).chain_err(|| "Error parsing templates")?;
  84. tera.extend(&GUTENBERG_TERA)?;
  85. tera.register_filter("markdown", filters::markdown);
  86. tera.register_filter("base64_encode", filters::base64_encode);
  87. tera.register_filter("base64_decode", filters::base64_decode);
  88. let site = Site {
  89. base_path: path.to_path_buf(),
  90. config: get_config(path, config_file),
  91. pages: HashMap::new(),
  92. sections: HashMap::new(),
  93. tera: tera,
  94. live_reload: false,
  95. output_path: path.join("public"),
  96. static_path: path.join("static"),
  97. tags: HashMap::new(),
  98. categories: HashMap::new(),
  99. permalinks: HashMap::new(),
  100. };
  101. Ok(site)
  102. }
  /// Turns on live reload mode: from then on `inject_livereload` adds the
  /// livereload script tag to the HTML it is given.
  pub fn enable_live_reload(&mut self) {
      self.live_reload = true;
  }
  107. /// Gets the path of all ignored pages in the site
  108. pub fn get_ignored_pages(&self) -> Vec<PathBuf> {
  109. self.sections
  110. .values()
  111. .flat_map(|s| s.ignored_pages.iter().map(|p| p.file_path.clone()))
  112. .collect()
  113. }
  114. /// Get all the orphan (== without section) pages in the site
  115. pub fn get_all_orphan_pages(&self) -> Vec<&Page> {
  116. let mut pages_in_sections = vec![];
  117. let mut orphans = vec![];
  118. for s in self.sections.values() {
  119. pages_in_sections.extend(s.all_pages_path());
  120. }
  121. for page in self.pages.values() {
  122. if !pages_in_sections.contains(&page.file_path) {
  123. orphans.push(page);
  124. }
  125. }
  126. orphans
  127. }
  128. /// Used by tests to change the output path to a tmp dir
  129. #[doc(hidden)]
  130. pub fn set_output_path<P: AsRef<Path>>(&mut self, path: P) {
  131. self.output_path = path.as_ref().to_path_buf();
  132. }
  133. /// Reads all .md files in the `content` directory and create pages/sections
  134. /// out of them
  135. pub fn load(&mut self) -> Result<()> {
  136. let base_path = self.base_path.to_string_lossy().replace("\\", "/");
  137. let content_glob = format!("{}/{}", base_path, "content/**/*.md");
  138. // TODO: make that parallel, that's the main bottleneck
  139. // `add_section` and `add_page` can't be used in the parallel version afaik
  140. for entry in glob(&content_glob).unwrap().filter_map(|e| e.ok()) {
  141. let path = entry.as_path();
  142. if path.file_name().unwrap() == "_index.md" {
  143. self.add_section(path)?;
  144. } else {
  145. self.add_page(path)?;
  146. }
  147. }
  148. // Insert a default index section so we don't need to create a _index.md to render
  149. // the index page
  150. let index_path = self.base_path.join("content").join("_index.md");
  151. if !self.sections.contains_key(&index_path) {
  152. let mut index_section = Section::default();
  153. index_section.permalink = self.config.make_permalink("");
  154. self.sections.insert(index_path, index_section);
  155. }
  156. // A map of all .md files (section and pages) and their permalink
  157. // We need that if there are relative links in the content that need to be resolved
  158. let mut permalinks = HashMap::new();
  159. for page in self.pages.values() {
  160. permalinks.insert(page.relative_path.clone(), page.permalink.clone());
  161. }
  162. for section in self.sections.values() {
  163. permalinks.insert(section.relative_path.clone(), section.permalink.clone());
  164. }
  165. for page in self.pages.values_mut() {
  166. page.render_markdown(&permalinks, &self.tera, &self.config)?;
  167. }
  168. for section in self.sections.values_mut() {
  169. section.render_markdown(&permalinks, &self.tera, &self.config)?;
  170. }
  171. self.permalinks = permalinks;
  172. self.populate_sections();
  173. self.populate_tags_and_categories();
  174. self.tera.register_global_function("get_page", global_fns::make_get_page(&self.pages));
  175. Ok(())
  176. }
  177. /// Simple wrapper fn to avoid repeating that code in several places
  178. fn add_page(&mut self, path: &Path) -> Result<()> {
  179. let page = Page::from_file(&path, &self.config)?;
  180. self.pages.insert(page.file_path.clone(), page);
  181. Ok(())
  182. }
  183. /// Simple wrapper fn to avoid repeating that code in several places
  184. fn add_section(&mut self, path: &Path) -> Result<()> {
  185. let section = Section::from_file(path, &self.config)?;
  186. self.sections.insert(section.file_path.clone(), section);
  187. Ok(())
  188. }
  189. /// Called in serve, add the section and render it
  190. fn add_section_and_render(&mut self, path: &Path) -> Result<()> {
  191. self.add_section(path)?;
  192. let mut section = self.sections.get_mut(path).unwrap();
  193. self.permalinks.insert(section.relative_path.clone(), section.permalink.clone());
  194. section.render_markdown(&self.permalinks, &self.tera, &self.config)?;
  195. Ok(())
  196. }
  197. /// Called in serve, add a page again updating permalinks and its content
  198. /// The bool in the result is whether the front matter has been updated or not
  199. /// TODO: the above is very confusing, change that
  200. fn add_page_and_render(&mut self, path: &Path) -> Result<(bool, Page)> {
  201. let existing_page = self.pages.get(path).cloned();
  202. self.add_page(path)?;
  203. let mut page = self.pages.get_mut(path).unwrap();
  204. self.permalinks.insert(page.relative_path.clone(), page.permalink.clone());
  205. page.render_markdown(&self.permalinks, &self.tera, &self.config)?;
  206. if let Some(prev_page) = existing_page {
  207. return Ok((prev_page.meta != page.meta, page.clone()));
  208. }
  209. Ok((true, page.clone()))
  210. }
  211. /// Find out the direct subsections of each subsection if there are some
  212. /// as well as the pages for each section
  213. pub fn populate_sections(&mut self) {
  214. for page in self.pages.values() {
  215. if self.sections.contains_key(&page.parent_path.join("_index.md")) {
  216. self.sections.get_mut(&page.parent_path.join("_index.md")).unwrap().pages.push(page.clone());
  217. }
  218. }
  219. let mut grandparent_paths = HashMap::new();
  220. for section in self.sections.values() {
  221. if let Some(grand_parent) = section.parent_path.parent() {
  222. grandparent_paths.entry(grand_parent.to_path_buf()).or_insert_with(|| vec![]).push(section.clone());
  223. }
  224. }
  225. for section in self.sections.values_mut() {
  226. // TODO: avoid this clone
  227. let (mut sorted_pages, cannot_be_sorted_pages) = sort_pages(section.pages.clone(), section.meta.sort_by());
  228. sorted_pages = populate_previous_and_next_pages(&sorted_pages);
  229. section.pages = sorted_pages;
  230. section.ignored_pages = cannot_be_sorted_pages;
  231. match grandparent_paths.get(&section.parent_path) {
  232. Some(paths) => section.subsections.extend(paths.clone()),
  233. None => continue,
  234. };
  235. }
  236. }
  237. /// Separated from `parse` for easier testing
  238. pub fn populate_tags_and_categories(&mut self) {
  239. for page in self.pages.values() {
  240. if let Some(ref category) = page.meta.category {
  241. self.categories
  242. .entry(category.to_string())
  243. .or_insert_with(|| vec![])
  244. .push(page.file_path.clone());
  245. }
  246. if let Some(ref tags) = page.meta.tags {
  247. for tag in tags {
  248. self.tags
  249. .entry(tag.to_string())
  250. .or_insert_with(|| vec![])
  251. .push(page.file_path.clone());
  252. }
  253. }
  254. }
  255. }
  256. /// Inject live reload script tag if in live reload mode
  257. fn inject_livereload(&self, html: String) -> String {
  258. if self.live_reload {
  259. return html.replace(
  260. "</body>",
  261. r#"<script src="/livereload.js?port=1112&mindelay=10"></script></body>"#
  262. );
  263. }
  264. html
  265. }
  266. pub fn ensure_public_directory_exists(&self) -> Result<()> {
  267. let public = self.output_path.clone();
  268. if !public.exists() {
  269. create_directory(&public)?;
  270. }
  271. Ok(())
  272. }
  273. /// Copy static file to public directory.
  274. pub fn copy_static_file<P: AsRef<Path>>(&self, path: P) -> Result<()> {
  275. let relative_path = path.as_ref().strip_prefix(&self.static_path).unwrap();
  276. let target_path = self.output_path.join(relative_path);
  277. if let Some(parent_directory) = target_path.parent() {
  278. create_dir_all(parent_directory)?;
  279. }
  280. copy(path.as_ref(), &target_path)?;
  281. Ok(())
  282. }
  283. /// Copy the content of the `static` folder into the `public` folder
  284. pub fn copy_static_directory(&self) -> Result<()> {
  285. for entry in WalkDir::new(&self.static_path).into_iter().filter_map(|e| e.ok()) {
  286. let relative_path = entry.path().strip_prefix(&self.static_path).unwrap();
  287. let target_path = self.output_path.join(relative_path);
  288. if entry.path().is_dir() {
  289. if !target_path.exists() {
  290. create_directory(&target_path)?;
  291. }
  292. } else {
  293. let entry_fullpath = self.base_path.join(entry.path());
  294. self.copy_static_file(entry_fullpath)?;
  295. }
  296. }
  297. Ok(())
  298. }
  299. /// Deletes the `public` directory if it exists
  300. pub fn clean(&self) -> Result<()> {
  301. if self.output_path.exists() {
  302. // Delete current `public` directory so we can start fresh
  303. remove_dir_all(&self.output_path).chain_err(|| "Couldn't delete `public` directory")?;
  304. }
  305. Ok(())
  306. }
  307. pub fn rebuild_after_content_change(&mut self, path: &Path) -> Result<()> {
  308. let is_section = path.ends_with("_index.md");
  309. if path.exists() {
  310. // file exists, either a new one or updating content
  311. if is_section {
  312. self.add_section_and_render(path)?;
  313. self.render_sections()?;
  314. } else {
  315. // probably just an update so just re-parse that page
  316. let (frontmatter_changed, page) = self.add_page_and_render(path)?;
  317. // TODO: can probably be smarter and check what changed
  318. if frontmatter_changed {
  319. self.populate_sections();
  320. self.populate_tags_and_categories();
  321. self.build()?;
  322. } else {
  323. self.render_page(&page)?;
  324. }
  325. }
  326. } else {
  327. // File doesn't exist -> a deletion so we remove it from everything
  328. let relative_path = if is_section {
  329. self.sections[path].relative_path.clone()
  330. } else {
  331. self.pages[path].relative_path.clone()
  332. };
  333. self.permalinks.remove(&relative_path);
  334. if is_section {
  335. self.sections.remove(path);
  336. } else {
  337. self.pages.remove(path);
  338. }
  339. // TODO: probably no need to do that, we should be able to only re-render a page or a section.
  340. self.populate_sections();
  341. self.populate_tags_and_categories();
  342. self.build()?;
  343. }
  344. Ok(())
  345. }
  346. pub fn rebuild_after_template_change(&mut self, path: &Path) -> Result<()> {
  347. self.tera.full_reload()?;
  348. match path.file_name().unwrap().to_str().unwrap() {
  349. "sitemap.xml" => self.render_sitemap(),
  350. "rss.xml" => self.render_rss_feed(),
  351. _ => self.build() // TODO: change that
  352. }
  353. }
  354. /// Renders a single content page
  355. pub fn render_page(&self, page: &Page) -> Result<()> {
  356. self.ensure_public_directory_exists()?;
  357. // Copy the nesting of the content directory if we have sections for that page
  358. let mut current_path = self.output_path.to_path_buf();
  359. for component in page.path.split('/') {
  360. current_path.push(component);
  361. if !current_path.exists() {
  362. create_directory(&current_path)?;
  363. }
  364. }
  365. // Make sure the folder exists
  366. create_directory(&current_path)?;
  367. // Finally, create a index.html file there with the page rendered
  368. let output = page.render_html(&self.tera, &self.config)?;
  369. create_file(current_path.join("index.html"), &self.inject_livereload(output))?;
  370. // Copy any asset we found previously into the same directory as the index.html
  371. for asset in &page.assets {
  372. let asset_path = asset.as_path();
  373. copy(&asset_path, &current_path.join(asset_path.file_name().unwrap()))?;
  374. }
  375. Ok(())
  376. }
  /// Builds the site to the `public` directory after deleting it
  ///
  /// In order: the output directory is removed, then the sections (along with
  /// their pages), the orphan pages, the sitemap, the RSS feed (if enabled),
  /// robots.txt and the categories/tags pages (if enabled) are rendered, and
  /// finally the static directory is copied over.
  ///
  /// Panics if `generate_rss`, `generate_categories_pages` or
  /// `generate_tags_pages` is `None` in the config.
  /// NOTE(review): presumably the config loader always fills those in — confirm.
  pub fn build(&self) -> Result<()> {
      self.clean()?;
      self.render_sections()?;
      self.render_orphan_pages()?;
      self.render_sitemap()?;
      if self.config.generate_rss.unwrap() {
          self.render_rss_feed()?;
      }
      self.render_robots()?;
      if self.config.generate_categories_pages.unwrap() {
          self.render_categories_and_tags(RenderList::Categories)?;
      }
      if self.config.generate_tags_pages.unwrap() {
          self.render_categories_and_tags(RenderList::Tags)?;
      }
      // Last step, its result is the result of the whole build
      self.copy_static_directory()
  }
  395. /// Renders robots.txt
  396. fn render_robots(&self) -> Result<()> {
  397. self.ensure_public_directory_exists()?;
  398. create_file(
  399. self.output_path.join("robots.txt"),
  400. &self.tera.render("robots.txt", &Context::new())?
  401. )
  402. }
  403. /// Render the /{categories, list} pages and each individual category/tag page
  404. /// They are the same thing fundamentally, a list of pages with something in common
  405. fn render_categories_and_tags(&self, kind: RenderList) -> Result<()> {
  406. let items = match kind {
  407. RenderList::Categories => &self.categories,
  408. RenderList::Tags => &self.tags,
  409. };
  410. if items.is_empty() {
  411. return Ok(());
  412. }
  413. let (list_tpl_name, single_tpl_name, name, var_name) = if kind == RenderList::Categories {
  414. ("categories.html", "category.html", "categories", "category")
  415. } else {
  416. ("tags.html", "tag.html", "tags", "tag")
  417. };
  418. self.ensure_public_directory_exists()?;
  419. // Create the categories/tags directory first
  420. let public = self.output_path.clone();
  421. let mut output_path = public.to_path_buf();
  422. output_path.push(name);
  423. create_directory(&output_path)?;
  424. // Then render the index page for that kind.
  425. // We sort by number of page in that category/tag
  426. let mut sorted_items = vec![];
  427. for (item, count) in Vec::from_iter(items).into_iter().map(|(a, b)| (a, b.len())) {
  428. sorted_items.push(ListItem::new(item, count));
  429. }
  430. sorted_items.sort_by(|a, b| b.count.cmp(&a.count));
  431. let mut context = Context::new();
  432. context.add(name, &sorted_items);
  433. context.add("config", &self.config);
  434. context.add("current_url", &self.config.make_permalink(name));
  435. context.add("current_path", &format!("/{}", name));
  436. // And render it immediately
  437. let list_output = self.tera.render(list_tpl_name, &context)?;
  438. create_file(output_path.join("index.html"), &self.inject_livereload(list_output))?;
  439. // Now, each individual item
  440. for (item_name, pages_paths) in items.iter() {
  441. let pages: Vec<&Page> = self.pages
  442. .iter()
  443. .filter(|&(path, _)| pages_paths.contains(path))
  444. .map(|(_, page)| page)
  445. .collect();
  446. // TODO: how to sort categories and tag content?
  447. // Have a setting in config.toml or a _category.md and _tag.md
  448. // The latter is more in line with the rest of Gutenberg but order ordering
  449. // doesn't really work across sections.
  450. let mut context = Context::new();
  451. let slug = slugify(&item_name);
  452. context.add(var_name, &item_name);
  453. context.add(&format!("{}_slug", var_name), &slug);
  454. context.add("pages", &pages);
  455. context.add("config", &self.config);
  456. context.add("current_url", &self.config.make_permalink(&format!("{}/{}", name, slug)));
  457. context.add("current_path", &format!("/{}/{}", name, slug));
  458. let single_output = self.tera.render(single_tpl_name, &context)?;
  459. create_directory(&output_path.join(&slug))?;
  460. create_file(
  461. output_path.join(&slug).join("index.html"),
  462. &self.inject_livereload(single_output)
  463. )?;
  464. }
  465. Ok(())
  466. }
  467. fn render_sitemap(&self) -> Result<()> {
  468. self.ensure_public_directory_exists()?;
  469. let mut context = Context::new();
  470. context.add("pages", &self.pages.values().collect::<Vec<&Page>>());
  471. context.add("sections", &self.sections.values().collect::<Vec<&Section>>());
  472. let mut categories = vec![];
  473. if self.config.generate_categories_pages.unwrap() && !self.categories.is_empty() {
  474. categories.push(self.config.make_permalink("categories"));
  475. for category in self.categories.keys() {
  476. categories.push(
  477. self.config.make_permalink(&format!("categories/{}", slugify(category)))
  478. );
  479. }
  480. }
  481. context.add("categories", &categories);
  482. let mut tags = vec![];
  483. if self.config.generate_tags_pages.unwrap() && !self.tags.is_empty() {
  484. tags.push(self.config.make_permalink("tags"));
  485. for tag in self.tags.keys() {
  486. tags.push(
  487. self.config.make_permalink(&format!("tags/{}", slugify(tag)))
  488. );
  489. }
  490. }
  491. context.add("tags", &tags);
  492. let sitemap = self.tera.render("sitemap.xml", &context)?;
  493. create_file(self.output_path.join("sitemap.xml"), &sitemap)?;
  494. Ok(())
  495. }
  496. fn render_rss_feed(&self) -> Result<()> {
  497. self.ensure_public_directory_exists()?;
  498. let mut context = Context::new();
  499. let pages = self.pages.values()
  500. .filter(|p| p.meta.date.is_some())
  501. .take(15) // limit to the last 15 elements
  502. .cloned()
  503. .collect::<Vec<Page>>();
  504. // Don't generate a RSS feed if none of the pages has a date
  505. if pages.is_empty() {
  506. return Ok(());
  507. }
  508. context.add("last_build_date", &pages[0].meta.date);
  509. let (sorted_pages, _) = sort_pages(pages, SortBy::Date);
  510. context.add("pages", &sorted_pages);
  511. context.add("config", &self.config);
  512. let rss_feed_url = if self.config.base_url.ends_with('/') {
  513. format!("{}{}", self.config.base_url, "rss.xml")
  514. } else {
  515. format!("{}/{}", self.config.base_url, "rss.xml")
  516. };
  517. context.add("feed_url", &rss_feed_url);
  518. let sitemap = self.tera.render("rss.xml", &context)?;
  519. create_file(self.output_path.join("rss.xml"), &sitemap)?;
  520. Ok(())
  521. }
  522. fn render_sections(&self) -> Result<()> {
  523. self.ensure_public_directory_exists()?;
  524. let public = self.output_path.clone();
  525. let sections: HashMap<String, Section> = self.sections
  526. .values()
  527. .map(|s| (s.components.join("/"), s.clone()))
  528. .collect();
  529. for section in self.sections.values() {
  530. let mut output_path = public.to_path_buf();
  531. for component in &section.components {
  532. output_path.push(component);
  533. if !output_path.exists() {
  534. create_directory(&output_path)?;
  535. }
  536. }
  537. for page in &section.pages {
  538. self.render_page(page)?;
  539. }
  540. if !section.meta.should_render() {
  541. continue;
  542. }
  543. if section.meta.is_paginated() {
  544. self.render_paginated(&output_path, section)?;
  545. } else {
  546. let output = section.render_html(
  547. &sections,
  548. &self.tera,
  549. &self.config,
  550. )?;
  551. create_file(output_path.join("index.html"), &self.inject_livereload(output))?;
  552. }
  553. }
  554. Ok(())
  555. }
  556. /// Renders all pages that do not belong to any sections
  557. fn render_orphan_pages(&self) -> Result<()> {
  558. self.ensure_public_directory_exists()?;
  559. for page in self.get_all_orphan_pages() {
  560. self.render_page(page)?;
  561. }
  562. Ok(())
  563. }
  564. /// Renders a list of pages when the section/index is wanting pagination.
  565. fn render_paginated(&self, output_path: &Path, section: &Section) -> Result<()> {
  566. self.ensure_public_directory_exists()?;
  567. let paginate_path = match section.meta.paginate_path {
  568. Some(ref s) => s.clone(),
  569. None => unreachable!()
  570. };
  571. let paginator = Paginator::new(&section.pages, section);
  572. for (i, pager) in paginator.pagers.iter().enumerate() {
  573. let folder_path = output_path.join(&paginate_path);
  574. let page_path = folder_path.join(&format!("{}", i + 1));
  575. create_directory(&folder_path)?;
  576. create_directory(&page_path)?;
  577. let output = paginator.render_pager(pager, self)?;
  578. if i > 0 {
  579. create_file(page_path.join("index.html"), &self.inject_livereload(output))?;
  580. } else {
  581. create_file(output_path.join("index.html"), &self.inject_livereload(output))?;
  582. create_file(page_path.join("index.html"), &render_alias(&section.permalink, &self.tera)?)?;
  583. }
  584. }
  585. Ok(())
  586. }
  587. }