nml/src/elements/paragraph.rs

use std::any::Any;

use regex::Regex;

use crate::compiler::compiler::Compiler;
use crate::compiler::compiler::Target;
use crate::document::document::Document;
use crate::document::element::ContainerElement;
use crate::document::element::ElemKind;
use crate::document::element::Element;
use crate::parser::parser::ParseMode;
use crate::parser::parser::ParserState;
use crate::parser::reports::*;
use crate::parser::rule::Rule;
use crate::parser::source::Cursor;
use crate::parser::source::Token;

// TODO: Full refactor.
// Problem: documents parsed from other sources (e.g. through variables)
// are not merged correctly into the existing paragraph.
// One solution would be to split paragraphs with the "(\n){2,}" regex, which would reduce the work needed by process_text.
// Another fix would be to keep parsing (recursively) into the same document, as the previous version did.
// However, that would break the current `Token` implementation,
// which would then need to be reworked.
/// A paragraph: an ordered list of child elements that, for the HTML target,
/// are compiled together inside a single `<p>` tag.
#[derive(Debug)]
pub struct Paragraph {
	/// Source location covered by this paragraph.
	pub location: Token,
	/// Child elements, in the order they were pushed.
	pub content: Vec<Box<dyn Element>>,
}

impl Paragraph {
	/// Walks the paragraph's children from the last one to the first and
	/// returns the first child accepted by `predicate`, or `None` when no
	/// child is accepted.
	pub fn find_back<P: FnMut(&&Box<dyn Element + 'static>) -> bool>(
		&self,
		predicate: P,
	) -> Option<&Box<dyn Element>> {
		self.content.iter().rfind(predicate)
	}
}

impl Element for Paragraph {
	/// Returns the source location covered by this paragraph.
	fn location(&self) -> &Token { &self.location }

	/// Paragraphs always report the `Special` element kind.
	fn kind(&self) -> ElemKind { ElemKind::Special }

	/// Name of this element.
	fn element_name(&self) -> &'static str { "Paragraph" }

	/// Compiles the paragraph and all of its children.
	///
	/// An empty paragraph compiles to an empty string for every target.
	/// For the HTML target, the compiled children are concatenated and
	/// wrapped in `<p>`…`</p>`.
	///
	/// # Errors
	///
	/// Returns the first error produced while compiling a child element.
	///
	/// # Panics
	///
	/// Panics (via `todo!`) when a non-empty paragraph is compiled for a
	/// target other than HTML.
	fn compile(
		&self,
		compiler: &Compiler,
		document: &dyn Document,
		cursor: usize,
	) -> Result<String, String> {
		// Checked once, before dispatching on the target: an empty paragraph
		// emits nothing at all (not even an empty `<p></p>`).
		if self.content.is_empty() {
			return Ok(String::new());
		}

		match compiler.target() {
			Target::HTML => {
				let mut result = String::from("<p>");

				for elem in &self.content {
					// Each child receives the paragraph's cursor advanced by
					// the length of the output generated so far.
					let compiled = elem.compile(compiler, document, cursor + result.len())?;
					result.push_str(&compiled);
				}

				result.push_str("</p>");
				Ok(result)
			}
			_ => todo!("Unimplemented compiler"),
		}
	}

	/// A paragraph is a container, so this always returns `Some(self)`.
	fn as_container(&self) -> Option<&dyn ContainerElement> { Some(self) }
}

impl ContainerElement for Paragraph {
	/// Returns the paragraph's child elements.
	fn contained(&self) -> &Vec<Box<dyn Element>> { &self.content }

	/// Appends `elem` to the paragraph.
	///
	/// When `elem` comes from the same source as the paragraph, the
	/// paragraph's location is extended so that it ends where `elem` ends.
	///
	/// # Errors
	///
	/// Returns an error, leaving the paragraph untouched, when `elem` is a
	/// block element.
	fn push(&mut self, elem: Box<dyn Element>) -> Result<(), String> {
		// Validate first so that a rejected element never alters the
		// paragraph's location.
		if elem.kind() == ElemKind::Block {
			return Err("Attempted to push block element inside a paragraph".to_string());
		}

		if elem.location().source() == self.location().source() {
			self.location.range = self.location.start()..elem.location().end();
		}
		self.content.push(elem);
		Ok(())
	}
}

/// Parser rule that pushes a new, empty [`Paragraph`] wherever a run of two
/// or more consecutive newlines is found in the source.
#[auto_registry::auto_registry(registry = "rules", path = "crate::elements::paragraph")]
pub struct ParagraphRule {
	/// Matches a run of two or more `\n` characters.
	re: Regex,
}

impl ParagraphRule {
	/// Builds the rule with its paragraph-separator regex (two or more
	/// consecutive newlines).
	pub fn new() -> Self {
		let re = Regex::new(r"\n{2,}").unwrap();
		Self { re }
	}
}

impl Rule for ParagraphRule {
	/// Name of this rule.
	fn name(&self) -> &'static str { "Paragraph" }

	/// Name of the rule that this rule declares as its predecessor.
	fn previous(&self) -> Option<&'static str> { Some("Comment") }

	/// Looks for the next paragraph separator at or after the cursor.
	///
	/// Returns the start offset of the separator together with an empty
	/// placeholder payload, or `None` when no separator remains.
	fn next_match(
		&self,
		_mode: &ParseMode,
		_state: &ParserState,
		cursor: &Cursor,
	) -> Option<(usize, Box<dyn Any>)> {
		let separator = self.re.find_at(cursor.source.content(), cursor.pos)?;
		// This rule carries no match data, so a zero-sized array is boxed.
		Some((separator.start(), Box::new([false; 0]) as Box<dyn Any>))
	}

	/// Consumes a paragraph separator and pushes a new, empty [`Paragraph`]
	/// to the document through `state`.
	///
	/// The returned cursor sits on the last newline of the separator
	/// (one before the end of the match). No reports are produced.
	///
	/// # Panics
	///
	/// Panics if no separator is found from the cursor position.
	fn on_match(
		&self,
		state: &ParserState,
		document: &dyn Document,
		cursor: Cursor,
		_match_data: Box<dyn Any>,
	) -> (Cursor, Vec<Report>) {
		let separator = self
			.re
			.find_at(cursor.source.content(), cursor.pos)
			.unwrap_or_else(|| panic!("Unknown error"));
		let end_cursor = cursor.at(separator.end() - 1);

		let paragraph = Paragraph {
			location: Token::new(cursor.pos..end_cursor.pos, cursor.source.clone()),
			content: Vec::new(),
		};
		state.push(document, Box::new(paragraph));

		(end_cursor, Vec::new())
	}
}

#[cfg(test)]
mod tests {
	use super::*;
	use crate::elements::paragraph::Paragraph;
	use crate::elements::text::Text;
	use crate::parser::langparser::LangParser;
	use crate::parser::parser::Parser;
	use crate::parser::source::SourceFile;
	use crate::validate_document;
	use std::rc::Rc;

	/// Parses a source containing three groups of text separated by blank
	/// lines and checks that each group ends up in its own `Paragraph`.
	#[test]
	fn parse() {
		// The fixture is a raw string: its exact newlines and whitespace are
		// part of the input, so it must not be re-indented.
		let source = Rc::new(SourceFile::with_content(
			"".to_string(),
			r#"
First paragraph
Second line

Second paragraph\
<- literal \\n


Last paragraph
			"#
			.to_string(),
			None,
		));
		let parser = LangParser::default();
		let (doc, _) = parser.parse(
			ParserState::new(&parser, None),
			source,
			None,
			ParseMode::default(),
		);

		// Expected result, as asserted below: the single newline in the first
		// group becomes a space, the backslash-terminated line in the second
		// group keeps a newline, and the last paragraph ends with one space.
		validate_document!(doc.content().borrow(), 0,
			Paragraph {
				Text { content == "First paragraph Second line" };
			};
			Paragraph {
				Text { content == "Second paragraph\n<- literal \\n" };
			};
			Paragraph {
				Text { content == "Last paragraph " };
			};
		);
	}
}
Media 2024-07-25 13:13:12 +02:00			`use std::any::Any;`
Features & slight refector 2024-07-19 11:52:12 +02:00
			`use regex::Regex;`

Media 2024-07-25 13:13:12 +02:00			`use crate::compiler::compiler::Compiler;`
			`use crate::compiler::compiler::Target;`
			`use crate::document::document::Document;`
Update 2024-07-26 20:01:10 +02:00			`use crate::document::element::ContainerElement;`
Media 2024-07-25 13:13:12 +02:00			`use crate::document::element::ElemKind;`
			`use crate::document::element::Element;`
Fix bugs 2024-10-20 19:38:15 +02:00			`use crate::parser::parser::ParseMode;`
Refactor pt1 2024-08-05 18:40:17 +02:00			`use crate::parser::parser::ParserState;`
Lint 2024-10-24 10:18:49 +02:00			`use crate::parser::reports::*;`
Media 2024-07-25 13:13:12 +02:00			`use crate::parser::rule::Rule;`
			`use crate::parser::source::Cursor;`
			`use crate::parser::source::Token;`
Features & slight refector 2024-07-19 11:52:12 +02:00
			`// TODO: Full refactor`
			`// Problem is that document parsed from other sources i.e by variables`
			`// are not merged correctly into existing paragraph`
			`// A solution would be to use the "(\n){2,}" regex to split paragraph, which would reduce the work needed for process_text`
			`// Another fix would be to keep parsing (recursively) into the same document (like previous version)`
			// The issue is that this would break the current `Token` implementation
			`// Which would need to be reworked`
			`#[derive(Debug)]`
Media 2024-07-25 13:13:12 +02:00			`pub struct Paragraph {`
Update 2024-07-26 20:01:10 +02:00			`pub location: Token,`
Media 2024-07-25 13:13:12 +02:00			`pub content: Vec<Box<dyn Element>>,`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`

Media 2024-07-25 13:13:12 +02:00			`impl Paragraph {`
			`pub fn find_back<P: FnMut(&&Box<dyn Element + 'static>) -> bool>(`
			`&self,`
			`predicate: P,`
			`) -> Option<&Box<dyn Element>> {`
			`self.content.iter().rev().find(predicate)`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`
			`}`

Media 2024-07-25 13:13:12 +02:00			`impl Element for Paragraph {`
			`fn location(&self) -> &Token { &self.location }`
Features & slight refector 2024-07-19 11:52:12 +02:00
Media 2024-07-25 13:13:12 +02:00			`fn kind(&self) -> ElemKind { ElemKind::Special }`
Features & slight refector 2024-07-19 11:52:12 +02:00
Media 2024-07-25 13:13:12 +02:00			`fn element_name(&self) -> &'static str { "Paragraph" }`
Features & slight refector 2024-07-19 11:52:12 +02:00
Fix bugs 2024-10-20 19:38:15 +02:00			`fn compile(`
			`&self,`
			`compiler: &Compiler,`
			`document: &dyn Document,`
			`cursor: usize,`
			`) -> Result<String, String> {`
Media 2024-07-25 13:13:12 +02:00			`if self.content.is_empty() {`
			`return Ok(String::new());`
			`}`
Features & slight refector 2024-07-19 11:52:12 +02:00
Media 2024-07-25 13:13:12 +02:00			`match compiler.target() {`
			`Target::HTML => {`
Fixes & Add tests 2024-08-02 13:36:04 +02:00			`if self.content.is_empty() {`
			`return Ok(String::new());`
Media 2024-07-25 13:13:12 +02:00			`}`

Fixes & Add tests 2024-08-02 13:36:04 +02:00			`let mut result = String::new();`
			`result.push_str("<p>");`

			`for elems in &self.content {`
Fix bugs 2024-10-20 19:38:15 +02:00			`result += elems`
			`.compile(compiler, document, cursor + result.len())?`
			`.as_str();`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`
Fixes & Add tests 2024-08-02 13:36:04 +02:00
			`result.push_str("</p>");`
			`Ok(result)`
Media 2024-07-25 13:13:12 +02:00			`}`
Fixes & Add tests 2024-08-02 13:36:04 +02:00			`_ => todo!("Unimplemented compiler"),`
Media 2024-07-25 13:13:12 +02:00			`}`
			`}`
Update 2024-07-26 20:01:10 +02:00
			`fn as_container(&self) -> Option<&dyn ContainerElement> { Some(self) }`
			`}`

			`impl ContainerElement for Paragraph {`
			`fn contained(&self) -> &Vec<Box<dyn Element>> { &self.content }`

			`fn push(&mut self, elem: Box<dyn Element>) -> Result<(), String> {`
			`if elem.location().source() == self.location().source() {`
			`self.location.range = self.location.start()..elem.location().end();`
			`}`
Fix links & tests 2024-08-01 16:15:10 +02:00			`if elem.kind() == ElemKind::Block {`
			`return Err("Attempted to push block element inside a paragraph".to_string());`
			`}`
Update 2024-07-26 20:01:10 +02:00			`self.content.push(elem);`
			`Ok(())`
			`}`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`

Update macro 2024-08-08 17:11:32 +02:00			`#[auto_registry::auto_registry(registry = "rules", path = "crate::elements::paragraph")]`
Media 2024-07-25 13:13:12 +02:00			`pub struct ParagraphRule {`
Features & slight refector 2024-07-19 11:52:12 +02:00			`re: Regex,`
			`}`

			`impl ParagraphRule {`
Media 2024-07-25 13:13:12 +02:00			`pub fn new() -> Self {`
			`Self {`
			`re: Regex::new(r"\n{2,}").unwrap(),`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`
Media 2024-07-25 13:13:12 +02:00			`}`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`

Media 2024-07-25 13:13:12 +02:00			`impl Rule for ParagraphRule {`
Automatic rules registration 2024-08-08 14:12:16 +02:00			`fn name(&self) -> &'static str { "Paragraph" }`
Fix bugs 2024-10-20 19:38:15 +02:00
Automatic rules registration 2024-08-08 14:12:16 +02:00			`fn previous(&self) -> Option<&'static str> { Some("Comment") }`
Features & slight refector 2024-07-19 11:52:12 +02:00
Fix bugs 2024-10-20 19:38:15 +02:00			`fn next_match(`
			`&self,`
			`_mode: &ParseMode,`
			`_state: &ParserState,`
			`cursor: &Cursor,`
			`) -> Option<(usize, Box<dyn Any>)> {`
Media 2024-07-25 13:13:12 +02:00			`self.re`
Fix bugs 2024-10-20 19:38:15 +02:00			`.find_at(cursor.source.content(), cursor.pos)`
			`.map(\|m\| (m.start(), Box::new([false; 0]) as Box<dyn Any>))`
Media 2024-07-25 13:13:12 +02:00			`}`
Features & slight refector 2024-07-19 11:52:12 +02:00
Media 2024-07-25 13:13:12 +02:00			`fn on_match(`
			`&self,`
Refactor done 2024-08-06 18:58:41 +02:00			`state: &ParserState,`
Media 2024-07-25 13:13:12 +02:00			`document: &dyn Document,`
			`cursor: Cursor,`
Refactor done 2024-08-06 18:58:41 +02:00			`_match_data: Box<dyn Any>,`
Reports refactor [2/2] 2024-10-24 09:54:52 +02:00			`) -> (Cursor, Vec<Report>) {`
Media 2024-07-25 13:13:12 +02:00			`let end_cursor = match self.re.captures_at(cursor.source.content(), cursor.pos) {`
Features & slight refector 2024-07-19 11:52:12 +02:00			`None => panic!("Unknown error"),`
Media 2024-07-25 13:13:12 +02:00			`Some(capture) => cursor.at(capture.get(0).unwrap().end() - 1),`
Features & slight refector 2024-07-19 11:52:12 +02:00			`};`

Refactor done 2024-08-06 18:58:41 +02:00			`state.push(`
Media 2024-07-25 13:13:12 +02:00			`document,`
Update 2024-07-26 20:01:10 +02:00			`Box::new(Paragraph {`
			`location: Token::new(cursor.pos..end_cursor.pos, cursor.source.clone()),`
			`content: Vec::new(),`
			`}),`
Media 2024-07-25 13:13:12 +02:00			`);`
Features & slight refector 2024-07-19 11:52:12 +02:00
			`(end_cursor, Vec::new())`
Media 2024-07-25 13:13:12 +02:00			`}`
Features & slight refector 2024-07-19 11:52:12 +02:00			`}`
Fix links & tests 2024-08-01 16:15:10 +02:00
			`#[cfg(test)]`
			`mod tests {`
Reports refactor [2/2] 2024-10-24 09:54:52 +02:00			`use super::*;`
Fix links & tests 2024-08-01 16:15:10 +02:00			`use crate::elements::paragraph::Paragraph;`
			`use crate::elements::text::Text;`
			`use crate::parser::langparser::LangParser;`
Refactor done 2024-08-06 18:58:41 +02:00			`use crate::parser::parser::Parser;`
Fix links & tests 2024-08-01 16:15:10 +02:00			`use crate::parser::source::SourceFile;`
			`use crate::validate_document;`
Lint 2024-10-24 10:18:49 +02:00			`use std::rc::Rc;`
Fix links & tests 2024-08-01 16:15:10 +02:00
			`#[test]`
			`fn parse() {`
			`let source = Rc::new(SourceFile::with_content(`
			`"".to_string(),`
			`r#"`
			`First paragraph`
			`Second line`

			`Second paragraph\`
			`<- literal \\n`


			`Last paragraph`
			`"#`
			`.to_string(),`
			`None,`
			`));`
			`let parser = LangParser::default();`
Fix bugs 2024-10-20 19:38:15 +02:00			`let (doc, _) = parser.parse(`
			`ParserState::new(&parser, None),`
			`source,`
			`None,`
			`ParseMode::default(),`
			`);`
Fix links & tests 2024-08-01 16:15:10 +02:00
			`validate_document!(doc.content().borrow(), 0,`
			`Paragraph {`
			`Text { content == "First paragraph Second line" };`
			`};`
			`Paragraph {`
			`Text { content == "Second paragraph\n<- literal \\n" };`
			`};`
			`Paragraph {`
			`Text { content == "Last paragraph " };`
			`};`
			`);`
			`}`
			`}`