update: added folding into expansion node if possible

2024-10-03 22:52:01 +02:00 · 2024-10-03 22:52:01 +02:00 · 142ac9c9e1
commit 142ac9c9e1
parent 09dbd2de91
11 changed files with 278 additions and 41 deletions
--- a/parser/src/passes/double_quote_parsing.c
+++ b/parser/src/passes/double_quote_parsing.c
@ -0,0 +1,98 @@
+/* ************************************************************************** */
+/*                                                                            */
+/*                                                        :::      ::::::::   */
+/*   double_quote_parsing.c                             :+:      :+:    :+:   */
+/*                                                    +:+ +:+         +:+     */
+/*   By: maiboyer <maiboyer@student.42.fr>          +#+  +:+       +#+        */
+/*                                                +#+#+#+#+#+   +#+           */
+/*   Created: 2024/10/02 19:04:32 by maiboyer          #+#    #+#             */
+/*   Updated: 2024/10/03 22:43:27 by maiboyer         ###   ########.fr       */
+/*                                                                            */
+/* ************************************************************************** */
+
+#include "me/string/string.h"
+#include "parser/passes.h"
+#include "me/types.h"
+#include "me/vec/vec_token.h"
+#include "parser/token.h"
+#include "me/char/char.h"
+
+void	push_token_and_create_new(\
+	t_vec_token *tokens, t_token *tok, enum e_token ttype, t_const_str s);
+void	push_token_and_set_new(\
+	t_vec_token *tokens, t_token *tok, enum e_token ttype, t_const_str s);
+
+/// Appends `c` to the token currently being built (`cur`), making sure that
+/// token has type `kind` first:
+/// 	- a TOK_NONE token is replaced by a fresh `kind` token
+/// 	- a token of any other type is pushed onto `subtokens` and a fresh
+/// 		`kind` token is started
+static void	dq_append_char(\
+	t_vec_token *subtokens, t_token *cur, enum e_token kind, char c)
+{
+	if (cur->type == TOK_NONE)
+		*cur = token_new(kind);
+	if (cur->type != kind)
+	{
+		vec_token_push(subtokens, *cur);
+		*cur = token_new(kind);
+	}
+	string_push_char(&cur->string, c);
+}
+
+/// Splits the content of a double quoted token into subtokens and pushes
+/// the resulting TOK_DQUOTE meta token onto `append`.
+///
+/// The string of `dquote` is scanned byte by byte:
+/// 	- runs of whitespace (per `me_isspace`) become TOK_WHITESPACE
+/// 	- each `$` is handed to `push_token_and_create_new` with TOK_DOLLAR
+/// 	- runs of anything else become TOK_NQUOTE
+/// The subtokens then go through `ts_dq_apply_passes`.
+///
+/// `dquote` is only read here. Nothing is pushed onto `append` when ERROR
+/// is returned.
+/// NOTE(review): on failure the meta token itself isn't released here,
+/// presumably `ts_dq_apply_passes` already freed its subtokens, to confirm.
+t_error	_parse_dquote_inner(t_token dquote, t_vec_token *append)
+{
+	t_token	meta;
+	t_token	cur;
+	t_usize	pos;
+	char	ch;
+
+	meta = token_new_meta(TOK_DQUOTE);
+	cur = token_new_none();
+	pos = 0;
+	while (dquote.string.buf[pos] != '\0')
+	{
+		ch = dquote.string.buf[pos];
+		pos++;
+		if (me_isspace(ch))
+			dq_append_char(&meta.subtokens, &cur, TOK_WHITESPACE, ch);
+		else if (ch == '$')
+			push_token_and_create_new(&meta.subtokens, &cur, TOK_DOLLAR, "$");
+		else
+			dq_append_char(&meta.subtokens, &cur, TOK_NQUOTE, ch);
+	}
+	if (cur.type != TOK_NONE)
+		vec_token_push(&meta.subtokens, cur);
+	if (ts_dq_apply_passes(meta.subtokens, &meta.subtokens))
+		return (ERROR);
+	vec_token_push(append, meta);
+	return (NO_ERROR);
+}
+
+/// Pass that replaces every TOK_DQUOTE token of `input` by the meta token
+/// built by `_parse_dquote_inner`; every other token is cloned as is.
+///
+/// There are a few rules the rest of the tokenizer machinery assumes
+/// these functions follow:
+/// 	- the input vec WILL be freed when the function returns, even in
+/// 		case of error
+/// 	- the output vector isn't populated if the function returns an error,
+/// 		thus it shouldn't be freed in case of error
+/// 	- the output tokens may not be direct copies of the input tokens,
+/// 		but need to be cloned (different allocations for stuff)
+///
+/// Returns NO_ERROR and stores the new vector in `*output`, or ERROR if a
+/// double quoted token could not be processed (`*output` is left untouched).
+t_error	ts_double_string_pass(t_vec_token input, t_vec_token *output)
+{
+	t_vec_token	out;
+	t_usize		i;
+
+	i = 0;
+	out = vec_token_new(input.len, token_free);
+	while (i < input.len)
+	{
+		if (input.buffer[i].type == TOK_DQUOTE)
+		{
+			// `out` is local and never handed to the caller on error, so it
+			// has to be released here together with the tokens it holds
+			if (_parse_dquote_inner(input.buffer[i], &out))
+				return (vec_token_free(input), vec_token_free(out), ERROR);
+		}
+		else
+			vec_token_push(&out, token_clone(&input.buffer[i]));
+		i++;
+	}
+	vec_token_free(input);
+	return (*output = out, NO_ERROR);
+}
--- a/parser/src/passes/fold_expansion.c
+++ b/parser/src/passes/fold_expansion.c
@ -0,0 +1,54 @@
+/* ************************************************************************** */
+/*                                                                            */
+/*                                                        :::      ::::::::   */
+/*   fold_expansion.c                                   :+:      :+:    :+:   */
+/*                                                    +:+ +:+         +:+     */
+/*   By: maiboyer <maiboyer@student.42.fr>          +#+  +:+       +#+        */
+/*                                                +#+#+#+#+#+   +#+           */
+/*   Created: 2024/10/02 19:04:32 by maiboyer          #+#    #+#             */
+/*   Updated: 2024/10/03 22:50:40 by maiboyer         ###   ########.fr       */
+/*                                                                            */
+/* ************************************************************************** */
+
+#include "me/types.h"
+#include "me/vec/vec_token.h"
+#include "parser/passes.h"
+#include "parser/token.h"
+
+/// Pass that folds a TOK_DOLLAR token with the token right after it.
+///
+/// When a TOK_DOLLAR is directly followed by a TOK_DOLLAR or a TOK_NQUOTE,
+/// the dollar is dropped and a clone of the following token is emitted
+/// with its type set to TOK_EXPENSION. Every other token (including a
+/// TOK_DOLLAR that is last in the vector) is cloned unchanged.
+///
+/// There are a few rules the rest of the tokenizer machinery assumes
+/// these functions follow:
+/// 	- the input vec WILL be freed when the function returns, even in
+/// 		case of error
+/// 	- the output vector isn't populated if the function returns an error,
+/// 		thus it shouldn't be freed in case of error
+/// 	- the output tokens may not be direct copies of the input tokens,
+/// 		but need to be cloned (different allocations for stuff)
+t_error ts_fold_expension(t_vec_token input, t_vec_token *output)
+{
+	t_vec_token	folded;
+	t_usize		idx;
+	t_token		*cur;
+	t_token		expansion;
+
+	folded = vec_token_new(input.len, token_free);
+	idx = 0;
+	while (idx < input.len)
+	{
+		cur = &input.buffer[idx];
+		// the length check comes first so cur[1] is never read out of bounds
+		if (idx + 1 < input.len && cur->type == TOK_DOLLAR \
+			&& (cur[1].type == TOK_DOLLAR || cur[1].type == TOK_NQUOTE))
+		{
+			idx++;
+			expansion = token_clone(&input.buffer[idx]);
+			expansion.type = TOK_EXPENSION;
+			vec_token_push(&folded, expansion);
+		}
+		else
+			vec_token_push(&folded, token_clone(cur));
+		idx++;
+	}
+	vec_token_free(input);
+	*output = folded;
+	return (NO_ERROR);
+}
--- a/parser/src/passes/template_file.c
+++ b/parser/src/passes/template_file.c
@ -6,7 +6,7 @@
 /*   By: maiboyer <maiboyer@student.42.fr>          +#+  +:+       +#+        */
 /*                                                +#+#+#+#+#+   +#+           */
 /*   Created: 2024/10/02 19:04:32 by maiboyer          #+#    #+#             */
-/*   Updated: 2024/10/03 21:37:04 by maiboyer         ###   ########.fr       */
+/*   Updated: 2024/10/03 22:23:40 by maiboyer         ###   ########.fr       */
 /*                                                                            */
 /* ************************************************************************** */

@ -25,7 +25,7 @@
 /// 		thus it shouldn't be freed in case of error
 /// 	- the output tokens may not be direct copy of the input tokens,
 /// 		but need to be cloned (different allocations for stuff)
-t_error	do_fuck_all(t_vec_token input, t_vec_token *output)
+t_error	ts_do_fuck_all(t_vec_token input, t_vec_token *output)
 {
 	t_vec_token	out;
 	t_usize		i;