kontur-courses · Kostornoj-Dmitrij · Nov 25, 2024 · Nov 30, 2024 · Dec 7, 2024 · Dec 9, 2024
diff --git a/cs/Markdown/Markdown.csproj b/cs/Markdown/Markdown.csproj
@@ -0,0 +1,9 @@
+<Project Sdk="Microsoft.NET.Sdk">
+
+    <!-- Build settings for the Markdown project: targets .NET 8 with implicit usings
+         and nullable reference type annotations enabled. -->
+    <PropertyGroup>
+        <TargetFramework>net8.0</TargetFramework>
+        <ImplicitUsings>enable</ImplicitUsings>
+        <Nullable>enable</Nullable>
+    </PropertyGroup>
+
+</Project>
diff --git a/cs/Markdown/Md.cs b/cs/Markdown/Md.cs
@@ -0,0 +1,20 @@
+using Markdown.Parsers;
+using Markdown.Renderers;
+
+namespace Markdown;
+
+/// <summary>
+/// Entry point of the library: converts Markdown text to HTML by parsing it into tokens
+/// and handing those tokens to an <see cref="HtmlRenderer"/>.
+/// </summary>
+public class Md
+{
+    // One renderer instance is created per Md object and reused for every Render call.
+    private readonly HtmlRenderer renderer = new();
+
+    /// <summary>
+    /// Parses <paramref name="markdownText"/> and renders the resulting tokens as HTML.
+    /// </summary>
+    /// <param name="markdownText">Markdown source text.</param>
+    /// <returns>The HTML string produced by the renderer.</returns>
+    public string Render(string markdownText) =>
+        renderer.Render(MarkdownParser.ParseTokens(markdownText));
+}
diff --git a/cs/Markdown/Parsers/MarkdownParser.cs b/cs/Markdown/Parsers/MarkdownParser.cs
@@ -0,0 +1,211 @@
+using Markdown.Tokens;
+
+namespace Markdown.Parsers;
+
+/// <summary>
+/// Turns Markdown text into a sequence of <see cref="Token"/> trees.
+/// Recognised syntax: <c>_emphasis_</c>, <c>__strong__</c>, a <c># </c> header at the start of a line,
+/// and backslash escapes for <c>_</c>, <c>#</c> and <c>\</c>.
+/// </summary>
+public abstract class MarkdownParser
+{
+    private const string EmphasisDelimiter = "_";
+    private const string StrongDelimiter = "__";
+
+    /// <summary>
+    /// Parses <paramref name="markdownText"/> into top-level tokens in document order.
+    /// </summary>
+    /// <param name="markdownText">Markdown source text.</param>
+    /// <returns>The top-level tokens; nested formatting is stored in each token's children.</returns>
+    /// <exception cref="ArgumentNullException"><paramref name="markdownText"/> is <c>null</c>.</exception>
+    public static IEnumerable<Token> ParseTokens(string markdownText)
+    {
+        ArgumentNullException.ThrowIfNull(markdownText);
+
+        var context = new MarkdownParseContext
+        {
+            MarkdownText = markdownText
+        };
+
+        while (context.CurrentIndex < context.MarkdownText.Length)
+        {
+            var current = context.MarkdownText[context.CurrentIndex];
+            // '\0' stands in for "no next character" at the end of the input.
+            var next = context.CurrentIndex + 1 < context.MarkdownText.Length
+                ? context.MarkdownText[context.CurrentIndex + 1]
+                : '\0';
+
+            switch (current)
+            {
+                case '\\':
+                    HandleEscapeCharacter(next, context);
+                    break;
+                case '_':
+                    if (next == '_')
+                        HandleDelimiter(context, StrongDelimiter, TokenType.Strong);
+                    else
+                        HandleDelimiter(context, EmphasisDelimiter, TokenType.Emphasis);
+                    break;
+                case '#' when IsLineStart(context) && next == ' ':
+                    context.HeaderLevel = HandleHeaderToken(context);
+                    break;
+                default:
+                    context.Buffer.Append(current);
+                    context.CurrentIndex++;
+                    break;
+            }
+        }
+
+        // Emit whatever is still buffered and turn never-closed spans back into literal text,
+        // so no part of the input is dropped.
+        FlushPendingContent(context);
+        return context.Tokens;
+    }
+
+    /// <summary>True when the current position is the first character of the text or follows a line feed.</summary>
+    private static bool IsLineStart(MarkdownParseContext context) =>
+        context.CurrentIndex == 0 || context.MarkdownText[context.CurrentIndex - 1] == '\n';
+
+    /// <summary>
+    /// Handles a backslash. Before <c>_</c> or <c>#</c> the backslash is dropped and the escaped
+    /// character is buffered as plain text; before anything else the backslash itself is kept.
+    /// </summary>
+    private static void HandleEscapeCharacter(char next, MarkdownParseContext context)
+    {
+        if (next is '_' or '#' or '\\')
+        {
+            // NOTE(review): for an escaped backslash ("\\") both characters are consumed and
+            // nothing is emitted - confirm this is intended rather than emitting a single '\'.
+            if (next != '\\')
+                context.Buffer.Append(next);
+            context.CurrentIndex += 2;
+        }
+        else
+        {
+            context.Buffer.Append('\\');
+            context.CurrentIndex++;
+        }
+    }
+
+    /// <summary>
+    /// Handles an emphasis or strong delimiter at the current position: opens or closes a token
+    /// when the position is a valid boundary, otherwise keeps the delimiter as plain text.
+    /// </summary>
+    private static void HandleDelimiter(MarkdownParseContext context, string delimiter, TokenType type)
+    {
+        if (IsValidBoundary(context, delimiter))
+            HandleTokenBoundary(context, type);
+        else
+            context.Buffer.Append(delimiter);
+
+        context.CurrentIndex += delimiter.Length;
+    }
+
+    /// <summary>
+    /// Parses a header that starts at the current position and runs to the end of the line.
+    /// The header body is parsed recursively so it may contain inline formatting.
+    /// </summary>
+    /// <returns>The number of leading <c>#</c> characters that were consumed.</returns>
+    private static int HandleHeaderToken(MarkdownParseContext context)
+    {
+        var text = context.MarkdownText;
+
+        // Count into a local: accumulating in the shared context made every later header
+        // in the same text one level deeper than the previous one.
+        var level = 0;
+        while (context.CurrentIndex < text.Length && text[context.CurrentIndex] == '#')
+        {
+            level++;
+            context.CurrentIndex++;
+        }
+
+        if (context.CurrentIndex >= text.Length || text[context.CurrentIndex] != ' ')
+        {
+            // Not a header after all: keep the consumed markers as plain text.
+            context.Buffer.Append('#', level);
+            return level;
+        }
+
+        context.CurrentIndex++;
+
+        // A header starts a new block. Anything pending - including inline spans that are still
+        // open - is emitted first so that the output keeps the order of the input.
+        FlushPendingContent(context);
+
+        var headerEnd = text.IndexOf('\n', context.CurrentIndex);
+        if (headerEnd == -1)
+            headerEnd = text.Length;
+
+        var headerToken = new Token(TokenType.Header)
+        {
+            HeaderLevel = level
+        };
+        headerToken.Children.AddRange(ParseTokens(text[context.CurrentIndex..headerEnd]));
+        context.Tokens.Add(headerToken);
+
+        // Leave the line feed (if any) for the main loop to emit as ordinary text.
+        context.CurrentIndex = headerEnd;
+        return level;
+    }
+
+    /// <summary>
+    /// Opens a new token of <paramref name="type"/>, or closes the innermost open token when it
+    /// has the same type. Buffered text is emitted first so it lands before the boundary.
+    /// </summary>
+    private static void HandleTokenBoundary(MarkdownParseContext context, TokenType type)
+    {
+        AddToken(context, TokenType.Text);
+
+        if (context.Stack.Count == 0 || context.Stack.Peek().Type != type)
+        {
+            context.Stack.Push(new Token(type));
+            return;
+        }
+
+        var completedToken = context.Stack.Pop();
+        GetCurrentContainer(context).Add(completedToken);
+    }
+
+    /// <summary>
+    /// Emits the buffered text (if any) as a token of <paramref name="type"/> into the innermost
+    /// open token, or into the top-level list when nothing is open, and clears the buffer.
+    /// </summary>
+    private static void AddToken(MarkdownParseContext context, TokenType type)
+    {
+        if (context.Buffer.Length == 0)
+            return;
+
+        var token = new Token(type, context.Buffer.ToString());
+        context.Buffer.Clear();
+        GetCurrentContainer(context).Add(token);
+    }
+
+    /// <summary>
+    /// Emits the buffered text and then converts every still-open token back into literal text:
+    /// its delimiter followed by the children collected so far. Without this, the content of a
+    /// span that never closes would be lost.
+    /// </summary>
+    private static void FlushPendingContent(MarkdownParseContext context)
+    {
+        AddToken(context, TokenType.Text);
+
+        // Unwind from the innermost token outwards; appending to the parent keeps document order.
+        while (context.Stack.Count > 0)
+        {
+            var unclosed = context.Stack.Pop();
+            var container = GetCurrentContainer(context);
+            container.Add(new Token(TokenType.Text, GetDelimiter(unclosed.Type)));
+            container.AddRange(unclosed.Children);
+        }
+    }
+
+    /// <summary>The list new tokens go to: the innermost open token's children, else the top level.</summary>
+    private static List<Token> GetCurrentContainer(MarkdownParseContext context) =>
+        context.Stack.Count > 0 ? context.Stack.Peek().Children : context.Tokens;
+
+    /// <summary>Source delimiter of an inline token type (only emphasis and strong are ever opened).</summary>
+    private static string GetDelimiter(TokenType type) =>
+        type == TokenType.Strong ? StrongDelimiter : EmphasisDelimiter;
+
+    /// <summary>
+    /// Decides whether <paramref name="delimiter"/> at the current position opens or closes a token.
+    /// While a token is open, the delimiter is accepted only if some text has been buffered since
+    /// the last boundary and it is not surrounded by letters/digits on both sides. When nothing is
+    /// open, a later occurrence of the delimiter must exist, the span must be non-empty, and neither
+    /// the character before the opener nor the one after the closer may be a letter or digit.
+    /// </summary>
+    private static bool IsValidBoundary(MarkdownParseContext context, string delimiter)
+    {
+        var index = context.CurrentIndex;
+        var text = context.MarkdownText;
+
+        if (context.Stack.Count > 0)
+        {
+            if (context.Buffer.Length == 0)
+                return false;
+            if (index == 0 || index == text.Length - 1)
+                return true;
+            return !char.IsLetterOrDigit(text[index - 1]) ||
+                   !char.IsLetterOrDigit(text[index + 1]);
+        }
+
+        var closingIndex = text.IndexOf(delimiter, index + delimiter.Length, StringComparison.Ordinal);
+        if (closingIndex == -1)
+            return false;
+
+        var afterClosing = closingIndex + delimiter.Length;
+        var isInsideWord = (index > 0 && char.IsLetterOrDigit(text[index - 1])) ||
+                           (afterClosing < text.Length && char.IsLetterOrDigit(text[afterClosing]));
+        if (isInsideWord)
+            return false;
+
+        // Require at least one character between the opening and closing delimiters.
+        return closingIndex - index > delimiter.Length;
+    }
+}
diff --git a/cs/Markdown/Parsers/MarkdownParserContext.cs b/cs/Markdown/Parsers/MarkdownParserContext.cs
@@ -0,0 +1,13 @@
+using Markdown.Tokens;
+using System.Text;
+namespace Markdown.Parsers;
+
+/// <summary>
+/// Mutable state shared by the parser's helper methods while a single text is being parsed.
+/// </summary>
+public class MarkdownParseContext
+{
+    /// <summary>Source text being parsed.</summary>
+    public string MarkdownText { get; set; } = "";
+
+    /// <summary>Position in <see cref="MarkdownText"/> of the next character to process.</summary>
+    public int CurrentIndex { get; set; }
+
+    /// <summary>Plain text collected since the last token was emitted.</summary>
+    public StringBuilder Buffer { get; set; } = new StringBuilder();
+
+    /// <summary>Tokens that have been opened but not closed yet, innermost on top.</summary>
+    public Stack<Token> Stack { get; set; } = new Stack<Token>();
+
+    /// <summary>Completed top-level tokens.</summary>
+    public List<Token> Tokens { get; set; } = new List<Token>();
+
+    /// <summary>Header level bookkeeping written by the parser when it handles '#' header markers.</summary>
+    public int HeaderLevel { get; set; }
+}
diff --git a/cs/Markdown/Renderers/HtmlRenderer.cs b/cs/Markdown/Renderers/HtmlRenderer.cs
@@ -0,0 +1,59 @@
+using System.Text;
+using Markdown.Tokens;
+
+namespace Markdown.Renderers;
+
+/// <summary>
+/// Renders a token tree as HTML: emphasis becomes <c>em</c>, strong becomes <c>strong</c>,
+/// a header becomes <c>hN</c> (N is the token's header level); any other token is written
+/// out as its raw content.
+/// </summary>
+public class HtmlRenderer
+{
+    /// <summary>Renders <paramref name="tokens"/> in order and returns the concatenated HTML.</summary>
+    /// <param name="tokens">Top-level tokens to render.</param>
+    /// <returns>The HTML produced for all tokens.</returns>
+    public string Render(IEnumerable<Token> tokens)
+    {
+        var html = new StringBuilder();
+        foreach (var token in tokens)
+            RenderToken(token, html);
+
+        return html.ToString();
+    }
+
+    /// <summary>Appends the HTML for one token (and, recursively, its children) to <paramref name="html"/>.</summary>
+    private void RenderToken(Token token, StringBuilder html)
+    {
+        // Tag name for container tokens; null means "write the content as is".
+        string? tag = token.Type switch
+        {
+            TokenType.Emphasis => "em",
+            TokenType.Strong => "strong",
+            TokenType.Header => $"h{token.HeaderLevel}",
+            _ => null
+        };
+
+        if (tag is null)
+        {
+            html.Append(token.Content);
+            return;
+        }
+
+        html.Append('<').Append(tag).Append('>');
+        RenderChildren(token, html);
+        html.Append("</").Append(tag).Append('>');
+    }
+
+    /// <summary>Renders the token's children, or its own content when it has no children.</summary>
+    private void RenderChildren(Token token, StringBuilder html)
+    {
+        if (token.Children.Count == 0)
+        {
+            html.Append(token.Content);
+            return;
+        }
+
+        foreach (var child in token.Children)
+            RenderToken(child, html);
+    }
+}
diff --git a/cs/Markdown/Tokens/Token.cs b/cs/Markdown/Tokens/Token.cs
@@ -0,0 +1,23 @@
+namespace Markdown.Tokens;
+
+/// <summary>
+/// A node of the parsed Markdown tree: either a leaf carrying text in <see cref="Content"/>
+/// or a container whose nested tokens are stored in <see cref="Children"/>.
+/// </summary>
+public class Token
+{
+    private const int DefaultHeaderLevel = 1;
+
+    /// <summary>Kind of the token.</summary>
+    public TokenType Type { get; }
+
+    /// <summary>Raw text of the token; empty for tokens created without content.</summary>
+    public string Content { get; set; }
+
+    /// <summary>Nested tokens, in document order.</summary>
+    public List<Token> Children { get; }
+
+    /// <summary>
+    /// Level used for the <c>hN</c> tag when the token is a header. Defaults to 1 regardless of
+    /// which constructor is used, so a header created without an explicit level never ends up
+    /// with level 0.
+    /// </summary>
+    public int HeaderLevel { get; init; } = DefaultHeaderLevel;
+
+    /// <summary>Creates a token with the given content and, optionally, an existing child list.</summary>
+    /// <param name="type">Kind of the token.</param>
+    /// <param name="content">Raw text of the token.</param>
+    /// <param name="children">Child list to use; a new empty list is created when <c>null</c>.</param>
+    public Token(TokenType type, string content, List<Token>? children = null)
+    {
+        Type = type;
+        Content = content;
+        Children = children ?? [];
+    }
+
+    /// <summary>Creates a token with empty content and no children.</summary>
+    /// <param name="type">Kind of the token.</param>
+    public Token(TokenType type) : this(type, string.Empty)
+    {
+    }
+}
diff --git a/cs/Markdown/Tokens/TokenType.cs b/cs/Markdown/Tokens/TokenType.cs
@@ -0,0 +1,9 @@
+namespace Markdown.Tokens;
+
+/// <summary>Kinds of tokens produced by the Markdown parser.</summary>
+public enum TokenType
+{
+    /// <summary>Plain text.</summary>
+    Text = 0,
+
+    /// <summary>Emphasised span (rendered as <c>em</c>).</summary>
+    Emphasis = 1,
+
+    /// <summary>Strong span (rendered as <c>strong</c>).</summary>
+    Strong = 2,
+
+    /// <summary>Header line (rendered as <c>hN</c>).</summary>
+    Header = 3
+}