mirror of https://github.com/Squidex/squidex.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
97 lines
2.7 KiB
97 lines
2.7 KiB
// ==========================================================================
|
|
// Squidex Headless CMS
|
|
// ==========================================================================
|
|
// Copyright (c) Squidex UG (haftungsbeschraenkt)
|
|
// All rights reserved. Licensed under the MIT license.
|
|
// ==========================================================================
|
|
|
|
using System.Text;
|
|
using HtmlAgilityPack;
|
|
using Markdig;
|
|
|
|
namespace Squidex.Domain.Apps.Core
|
|
{
|
|
public static class TextHelpers
|
|
{
|
|
public static string Markdown2Text(string markdown)
|
|
{
|
|
return Markdown.ToPlainText(markdown).Trim(' ', '\n', '\r');
|
|
}
|
|
|
|
public static string Html2Text(string html)
|
|
{
|
|
var document = LoadHtml(html);
|
|
|
|
var sb = new StringBuilder();
|
|
|
|
WriteTextTo(document.DocumentNode, sb);
|
|
|
|
return sb.ToString().Trim(' ', '\n', '\r');
|
|
}
|
|
|
|
private static HtmlDocument LoadHtml(string text)
|
|
{
|
|
var document = new HtmlDocument();
|
|
|
|
document.LoadHtml(text);
|
|
|
|
return document;
|
|
}
|
|
|
|
private static void WriteTextTo(HtmlNode node, StringBuilder sb)
|
|
{
|
|
switch (node.NodeType)
|
|
{
|
|
case HtmlNodeType.Comment:
|
|
break;
|
|
case HtmlNodeType.Document:
|
|
WriteChildrenTextTo(node, sb);
|
|
break;
|
|
case HtmlNodeType.Text:
|
|
var html = ((HtmlTextNode)node).Text;
|
|
|
|
if (HtmlNode.IsOverlappedClosingElement(html))
|
|
{
|
|
break;
|
|
}
|
|
|
|
if (!string.IsNullOrWhiteSpace(html))
|
|
{
|
|
sb.Append(HtmlEntity.DeEntitize(html));
|
|
}
|
|
|
|
break;
|
|
|
|
case HtmlNodeType.Element:
|
|
switch (node.Name)
|
|
{
|
|
case "p":
|
|
sb.AppendLine();
|
|
break;
|
|
case "br":
|
|
sb.AppendLine();
|
|
break;
|
|
case "style":
|
|
return;
|
|
case "script":
|
|
return;
|
|
}
|
|
|
|
if (node.HasChildNodes)
|
|
{
|
|
WriteChildrenTextTo(node, sb);
|
|
}
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
private static void WriteChildrenTextTo(HtmlNode node, StringBuilder sb)
|
|
{
|
|
foreach (var child in node.ChildNodes)
|
|
{
|
|
WriteTextTo(child, sb);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|