mirror of
https://github.com/Theodor-Springmann-Stiftung/hamann-ausgabe-core.git
synced 2025-10-30 01:35:32 +00:00
- Abstracted the XML-HTML Parser into a neat little state machine
- Added Settings classes for all things XML-HTML conversion
This commit is contained in:
136
HaWeb/HTMLParser/XMLHelper.cs
Normal file
136
HaWeb/HTMLParser/XMLHelper.cs
Normal file
@@ -0,0 +1,136 @@
|
||||
namespace HaWeb.HTMLParser;
|
||||
using HaXMLReader.Interfaces;
|
||||
using HaXMLReader.EvArgs;
|
||||
using System.Text;
|
||||
using System.Collections.Generic;
|
||||
using System;
|
||||
|
||||
public class XMLHelper<T> where T : IState
|
||||
{
|
||||
private IReader _in;
|
||||
private StringBuilder _target;
|
||||
private List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? _OTag_Funcs;
|
||||
private List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? _STag_Funcs;
|
||||
private List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? _CTag_Funcs;
|
||||
private List<(Func<Text, XMLHelper<T>, bool>, Action<StringBuilder, Text, XMLHelper<T>>)>? _Text_Funcs;
|
||||
private List<(Func<Whitespace, XMLHelper<T>, bool>, Action<StringBuilder, Whitespace, XMLHelper<T>>)>? _WS_Funcs;
|
||||
private bool _deleteLeadingWS;
|
||||
private bool _deleteTrailingWS;
|
||||
|
||||
public T State;
|
||||
public Stack<Tag> OpenTags;
|
||||
public Dictionary<string, List<Tag>> LastSingleTags;
|
||||
public StringBuilder LastText;
|
||||
|
||||
public XMLHelper(
|
||||
T state,
|
||||
IReader input,
|
||||
StringBuilder target,
|
||||
List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? OTag_Funcs = null,
|
||||
List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? STag_Funcs = null,
|
||||
List<(Func<Tag, XMLHelper<T>, bool>, Action<StringBuilder, Tag, XMLHelper<T>>)>? CTag_Funcs = null,
|
||||
List<(Func<Text, XMLHelper<T>, bool>, Action<StringBuilder, Text, XMLHelper<T>>)>? Text_Funcs = null,
|
||||
List<(Func<Whitespace, XMLHelper<T>, bool>, Action<StringBuilder, Whitespace, XMLHelper<T>>)>? WS_Funcs = null,
|
||||
bool deleteLeadingWS = false,
|
||||
bool deleteTrailingWS = false
|
||||
)
|
||||
{
|
||||
if (input == null || target == null || state == null) throw new ArgumentNullException();
|
||||
|
||||
State = state;
|
||||
_in = input;
|
||||
_target = target;
|
||||
_deleteLeadingWS = deleteLeadingWS;
|
||||
_deleteTrailingWS = deleteTrailingWS;
|
||||
|
||||
_OTag_Funcs = OTag_Funcs;
|
||||
_STag_Funcs = STag_Funcs;
|
||||
_CTag_Funcs = CTag_Funcs;
|
||||
_Text_Funcs = Text_Funcs;
|
||||
_WS_Funcs = WS_Funcs;
|
||||
|
||||
OpenTags = new Stack<Tag>();
|
||||
LastSingleTags = new Dictionary<string, List<Tag>>();
|
||||
LastText = new StringBuilder();
|
||||
|
||||
if (_OTag_Funcs != null)
|
||||
_in.OpenTag += OnOTag;
|
||||
if (_STag_Funcs != null)
|
||||
_in.SingleTag += OnSTag;
|
||||
if (_CTag_Funcs != null)
|
||||
_in.CloseTag += OnCTag;
|
||||
if (_Text_Funcs != null)
|
||||
_in.Text += OnText;
|
||||
if (_WS_Funcs != null)
|
||||
_in.Whitespace += OnWS;
|
||||
}
|
||||
|
||||
void OnOTag(object _, Tag tag)
|
||||
{
|
||||
OpenTags.Push(tag);
|
||||
if (_OTag_Funcs != null)
|
||||
foreach (var entry in _OTag_Funcs)
|
||||
if (entry.Item1(tag, this)) entry.Item2(_target, tag, this);
|
||||
}
|
||||
|
||||
void OnText(object _, Text text)
|
||||
{
|
||||
if (_deleteLeadingWS) text.Value = text.Value.TrimStart();
|
||||
if (_deleteTrailingWS) text.Value = text.Value.TrimEnd();
|
||||
LastText.Append(text.Value);
|
||||
if (_Text_Funcs != null)
|
||||
foreach (var entry in _Text_Funcs)
|
||||
if (entry.Item1(text, this)) entry.Item2(_target, text, this);
|
||||
}
|
||||
|
||||
void OnSTag(object _, Tag tag)
|
||||
{
|
||||
if (!LastSingleTags.ContainsKey(tag.Name))
|
||||
LastSingleTags.Add(tag.Name, new List<Tag>());
|
||||
LastSingleTags[tag.Name].Add(tag);
|
||||
if (_STag_Funcs != null)
|
||||
foreach (var entry in _STag_Funcs)
|
||||
if (entry.Item1(tag, this)) entry.Item2(_target, tag, this);
|
||||
}
|
||||
|
||||
void OnCTag(object _, Tag tag)
|
||||
{
|
||||
OpenTags.Pop();
|
||||
if(_CTag_Funcs != null)
|
||||
foreach (var entry in _CTag_Funcs)
|
||||
if (entry.Item1(tag, this)) entry.Item2(_target, tag, this);
|
||||
}
|
||||
|
||||
void OnWS(object _, Whitespace ws)
|
||||
{
|
||||
LastText.Append(ws.Value);
|
||||
if (_WS_Funcs != null)
|
||||
foreach (var entry in _WS_Funcs)
|
||||
if (entry.Item1(ws, this)) entry.Item2(_target, ws, this);
|
||||
}
|
||||
|
||||
internal void Dispose()
|
||||
{
|
||||
OpenTags = null;
|
||||
LastSingleTags = null;
|
||||
LastText = null;
|
||||
if (_in != null)
|
||||
{
|
||||
if (_OTag_Funcs != null)
|
||||
_in.OpenTag -= OnOTag;
|
||||
if (_STag_Funcs != null)
|
||||
_in.SingleTag -= OnSTag;
|
||||
if (_CTag_Funcs != null)
|
||||
_in.CloseTag -= OnCTag;
|
||||
if (_Text_Funcs != null)
|
||||
_in.Text -= OnText;
|
||||
if (_WS_Funcs != null)
|
||||
_in.Whitespace -= OnWS;
|
||||
}
|
||||
}
|
||||
|
||||
~XMLHelper()
|
||||
{
|
||||
Dispose();
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user