mirror of
https://github.com/Theodor-Springmann-Stiftung/lenz-web.git
synced 2025-10-29 01:05:32 +00:00
Seitenumbrüche und Weißraum FIX
This commit is contained in:
155
helpers/functions/textparse.go
Normal file
155
helpers/functions/textparse.go
Normal file
@@ -0,0 +1,155 @@
|
||||
package functions
|
||||
|
||||
import (
|
||||
"strings"
|
||||
|
||||
xmlparsing "github.com/Theodor-Springmann-Stiftung/lenz-web/xml"
|
||||
)
|
||||
|
||||
type outType int
|
||||
|
||||
const (
|
||||
NA outType = iota
|
||||
Text
|
||||
Element
|
||||
EmptyElement
|
||||
EndElement
|
||||
)
|
||||
|
||||
type outToken struct {
|
||||
Type outType
|
||||
Name string
|
||||
Classes []string
|
||||
Id string
|
||||
Value string
|
||||
}
|
||||
|
||||
func (o *outToken) ClassesFromAttrs(attrs map[string]string) {
|
||||
if len(attrs) == 0 {
|
||||
return
|
||||
}
|
||||
for key, value := range attrs {
|
||||
o.Classes = append(o.Classes, key+"-"+value)
|
||||
}
|
||||
}
|
||||
|
||||
func Default(token xmlparsing.Token) outToken {
|
||||
o := outToken{}
|
||||
switch token.Type {
|
||||
case xmlparsing.StartElement:
|
||||
o.Name = "div"
|
||||
o.Type = Element
|
||||
o.Classes = []string{token.Name}
|
||||
o.ClassesFromAttrs(token.Attributes)
|
||||
case xmlparsing.EndElement:
|
||||
o.Type = EndElement
|
||||
case xmlparsing.CharData:
|
||||
o.Type = Text
|
||||
o.Value = token.Data
|
||||
}
|
||||
return o
|
||||
}
|
||||
|
||||
type LenzParseState struct {
|
||||
Out []outToken
|
||||
LC int
|
||||
PC string
|
||||
CloseElement bool
|
||||
}
|
||||
|
||||
func (s *LenzParseState) String() string {
|
||||
builder := strings.Builder{}
|
||||
for _, token := range s.Out {
|
||||
switch token.Type {
|
||||
case Text:
|
||||
builder.WriteString(token.Value)
|
||||
case Element:
|
||||
builder.WriteString("<")
|
||||
builder.WriteString(token.Name)
|
||||
if len(token.Classes) > 0 {
|
||||
builder.WriteString(" class=\"")
|
||||
builder.WriteString(strings.Join(token.Classes, " "))
|
||||
builder.WriteString("\"")
|
||||
}
|
||||
if len(token.Id) > 0 {
|
||||
builder.WriteString(" id=\"")
|
||||
builder.WriteString(token.Id)
|
||||
builder.WriteString("\"")
|
||||
}
|
||||
builder.WriteString(">")
|
||||
case EndElement:
|
||||
builder.WriteString("</div>")
|
||||
case EmptyElement:
|
||||
builder.WriteString("<")
|
||||
builder.WriteString(token.Name)
|
||||
if len(token.Classes) > 0 {
|
||||
builder.WriteString(" class=\"")
|
||||
builder.WriteString(strings.Join(token.Classes, " "))
|
||||
builder.WriteString("\"")
|
||||
}
|
||||
|
||||
if len(token.Id) > 0 {
|
||||
builder.WriteString(" id=\"")
|
||||
builder.WriteString(token.Id)
|
||||
builder.WriteString("\"")
|
||||
}
|
||||
builder.WriteString("/>")
|
||||
}
|
||||
}
|
||||
return builder.String()
|
||||
}
|
||||
|
||||
func ParseGeneric(s string) string {
|
||||
if len(s) == 0 {
|
||||
return ""
|
||||
}
|
||||
|
||||
ps := LenzParseState{CloseElement: true}
|
||||
|
||||
for elem, err := range xmlparsing.Iterate(s, ps) {
|
||||
if err != nil {
|
||||
return err.Error()
|
||||
}
|
||||
|
||||
if elem.Token.Type < 3 {
|
||||
if !ps.CloseElement && elem.Token.Type == xmlparsing.EndElement {
|
||||
ps.CloseElement = true
|
||||
continue
|
||||
} else if elem.Token.Type == xmlparsing.EndElement {
|
||||
ps.Out = append(ps.Out, Default(elem.Token))
|
||||
continue
|
||||
}
|
||||
|
||||
defaultToken := Default(elem.Token)
|
||||
switch elem.Token.Name {
|
||||
case "line":
|
||||
nt := outToken{
|
||||
Type: EmptyElement,
|
||||
Name: "br",
|
||||
}
|
||||
if val := elem.Token.Attributes["type"]; val != "empty" {
|
||||
ps.Out = append(ps.Out, nt)
|
||||
ps.LC += 1
|
||||
ps.Out = append(ps.Out, defaultToken)
|
||||
} else {
|
||||
nt.Classes = []string{"empty"}
|
||||
ps.Out = append(ps.Out, nt)
|
||||
ps.CloseElement = false
|
||||
}
|
||||
case "page":
|
||||
ps.LC = 0
|
||||
ps.PC = elem.Token.Attributes["index"]
|
||||
ps.Out = append(ps.Out, defaultToken)
|
||||
nt := outToken{
|
||||
Type: Text,
|
||||
Value: "[" + ps.PC + "]",
|
||||
}
|
||||
ps.Out = append(ps.Out, nt)
|
||||
default:
|
||||
ps.Out = append(ps.Out, defaultToken)
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return ps.String()
|
||||
}
|
||||
Reference in New Issue
Block a user