miniflux-v2/internal/reader/sanitizer/strip_tags.go

35 lines
792 B
Go
Raw Normal View History

// SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved.
// SPDX-License-Identifier: Apache-2.0
2017-11-20 06:10:04 +01:00
package sanitizer // import "miniflux.app/v2/internal/reader/sanitizer"
2017-11-20 06:10:04 +01:00
import (
"bytes"
"io"
"golang.org/x/net/html"
)
// StripTags removes all HTML/XML tags from the input string.
2024-02-27 13:23:47 +01:00
// This function must *only* be used for cosmetic purposes, not to prevent code injections like XSS.
2017-11-20 06:10:04 +01:00
func StripTags(input string) string {
tokenizer := html.NewTokenizer(bytes.NewBufferString(input))
var buffer bytes.Buffer
for {
if tokenizer.Next() == html.ErrorToken {
err := tokenizer.Err()
if err == io.EOF {
return buffer.String()
}
return ""
}
token := tokenizer.Token()
if token.Type == html.TextToken {
2017-11-20 06:10:04 +01:00
buffer.WriteString(token.Data)
}
}
}