about | summary | refs | log | tree | commit | diff | homepage
path: root/reader/atom
diff options
context:
space:
mode:
author: Frédéric Guillot <fred@miniflux.net> 2019-09-18 22:27:25 -0700
committer: Frédéric Guillot <fred@miniflux.net> 2019-09-18 22:45:56 -0700
commit 36d773223481dd42d31499b3ea73e6999ff9f58e (patch)
tree a122e207303b2fa33b334dbe19e57a508a955a25 /reader/atom
parent ca48f7612ada5d64d1097c40321a919eb28eb2bf (diff)
Disable strict XML parsing
This change should improve parsing of broken XML feeds. See https://golang.org/pkg/encoding/xml/#Decoder
Diffstat (limited to 'reader/atom')
-rw-r--r-- reader/atom/parser.go 1
-rw-r--r-- reader/atom/parser_test.go 19
2 files changed, 20 insertions, 0 deletions
diff --git a/reader/atom/parser.go b/reader/atom/parser.go
index 85be4b5..4749c1a 100644
--- a/reader/atom/parser.go
+++ b/reader/atom/parser.go
@@ -18,6 +18,7 @@ func Parse(data io.Reader) (*model.Feed, *errors.LocalizedError) {
atomFeed := new(atomFeed)
decoder := xml.NewDecoder(data)
decoder.Entity = xml.HTMLEntity
+ decoder.Strict = false
decoder.CharsetReader = encoding.CharsetReader
err := decoder.Decode(atomFeed)
diff --git a/reader/atom/parser_test.go b/reader/atom/parser_test.go
index dc42575..746c767 100644
--- a/reader/atom/parser_test.go
+++ b/reader/atom/parser_test.go
@@ -577,3 +577,22 @@ func TestParseWithHTMLEntity(t *testing.T) {
t.Errorf(`Incorrect title, got: %q`, feed.Title)
}
}
+
+func TestParseWithInvalidCharacterEntity(t *testing.T) {
+ data := `
+ <?xml version="1.0" encoding="utf-8"?>
+ <feed xmlns="http://www.w3.org/2005/Atom">
+ <title>Example Feed</title>
+ <link href="http://example.org/a&b"/>
+ </feed>
+ `
+
+ feed, err := Parse(bytes.NewBufferString(data))
+ if err != nil {
+ t.Fatal(err)
+ }
+
+ if feed.SiteURL != "http://example.org/a&b" {
+ t.Errorf(`Incorrect URL, got: %q`, feed.SiteURL)
+ }
+}