go-rss/rss.go

100 lines
2.2 KiB
Go
Raw Normal View History

/**
* Simple RSS parser, tested with various feeds.
*/
2012-03-24 20:11:38 +00:00
package rss
import (
"encoding/xml"
"net/http"
"time"
2013-12-17 16:44:03 +00:00
2013-03-14 23:25:13 +00:00
"code.google.com/p/go-charset/charset"
2013-03-14 23:32:01 +00:00
_ "code.google.com/p/go-charset/data"
2012-03-24 20:11:38 +00:00
)
const (
wordpressDateFormat = "Mon, 02 Jan 2006 15:04:05 -0700"
)
type Fetcher interface {
Get(url string) (resp *http.Response, err error)
}
2012-03-28 15:35:35 +00:00
type Channel struct {
Title string `xml:"title"`
Link string `xml:"link"`
Description string `xml:"description"`
Language string `xml:"language"`
LastBuildDate Date `xml:"lastBuildDate"`
Item []Item `xml:"item"`
}
type ItemEnclosure struct {
URL string `xml:"url,attr"`
Type string `xml:"type,attr"`
2012-03-24 20:11:38 +00:00
}
type Item struct {
2012-03-28 15:35:35 +00:00
Title string `xml:"title"`
Link string `xml:"link"`
Comments string `xml:"comments"`
PubDate Date `xml:"pubDate"`
GUID string `xml:"guid"`
Category []string `xml:"category"`
Enclosure ItemEnclosure `xml:"enclosure"`
Description string `xml:"description"`
Content string `xml:"content"`
2012-03-24 20:11:38 +00:00
}
2012-03-28 15:35:35 +00:00
type Date string
func (self Date) Parse() (time.Time, error) {
t, err := self.ParseWithFormat(wordpressDateFormat)
2012-03-24 20:11:38 +00:00
if err != nil {
t, err = self.ParseWithFormat(time.RFC822) // RSS 2.0 spec
2012-03-24 20:11:38 +00:00
}
return t, err
}
func (self Date) ParseWithFormat(format string) (time.Time, error) {
return time.Parse(format, string(self))
}
2012-03-28 15:35:35 +00:00
func (self Date) Format(format string) (string, error) {
t, err := self.Parse()
2012-03-24 20:11:38 +00:00
if err != nil {
return "", err
}
return t.Format(format), nil
}
2012-03-28 15:35:35 +00:00
func (self Date) MustFormat(format string) string {
s, err := self.Format(format)
2012-03-24 20:11:38 +00:00
if err != nil {
return err.Error()
}
return s
}
2012-03-28 15:35:35 +00:00
func Read(url string) (*Channel, error) {
2014-02-27 00:57:03 +00:00
return ReadWithClient(url, http.DefaultClient)
}
func ReadWithClient(url string, client Fetcher) (*Channel, error) {
2014-02-27 00:57:03 +00:00
response, err := client.Get(url)
2012-03-24 20:11:38 +00:00
if err != nil {
return nil, err
}
defer response.Body.Close()
2013-03-14 23:25:13 +00:00
xmlDecoder := xml.NewDecoder(response.Body)
xmlDecoder.CharsetReader = charset.NewReader
2012-03-28 15:35:35 +00:00
2012-03-24 20:11:38 +00:00
var rss struct {
2012-03-28 15:35:35 +00:00
Channel Channel `xml:"channel"`
2012-03-24 20:11:38 +00:00
}
2014-02-27 00:57:03 +00:00
if err = xmlDecoder.Decode(&rss); err != nil {
2012-03-24 20:11:38 +00:00
return nil, err
}
return &rss.Channel, nil
}