Compare commits
2 Commits
Author | SHA1 | Date |
---|---|---|
|
6f29ac4b03 | |
|
5e0a725deb |
24
main.go
24
main.go
|
@ -98,6 +98,15 @@ func splitFeeds() []string {
|
||||||
return feeds
|
return feeds
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func fetchLoop(feeds []string, db *nomad.DB) {
|
||||||
|
for _, feed := range feeds {
|
||||||
|
log.Infof("fetching items for feed %s", feed)
|
||||||
|
if err := fetchItems(db, feed, false); err != nil {
|
||||||
|
log.Errln(err)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
func main() {
|
func main() {
|
||||||
var (
|
var (
|
||||||
configFile string
|
configFile string
|
||||||
|
@ -105,12 +114,14 @@ func main() {
|
||||||
initDB bool
|
initDB bool
|
||||||
level string
|
level string
|
||||||
markOnly bool
|
markOnly bool
|
||||||
|
singleRun bool
|
||||||
)
|
)
|
||||||
|
|
||||||
flag.StringVar(&configFile, "f", defaultPath("nlink.conf"), "`path` to config file")
|
flag.StringVar(&configFile, "f", defaultPath("nlink.conf"), "`path` to config file")
|
||||||
flag.BoolVar(&initDB, "i", false, "initialize a new DB")
|
flag.BoolVar(&initDB, "i", false, "initialize a new DB")
|
||||||
flag.StringVar(&level, "l", "DEBUG", "log level")
|
flag.StringVar(&level, "l", "DEBUG", "log level")
|
||||||
flag.BoolVar(&markOnly, "m", false, "only mark posts as having been posted")
|
flag.BoolVar(&markOnly, "m", false, "only mark posts as having been posted")
|
||||||
|
flag.BoolVar(&singleRun, "s", false, "only go through a single run")
|
||||||
flag.DurationVar(&interval, "t", defaultInterval, "interval between fetching posts")
|
flag.DurationVar(&interval, "t", defaultInterval, "interval between fetching posts")
|
||||||
flag.Parse()
|
flag.Parse()
|
||||||
|
|
||||||
|
@ -167,15 +178,16 @@ func main() {
|
||||||
return
|
return
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if singleRun {
|
||||||
|
log.Debugf("running a single loop")
|
||||||
|
fetchLoop(feeds, db)
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
log.Debugf("will look for new items every %s\n", interval)
|
log.Debugf("will look for new items every %s\n", interval)
|
||||||
for {
|
for {
|
||||||
log.Infoln("running fetch loop")
|
log.Infoln("running fetch loop")
|
||||||
for _, feed := range feeds {
|
fetchLoop(feeds, db)
|
||||||
log.Infof("fetching items for feed %s", feed)
|
|
||||||
if err := fetchItems(db, feed, markOnly); err != nil {
|
|
||||||
log.Errln(err)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
time.Sleep(interval)
|
time.Sleep(interval)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -4,14 +4,26 @@ import (
|
||||||
"bytes"
|
"bytes"
|
||||||
"errors"
|
"errors"
|
||||||
"fmt"
|
"fmt"
|
||||||
|
"net/url"
|
||||||
"path/filepath"
|
"path/filepath"
|
||||||
|
|
||||||
"git.sr.ht/~thrrgilag/woodstock"
|
"git.sr.ht/~thrrgilag/woodstock"
|
||||||
|
"git.wntrmute.dev/kyle/goutils/log"
|
||||||
"github.com/anaskhan96/soup"
|
"github.com/anaskhan96/soup"
|
||||||
)
|
)
|
||||||
|
|
||||||
func nomadLink(url Source) string {
|
func nomadLink(item Item) string {
|
||||||
return fmt.Sprintf("[nomad.wntrmute.net](%s)", url.ID())
|
if item.Title != "" {
|
||||||
|
return fmt.Sprintf("[%s](%s)", item.Title, item.URL.ID())
|
||||||
|
}
|
||||||
|
|
||||||
|
u, err := url.Parse(item.URL.ID())
|
||||||
|
if err != nil {
|
||||||
|
log.Errf("nomadLink: %s", err)
|
||||||
|
return fmt.Sprintf("[%s](%s)", item.URL.ID(), item.URL.ID())
|
||||||
|
}
|
||||||
|
|
||||||
|
return fmt.Sprintf("[%s](%s)", u.Host, item.URL.ID())
|
||||||
}
|
}
|
||||||
|
|
||||||
type sel struct {
|
type sel struct {
|
||||||
|
@ -22,6 +34,23 @@ func selector(selectors ...string) sel {
|
||||||
return sel{selectors: selectors}
|
return sel{selectors: selectors}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
type imageFinder func(soup.Root) (string, bool)
|
||||||
|
|
||||||
|
var imageFinders = []imageFinder{
|
||||||
|
func(root soup.Root) (string, bool) {
|
||||||
|
return find(
|
||||||
|
root, "src",
|
||||||
|
selector("div", "class", "entry-image"),
|
||||||
|
selector("img"))
|
||||||
|
},
|
||||||
|
func(root soup.Root) (string, bool) {
|
||||||
|
return find(
|
||||||
|
root, "src",
|
||||||
|
selector("div", "class", "gh-inner"),
|
||||||
|
selector("img"))
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
func find(root soup.Root, attr string, selectors ...sel) (string, bool) {
|
func find(root soup.Root, attr string, selectors ...sel) (string, bool) {
|
||||||
result := root
|
result := root
|
||||||
for _, selector := range selectors {
|
for _, selector := range selectors {
|
||||||
|
@ -41,16 +70,18 @@ func find(root soup.Root, attr string, selectors ...sel) (string, bool) {
|
||||||
}
|
}
|
||||||
|
|
||||||
type Post struct {
|
type Post struct {
|
||||||
|
Title string
|
||||||
Image Source
|
Image Source
|
||||||
Body string
|
Body string
|
||||||
URL Source
|
URL Source
|
||||||
}
|
}
|
||||||
|
|
||||||
func NewPost(item Item) Post {
|
func NewPost(item Item) Post {
|
||||||
return Post{
|
post := Post{
|
||||||
Body: nomadLink(item.URL),
|
Body: nomadLink(item),
|
||||||
URL: item.URL,
|
URL: item.URL,
|
||||||
}
|
}
|
||||||
|
return post
|
||||||
}
|
}
|
||||||
|
|
||||||
func (p *Post) Fetch() error {
|
func (p *Post) Fetch() error {
|
||||||
|
@ -65,10 +96,15 @@ func (p *Post) Fetch() error {
|
||||||
p.Body = body + " " + p.Body
|
p.Body = body + " " + p.Body
|
||||||
}
|
}
|
||||||
|
|
||||||
imageURL, hasImageURL := find(
|
var imageURL string
|
||||||
root, "src",
|
var hasImageURL bool
|
||||||
selector("div", "class", "entry-image"),
|
|
||||||
selector("img"))
|
for _, finder := range imageFinders {
|
||||||
|
imageURL, hasImageURL = finder(root)
|
||||||
|
if hasImageURL {
|
||||||
|
break
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
if hasImageURL {
|
if hasImageURL {
|
||||||
p.Image = NewURLSource(imageURL)
|
p.Image = NewURLSource(imageURL)
|
||||||
|
|
Loading…
Reference in New Issue