This commit is contained in:
Balakrishnan Balasubramanian 2022-05-02 23:23:56 -04:00
parent 55320df622
commit ccbf558fa1
7 changed files with 86 additions and 28 deletions

View File

@ -9,12 +9,12 @@
* ✓ Posting to telegram * ✓ Posting to telegram
* ✓ Telegram rate limit: 20 msgs/min https://core.telegram.org/bots/faq#my-bot-is-hitting-limits-how-do-i-avoid-this * ✓ Telegram rate limit: 20 msgs/min https://core.telegram.org/bots/faq#my-bot-is-hitting-limits-how-do-i-avoid-this
https://gist.github.com/zdebra/10f0e284c4672e99f0cb767298f20c11 https://gist.github.com/zdebra/10f0e284c4672e99f0cb767298f20c11
* First Run skip all but first n * ✓ First Run skip all but first n
* Folder creation * ✓ Folder creation
* ✓ Wrap content inside item
* Change flags to os.Args[1] for config path * Change flags to os.Args[1] for config path
* Cleanup * Cleanup
* Make Rhash optional * Make Rhash optional
* Wrap content inside item
## Issues ## Issues
* ✓ Last record is not written fully to csv: *Fixed*. Had to Flush writer * ✓ Last record is not written fully to csv: *Fixed*. Had to Flush writer

View File

@ -73,16 +73,34 @@ func ProcessFeed(feed FeedCfg, scheduler Scheduler, dbDir string, tgram telegram
scheduler.Good(feed.Name) scheduler.Good(feed.Name)
filteredEntries, err := db.Filter(entries) var records []Record
var newEntries []FeedEntry
if db.IsNewFeed() {
ftl := int(feed.FirstTimeLimit)
if feed.FirstTimeLimit == NoLimit || len(entries) <= ftl {
newEntries = entries
} else {
var filteredEntries []FeedEntry
newEntries, filteredEntries = entries[:ftl], entries[ftl:]
for _, entry := range filteredEntries {
records = append(records, Record{
Time: time.Now(),
Status: Filtered,
Filter: "FirstTime",
FeedEntry: entry,
})
}
}
} else {
newEntries, err = db.Filter(entries)
if err != nil { if err != nil {
log.Error("failed to filter entries", "feed", feed.Name, "error", err) log.Error("failed to filter entries", "feed", feed.Name, "error", err)
} }
}
var records []Record for _, entry := range newEntries {
for _, entry := range filteredEntries {
now := time.Now()
r := Record{ r := Record{
Time: now, Time: time.Now(),
FeedEntry: entry, FeedEntry: entry,
} }
err := tgram.SendLink(entry.Link, feed.Channel, feed.Rhash) err := tgram.SendLink(entry.Link, feed.Channel, feed.Rhash)

View File

@ -7,6 +7,10 @@ import (
"gopkg.in/yaml.v3" "gopkg.in/yaml.v3"
) )
type FeedLimit int
const NoLimit FeedLimit = -1
type FeedCfg struct { type FeedCfg struct {
Name string `yaml:"name"` Name string `yaml:"name"`
Channel string `yaml:"channel"` Channel string `yaml:"channel"`
@ -14,16 +18,18 @@ type FeedCfg struct {
Url string `yaml:"url"` Url string `yaml:"url"`
Cron string `yaml:"cron"` Cron string `yaml:"cron"`
Proxy string `yaml:"proxy"` Proxy string `yaml:"proxy"`
FTL *int `yaml:"first_time_limit"`
FirstTimeLimit FeedLimit `yaml:"-"`
} }
type Config struct { type Config struct {
Proxy string `yaml:"proxy"` Proxy string `yaml:"proxy"`
TelegramProxy string `yaml:"telegram_proxy"` TelegramProxy string `yaml:"telegram_proxy"`
//TODO: read from credential file TelegramAuthToken string `yaml:"telegram_auth_token"` //TODO: read from credential file
TelegramAuthToken string `yaml:"telegram_auth_token"`
DataDir string `yaml:"data_dir"` DataDir string `yaml:"data_dir"`
LastSuccessPath string `yaml:"last_loaded_path"` LastSuccessPath string `yaml:"last_loaded_path"`
DbDir string `yaml:"db_dir"` DbDir string `yaml:"db_dir"`
FTL *int `yaml:"first_time_limit"`
Feeds []FeedCfg `yaml:"feeds"` Feeds []FeedCfg `yaml:"feeds"`
} }
@ -53,6 +59,17 @@ func ParseConfig(configPath string) (*Config, error) {
c.DbDir = path.Join(c.DataDir, "feed_data") c.DbDir = path.Join(c.DataDir, "feed_data")
} }
err = os.MkdirAll(c.DbDir, 0755)
if err != nil {
return nil, err
}
err = os.MkdirAll(c.DataDir, 0755)
if err != nil {
return nil, err
}
if c.Proxy != "" { if c.Proxy != "" {
if c.TelegramProxy == "" { if c.TelegramProxy == "" {
c.TelegramProxy = c.Proxy c.TelegramProxy = c.Proxy
@ -74,6 +91,13 @@ func ParseConfig(configPath string) (*Config, error) {
if feedCfg.Proxy == "NONE" { if feedCfg.Proxy == "NONE" {
feedCfg.Proxy = "" feedCfg.Proxy = ""
} }
if feedCfg.FTL != nil {
feedCfg.FirstTimeLimit = FeedLimit(*feedCfg.FTL)
} else if c.FTL != nil {
feedCfg.FirstTimeLimit = FeedLimit(*c.FTL)
} else {
feedCfg.FirstTimeLimit = NoLimit
}
} }
return &c, nil return &c, nil

View File

@ -26,10 +26,12 @@ const TimeFormat string = "2006-01-02T15:04:05.999999999-07:00"
type Record struct { type Record struct {
Time time.Time Time time.Time
Status Status Status Status
Filter string
FeedEntry FeedEntry FeedEntry FeedEntry
} }
type DB interface { type DB interface {
IsNewFeed() bool
Filter(entries []FeedEntry) ([]FeedEntry, error) Filter(entries []FeedEntry) ([]FeedEntry, error)
Save([]Record) error Save([]Record) error
} }
@ -39,6 +41,10 @@ type db struct {
seenLinks map[string]struct{} seenLinks map[string]struct{}
} }
func (d *db) IsNewFeed() bool {
return len(d.seenLinks) == 0
}
func NewDB(storageDir, feedName string) (DB, error) { func NewDB(storageDir, feedName string) (DB, error) {
dbPath := path.Join(storageDir, fmt.Sprintf("%s.csv", feedName)) dbPath := path.Join(storageDir, fmt.Sprintf("%s.csv", feedName))
db := db{dbPath: dbPath} db := db{dbPath: dbPath}
@ -91,7 +97,7 @@ func (d *db) Save(records []Record) error {
"Date", "Date",
"Link", "Link",
"Status", "Status",
"FilteredBy", "Filter",
"Content", "Content",
}) })
} }
@ -100,8 +106,8 @@ func (d *db) Save(records []Record) error {
r.Time.Format(TimeFormat), r.Time.Format(TimeFormat),
r.FeedEntry.Link, r.FeedEntry.Link,
string(r.Status), string(r.Status),
"-", r.Filter,
strings.ReplaceAll(r.FeedEntry.Content, "\n", " "), fmt.Sprintf("<item>%s</item>", strings.ReplaceAll(r.FeedEntry.Content, "\n", " ")),
}) })
} }
csvw.Flush() csvw.Flush()

View File

@ -23,7 +23,7 @@ type scheduler struct {
} }
func NewScheduler(filePath string) (Scheduler, error) { func NewScheduler(filePath string) (Scheduler, error) {
s := scheduler{filePath: filePath} s := scheduler{filePath: filePath, lastSuccessTime: map[string]time.Time{}}
data, err := os.ReadFile(filePath) data, err := os.ReadFile(filePath)
if err != nil { if err != nil {
if !errors.Is(err, os.ErrNotExist) { if !errors.Is(err, os.ErrNotExist) {

14
exp/slice/main.go Normal file
View File

@ -0,0 +1,14 @@
package main
import "fmt"
func main() {
var arr []int
for i := 0; i < 10; i++ {
arr = append(arr, i)
}
fmt.Println(arr)
fmt.Println(arr[:0], arr[0:])
fmt.Println(arr[:4], arr[4:])
fmt.Println(arr[:15], arr[15:])
}

View File

@ -15,10 +15,6 @@ import (
"golang.org/x/time/rate" "golang.org/x/time/rate"
) )
func main() {
fmt.Println("vim-go")
}
type TelegramSender interface { type TelegramSender interface {
SendLink(link, channel, rhash string) error SendLink(link, channel, rhash string) error
} }