package main
import (
	"flag"
	"io/ioutil"
	"log"
	"net/http"
	"path/filepath"
	"regexp"
	"strconv"
	"time"

	"github.com/gorilla/feeds"
)
// subst is a single replacement rule: from is the text to look for and to is
// the text that takes its place.
type subst struct {
	from, to string
}
// substitutes lists the replacement rules that getPage runs over every
// downloaded page.
//
// NOTE(review): each entry currently maps a string to itself, so as written
// the rules change nothing. Presumably `from` was meant to hold the HTML
// entity form of the character — confirm against the upstream pages.
var substitutes = []subst{
	{from: `"`, to: `"`},
	{from: `–`, to: `–`},
}

// Patterns applied to the program's listing and "about" pages.
var (
	// programNameRe captures the text between <h2> and </h2>; main uses it
	// as the feed title.
	programNameRe = regexp.MustCompile(`<h2>(.+?)?</h2>`)
	// programAboutRe captures the body of the "anons" div; main strips the
	// markup from it and uses the result as the feed description.
	programAboutRe = regexp.MustCompile(`(?s)<div class="brand__content_text__anons">(.+?)?</div>`)
	// programImageRe captures, inside the promo header, the image src
	// (group 2) and its alt text (group 4).
	programImageRe = regexp.MustCompile(`(?s)<div class="brand\-promo__header">(.+?)?<img src="(.+?)?"(.+?)?alt='(.+?)?'>`)
)

// Patterns applied to episodes.
var (
	// episodeRe matches one whole episode entry of the listing page; the
	// remaining patterns except episodeDescRe run against such an entry.
	episodeRe = regexp.MustCompile(`(?s)<div class="brand__list\-\-wrap\-\-item">(.+?)?<div class="add\-to\-list">`)
	// episodeAudioRe captures the data-id value, which main appends to the
	// audio download URL.
	episodeAudioRe = regexp.MustCompile(`data\-id="(.+?)?">`)
	// episodeDateRe captures five fields that main reads as day, month,
	// year, hour and minute, in that order.
	episodeDateRe = regexp.MustCompile(`brand\-time brand\-menu\-link">(.+?)?\.(.+?)?\.(.+?)? в (.+?)?:(.+?)?</a>`)
	// episodeDescRe captures the "anons" paragraph; main runs it against the
	// episode's own page rather than the listing entry.
	episodeDescRe = regexp.MustCompile(`<p class="anons">(.+?)?</p>`)
	// episodeTitleRe captures the text of the episode title link.
	episodeTitleRe = regexp.MustCompile(`title brand\-menu\-link">(.+?)?</a>`)
	// episodeUrlRe captures the part of the episode link that follows
	// "/brand/".
	episodeUrlRe = regexp.MustCompile(`<a href="/brand/(.+?)?" class="title`)
)

// feed is the feed under construction; its creation time is fixed when the
// package is initialised.
var feed = &feeds.Feed{
	Created: time.Now(),
}

var (
	// outputPath and programNumber receive the -path and -brand flag values.
	outputPath    string
	programNumber string
	// err is a package-level scratch error variable.
	err error
)
// main builds an RSS feed for one radiorus.ru program ("brand") and writes
// it to radiorus-<brand>.rss inside the directory given by -path.
//
// It downloads the program's episode listing and "about" pages, extracts the
// feed title, image and description from them, and then downloads each
// listed episode's page to obtain that episode's description. A failed
// download, a page fragment that cannot be found, a malformed air date, or a
// write error terminates the program through log.Fatal/log.Fatalf.
func main() {
	flag.StringVar(&outputPath, "path", "./", "path to put resulting RSS file in")
	flag.StringVar(&programNumber, "brand", "57083", "brand number (defaults to Aerostat)")
	flag.Parse()

	const brandBaseURL = "http://www.radiorus.ru/brand/"

	programURL := brandBaseURL + programNumber + "/episodes"
	programPage := getPage(programURL)

	feed.Title = string(mustSubmatch(programNameRe, programPage, "program name on "+programURL)[1])
	feed.Link = &feeds.Link{Href: programURL}

	programImage := mustSubmatch(programImageRe, programPage, "program image on "+programURL)
	feed.Image = &feeds.Image{
		Link:  programURL,
		Url:   string(programImage[2]),
		Title: string(programImage[4]),
	}

	programAboutURL := brandBaseURL + programNumber + "/about"
	programAboutPage := getPage(programAboutURL)
	programAbout := mustSubmatch(programAboutRe, programAboutPage, "program description on "+programAboutURL)[1]
	// Drop the markup so only the text of the description goes into the feed.
	tagRe := regexp.MustCompile(`<(.+?)?>`)
	feed.Description = string(tagRe.ReplaceAll(programAbout, []byte(``)))

	// The zone is the same for every episode, so build it once: a fixed
	// offset of three hours east of UTC.
	moscow := time.FixedZone("Moscow Time", int((3 * time.Hour).Seconds()))

	for _, episode := range episodeRe.FindAll(programPage, -1) {
		episodeURL := brandBaseURL + string(mustSubmatch(episodeUrlRe, episode, "episode link in listing "+programURL)[1])
		episodeTitle := string(mustSubmatch(episodeTitleRe, episode, "title of episode "+episodeURL)[1])
		episodeAudioURL := "https://audio.vgtrk.com/download?id=" +
			string(mustSubmatch(episodeAudioRe, episode, "audio id of episode "+episodeURL)[1])

		dateFields := mustSubmatch(episodeDateRe, episode, "air date of episode "+episodeURL)[1:]
		episodeDate, err := parseEpisodeDate(dateFields, moscow)
		if err != nil {
			log.Fatalf("parsing air date of episode %s: %v", episodeURL, err)
		}

		// The description is not part of the listing entry; it is taken
		// from the episode's own page.
		episodePage := getPage(episodeURL)
		episodeDesc := string(mustSubmatch(episodeDescRe, episodePage, "description on episode page "+episodeURL)[1])

		feed.Add(&feeds.Item{
			Id:    episodeURL,
			Link:  &feeds.Link{Href: episodeURL},
			Title: episodeTitle,
			Enclosure: &feeds.Enclosure{
				Url:    episodeAudioURL,
				Length: "1024",
				Type:   "audio/mpeg",
			},
			Created:     episodeDate,
			Description: episodeDesc,
		})
	}

	rss, err := feed.ToRss()
	if err != nil {
		log.Fatal(err)
	}

	// filepath.Join supplies the separator itself, so -path works with or
	// without a trailing slash.
	outputFile := filepath.Join(outputPath, "radiorus-"+programNumber+".rss")
	if err := ioutil.WriteFile(outputFile, []byte(rss), 0644); err != nil {
		log.Fatal(err)
	}
}

// mustSubmatch returns re.FindSubmatch(data). When re does not match it
// terminates the program with a message naming the missing fragment (what)
// and the pattern, rather than leaving the caller to panic while indexing a
// nil result.
func mustSubmatch(re *regexp.Regexp, data []byte, what string) [][]byte {
	match := re.FindSubmatch(data)
	if match == nil {
		log.Fatalf("cannot find %s (pattern %q)", what, re.String())
	}
	return match
}

// parseEpisodeDate converts the five capture groups of episodeDateRe — day,
// month, year, hour and minute, in that order — into a time in loc. It
// returns the strconv error of the first field that is not a number.
func parseEpisodeDate(fields [][]byte, loc *time.Location) (time.Time, error) {
	var date [5]int
	for i := range date {
		n, err := strconv.Atoi(string(fields[i]))
		if err != nil {
			return time.Time{}, err
		}
		date[i] = n
	}
	return time.Date(date[2], time.Month(date[1]), date[0], date[3], date[4], 0, 0, loc), nil
}
// httpClient is used for every page download. Its timeout bounds the whole
// exchange, including reading the body, so a stalled server cannot hang the
// program indefinitely.
var httpClient = &http.Client{Timeout: 30 * time.Second}

// getPage downloads pageUrl and returns the response body after running
// every entry of substitutes over it. Each entry's from is compiled as a
// regular expression and all of its matches are replaced with to; to is
// treated as a regexp replacement template, so `$` in it is special.
//
// A transport error, a response status other than 200 OK, or an error while
// reading the body terminates the program via log.Fatal/log.Fatalf.
func getPage(pageUrl string) []byte {
	res, err := httpClient.Get(pageUrl)
	if err != nil {
		log.Fatal(err)
	}
	defer res.Body.Close()

	// Stop here on an error response instead of handing an error page to
	// the caller as if it were the requested content.
	if res.StatusCode != http.StatusOK {
		log.Fatalf("fetching %s: unexpected HTTP status %s", pageUrl, res.Status)
	}

	page, err := ioutil.ReadAll(res.Body)
	if err != nil {
		log.Fatal(err)
	}
	for _, sub := range substitutes {
		re := regexp.MustCompile(sub.from)
		page = re.ReplaceAll(page, []byte(sub.to))
	}
	return page
}