package blog import ( "fmt" "github.com/Kugelschieber/marvinblum.de/tpl" emvi "github.com/emvi/api-go" "github.com/emvi/logbuch" "io/ioutil" "net/http" "os" "path/filepath" "regexp" "sync" "time" ) const ( blogCacheTime = time.Minute * 15 blogFileCache = "static/blog" maxLatestArticles = 3 ) var ( linkRegex = regexp.MustCompile(`(?iU)href="/read/([^"]+)"`) attachmentRegex = regexp.MustCompile(`(?iU)(href|src)="([^"]+)/api/v1/content/([^"]+)"`) attachmentURLRegex = regexp.MustCompile(`(?iU)(href|src)="([^"]+/api/v1/content/)([^"]+)"`) ) type Blog struct { client *emvi.Client articles []emvi.Article // sorted by date published (descending) articleMap map[string]emvi.Article // id -> article articlesYear map[int][]emvi.Article // year -> articleMap nextUpdate time.Time cache *tpl.Cache m sync.Mutex } func NewBlog(cache *tpl.Cache) *Blog { logbuch.Info("Initializing blog") b := &Blog{cache: cache} b.client = emvi.NewClient(os.Getenv("MB_EMVI_CLIENT_ID"), os.Getenv("MB_EMVI_CLIENT_SECRET"), os.Getenv("MB_EMVI_ORGA"), nil) b.nextUpdate = time.Now().Add(blogCacheTime) if err := os.MkdirAll(blogFileCache, 0755); err != nil { logbuch.Error("Error creating blog file cache directory", logbuch.Fields{"err": err}) } b.loadArticles() return b } func (blog *Blog) GetArticle(id string) emvi.Article { blog.refreshIfRequired() return blog.articleMap[id] } func (blog *Blog) GetArticles() map[int][]emvi.Article { blog.refreshIfRequired() return blog.articlesYear } func (blog *Blog) GetLatestArticles() []emvi.Article { blog.refreshIfRequired() articles := make([]emvi.Article, 0, 3) i := 1 for _, v := range blog.articles { articles = append(articles, v) i++ if i > maxLatestArticles { break } } return articles } func (blog *Blog) loadArticles() { blog.m.Lock() defer blog.m.Unlock() logbuch.Info("Refreshing blog articleMap...") articles, offset, count := make([]emvi.Article, 0), 0, 1 var err error for count > 0 { var results []emvi.Article results, _, err = blog.client.FindArticles("", &emvi.ArticleFilter{ BaseSearch: emvi.BaseSearch{Offset: offset}, Tags: "blog", SortPublished: emvi.SortDescending, }) if err != nil { logbuch.Error("Error loading blog articleMap", logbuch.Fields{"err": err}) break } offset += len(results) count = len(results) for _, article := range results { articles = append(articles, article) } } if err == nil { for i, article := range articles { article.LatestArticleContent = blog.loadArticle(article) articles[i] = article } blog.setArticles(articles) } blog.nextUpdate = time.Now().Add(blogCacheTime) logbuch.Info("Done", logbuch.Fields{"count": len(articles)}) } func (blog *Blog) loadArticle(article emvi.Article) *emvi.ArticleContent { existingArticle := blog.articleMap[article.Id] var content *emvi.ArticleContent if len(existingArticle.Id) == 0 || !existingArticle.ModTime.Equal(article.ModTime) { var err error _, content, _, err = blog.client.GetArticle(article.Id, article.LatestArticleContent.LanguageId, 0) if err != nil { logbuch.Error("Error loading article", logbuch.Fields{"err": err, "id": article.Id}) return nil } blog.downloadAttachments(article.Id, content.Content) content.Content = linkRegex.ReplaceAllString(content.Content, `href="/blog/$1"`) content.Content = attachmentRegex.ReplaceAllString(content.Content, fmt.Sprintf(`$1="/static/blog/%s/$3"`, article.Id)) logbuch.Debug("Article loaded", logbuch.Fields{"id": article.Id}) } else { content = existingArticle.LatestArticleContent logbuch.Debug("Article up to date, skipping refreshing cache", logbuch.Fields{"id": article.Id}) } return content } func (blog *Blog) downloadAttachments(id, content string) { if _, err := os.Stat(filepath.Join(blogFileCache, id)); os.IsNotExist(err) { if err := os.MkdirAll(filepath.Join(blogFileCache, id), 0755); err != nil { logbuch.Error("Error creating article file cache directory", logbuch.Fields{"err": err, "id": id}) return } } results := attachmentURLRegex.FindAllStringSubmatch(content, -1) for _, attachment := range results { if len(attachment) == 4 { resp, err := http.Get(attachment[2] + attachment[3]) if err != nil { logbuch.Error("Error downloading blog attachment", logbuch.Fields{"err": err, "id": id}) continue } data, err := ioutil.ReadAll(resp.Body) if err != nil { logbuch.Error("Error reading blog attachment body", logbuch.Fields{"err": err, "id": id}) continue } if err := resp.Body.Close(); err != nil { logbuch.Error("Error closing response body on attachment download", logbuch.Fields{"err": err, "id": id}) } if err := ioutil.WriteFile(filepath.Join(blogFileCache, id, attachment[3]), data, 0755); err != nil { logbuch.Error("Error saving blog attachment on disk", logbuch.Fields{"err": err, "id": id}) } } } } func (blog *Blog) setArticles(articles []emvi.Article) { blog.articles = articles blog.articleMap = make(map[string]emvi.Article) blog.articlesYear = make(map[int][]emvi.Article) for _, article := range articles { if blog.articlesYear[article.Published.Year()] == nil { blog.articlesYear[article.Published.Year()] = make([]emvi.Article, 0) } blog.articlesYear[article.Published.Year()] = append(blog.articlesYear[article.Published.Year()], article) blog.articleMap[article.Id] = article } } func (blog *Blog) refreshIfRequired() { if blog.nextUpdate.Before(time.Now()) { blog.cache.Clear() blog.loadArticles() } }