From c1c4f344cbfff654e729c83a6fb8013aa62d1504 Mon Sep 17 00:00:00 2001
From: David Howden
Date: Tue, 15 Sep 2015 21:36:06 +1000
Subject: [PATCH] Added basic support for extracting published_time meta value

---
 crawler.go | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/crawler.go b/crawler.go
index 64a135d..661cf57 100644
--- a/crawler.go
+++ b/crawler.go
@@ -87,6 +87,8 @@ func (this Crawler) Crawl() *Article {
 	article.MetaLang = extractor.getMetaLanguage(article)
 	article.MetaFavicon = extractor.getFavicon(article)
 
+	article.PublishDate = extractor.getMetaContentWithSelector(article, "meta[property#=(?i)article:published_time]")
+
 	article.MetaDescription = extractor.getMetaContentWithSelector(article, "meta[name#=(?i)description]")
 	article.MetaKeywords = extractor.getMetaContentWithSelector(article, "meta[name#=(?i)keywords]")
 	article.CanonicalLink = extractor.getCanonicalLink(article)