[rzz] create feed from the webpage instead

pull/30/head
Alpha Chen 5 years ago
parent 036dbe2f2f
commit fa09f59de0

@ -8,36 +8,32 @@ module Rzz
class App < Roda
plugin :caching
plugin :json
route do |r|
r.get do
r.is "test-gym" do
url = "https://elemental.medium.com/feed"
xml = URI.open(url).read
r.etag Digest::SHA1.hexdigest(xml)
doc = Nokogiri::XML(xml)
self_url = "#{r.base_url}#{r.path}" # Should this be configured via the environment?
doc.at_xpath("/rss/channel/link/text()").content = self_url
doc.at_xpath("/rss/channel/atom:link[@href='#{url}']")["href"] = self_url
doc.at_xpath("/rss/channel/atom:link[@rel='hub']").remove
doc
.xpath("/rss/channel/item")
.select {|item| item.xpath("./category[text()='test-gym']").empty? }
.each(&:remove)
doc
.xpath("/rss/channel/item")
.each do |item|
link = item.at_xpath("./link/text()").content
item.at_xpath("./description/text()").content = URI.open(link).read
end
response.headers["Content-Type"] = "text/xml"
doc.to_xml
url = "https://elemental.medium.com/test-gym/home"
html = URI.open(url).read
doc = Nokogiri::HTML(html)
items = doc.xpath("//a[@data-post-id]").map {|a|
attrs = a.attributes
id = attrs.fetch("data-post-id").value
title = a.xpath("./h3").text
content = a.xpath("./div").text
href = URI(attrs.fetch("href"))
url = "#{href.scheme}://#{href.host}#{href.path}"
{ id: id, title: title, content_text: content, url: url }
}
{
version: "https://jsonfeed.org/version/1",
title: "Test Gym",
home_page_url: url,
feed_url: "#{r.base_url}#{r.path}",
items: items,
}
end
end
end

Loading…
Cancel
Save