Files
danbooru/app/logical/sources/strategies/lofter.rb
evazion a7dc05ce63 Enable frozen string literals.
Make all string literals immutable by default.
2021-12-14 21:33:27 -06:00

117 lines
3.0 KiB
Ruby

# frozen_string_literal: true
# Image URLs
#
# # sample
# * https://imglf3.lf127.net/img/S1d2QlVsWkJhSW1qcnpIS0ZSa3ZJSzFCWFlnUWgzb01DcUdpT1lreG5yQjJVMkhGS09HNGR3PT0.png?imageView&thumbnail=1680x0&quality=96&stripmeta=0
#
# # full size
# * https://imglf3.lf127.net/img/S1d2QlVsWkJhSW1qcnpIS0ZSa3ZJSzFCWFlnUWgzb01DcUdpT1lreG5yQjJVMkhGS09HNGR3PT0.png
# * http://imglf0.nosdn.127.net/img/cHl3bXNZdDRaaHBnNWJuN1Y4OXBqR01CeVBZSVNmU2FWZWtHc1h4ZTZiUGxlRzMwZnFDM1JnPT0.jpg (404)
#
# Page URLs
#
# * https://gengar563.lofter.com/post/1e82da8c_1c98dae1b
# * https://yuli031458.lofter.com/post/3163d871_1cbdc5f6d (different theme/css selectors)
# * https://ssucrose.lofter.com/post/1d30f3e4_1cc58e9f0 (another different theme)
# * https://zuodaoxing.lofter.com/post/30b9c9c3_1cd15b686 (another theme)
#
# Profile URLs
#
# * http://gengar563.lofter.com/
module Sources
  module Strategies
    # Source strategy for Lofter blog posts and the image hosts that serve
    # their media. Helpers such as `url`, `urls`, `parsed_url` and `http` are
    # not defined here; presumably they are inherited from Base.
    class Lofter < Base
      # Blog base URL; the subdomain is captured as `artist_name`.
      # The dots are escaped so that only a literal ".lofter.com" matches.
      PROFILE_URL = %r{\Ahttps?://(?<artist_name>[\w-]+)\.lofter\.com}i

      # Post URL; extends PROFILE_URL and also captures `illust_id`.
      PAGE_URL = %r{#{PROFILE_URL}/post/(?<illust_id>[\w-]+)}i

      # Scheme plus host of a direct image URL. Because the pattern is anchored
      # at the scheme, it must be tested against a full URL, not a bare host.
      IMAGE_HOST = %r{\Ahttps?://imglf\d\.(?:nosdn\d?\.12\d|lf127)\.net}i

      # @return [Array<String>] registrable domains handled by this strategy
      def domains
        ["lofter.com", "lf127.net"]
      end

      # @return [String] display name of the site
      def site_name
        "Lofter"
      end

      # @return [Boolean] whether the URL belongs to Lofter or one of its image hosts
      def match?
        return false if parsed_url.nil?

        # IMAGE_HOST includes the scheme, so it is checked against the whole
        # URL (as in #image_url); checking it against the host never matches.
        parsed_url.domain.in?(domains) || IMAGE_HOST.match?(url)
      end

      # @return [String, nil] the full-size image URL: the URL itself when it
      #   already points at an image host, otherwise the first image on the page
      def image_url
        return get_full_version(url) if IMAGE_HOST.match?(url)

        image_urls.first
      end

      # @return [Array<String>] full-size URLs of every image found on the post
      #   page; empty when the page could not be fetched
      def image_urls
        images = page&.search(".imgclasstag img")
        # Skip <img> elements without a src; URI.parse(nil) would raise.
        sources = images.to_a.map { |img| img["src"] }.reject(&:blank?)
        sources.map { |src| get_full_version(src) }
      end

      # Rebuilds the URL from its host and path only, over https. This drops
      # the query string (e.g. the `?imageView&thumbnail=...` sample parameters).
      #
      # @param url [String] an image URL
      # @return [String] the same image URL without query parameters
      def get_full_version(url)
        parsed = URI.parse(url)
        "https://#{parsed.host}#{parsed.path}"
      end

      # @return [String, nil] the artist's blog URL, or nil if no artist name is known
      def profile_url
        return nil if artist_name.blank?

        "https://#{artist_name}.lofter.com"
      end

      # @return [String, nil] the canonical post URL, or nil if the post id or
      #   artist name is unknown
      def page_url
        return nil if illust_id.blank? || profile_url.blank?

        "#{profile_url}/post/#{illust_id}"
      end

      # Fetches the post page, with the HTTP response cached for one minute.
      #
      # @return [Object, nil] the parsed response (presumably an HTML document
      #   supporting `search`), or nil when there is no page URL or the
      #   response status is not 200
      def page
        return nil if page_url.blank?

        response = http.cache(1.minute).get(page_url)
        response.parse if response.status == 200
      end

      # Extracts the post's tags. Several selectors are tried because blogs
      # use different themes.
      #
      # @return [Array<Array(String, String)>] `[name, href]` pairs; empty when
      #   the page is unavailable or has no tags
      def tags
        doc = page
        return [] if doc.nil?

        found = doc.search(".info .tag, .main .tag a, .tagarea, .m-info .tags .tag").to_a.map do |tag|
          [tag.text.gsub(/^● /, ""), tag.attr("href")]
        end
        return found if found.present?

        # Fallback selector, where tag text is prefixed with "#".
        doc.search(".main .tags a").to_a.map do |tag|
          [tag.text.gsub(/^#/, ""), tag.attr("href")]
        end
      end

      # @return [String, nil] HTML of the first matching description element, if any
      def artist_commentary_desc
        page&.search(".ct .text, .content .text, .posts .photo .text").to_a.compact.first&.to_html
      end

      # @return [String, nil] the post URL, used as the normalized source
      def normalize_for_source
        page_url
      end

      # @return [String, nil] the post id taken from the first URL matching PAGE_URL
      def illust_id
        urls.map { |u| u[PAGE_URL, :illust_id] }.compact.first
      end

      # @return [String, nil] the blog subdomain taken from the first matching URL
      def artist_name
        urls.map { |u| u[PROFILE_URL, :artist_name] || u[PAGE_URL, :artist_name] }.compact.first
      end

      # @return [Integer] download timeout (unit not shown here; presumably seconds)
      def download_timeout
        60
      end
    end
  end
end