# frozen_string_literal: true

# Image URLs
#
# # sample
# * https://imglf3.lf127.net/img/S1d2QlVsWkJhSW1qcnpIS0ZSa3ZJSzFCWFlnUWgzb01DcUdpT1lreG5yQjJVMkhGS09HNGR3PT0.png?imageView&thumbnail=1680x0&quality=96&stripmeta=0
#
# # full size
# * https://imglf3.lf127.net/img/S1d2QlVsWkJhSW1qcnpIS0ZSa3ZJSzFCWFlnUWgzb01DcUdpT1lreG5yQjJVMkhGS09HNGR3PT0.png
# * http://imglf0.nosdn.127.net/img/cHl3bXNZdDRaaHBnNWJuN1Y4OXBqR01CeVBZSVNmU2FWZWtHc1h4ZTZiUGxlRzMwZnFDM1JnPT0.jpg (404)
#
# Page URLs
#
# * https://gengar563.lofter.com/post/1e82da8c_1c98dae1b
# * https://yuli031458.lofter.com/post/3163d871_1cbdc5f6d (different theme/css selectors)
# * https://ssucrose.lofter.com/post/1d30f3e4_1cc58e9f0 (another different theme)
# * https://zuodaoxing.lofter.com/post/30b9c9c3_1cd15b686 (another theme)
#
# Profile URLs
#
# * http://gengar563.lofter.com/

module Sources
  module Strategies
    # Source strategy for Lofter posts, profiles and direct image links.
    class Lofter < Base
      # Matches a profile URL; the subdomain is captured as :artist_name.
      # Dots are escaped so that only a literal ".lofter.com" matches.
      PROFILE_URL = %r{\Ahttps?://(?<artist_name>[\w-]+)\.lofter\.com}i

      # Matches a post URL; adds the :illust_id capture on top of PROFILE_URL.
      PAGE_URL = %r{#{PROFILE_URL}/post/(?<illust_id>[\w-]+)}i

      # Matches the scheme + host prefix of a direct image URL
      # (imglfN.lf127.net or imglfN.nosdn[N].12N.net).
      IMAGE_HOST = %r{\Ahttps?://imglf\d\.(?:nosdn\d?\.12\d|lf127)\.net}i

      # @return [Array<String>] registrable domains handled by this strategy
      def domains
        ["lofter.com", "lf127.net"]
      end

      # @return [String] display name of the site
      def site_name
        "Lofter"
      end

      # Whether this strategy applies to the current URL.
      #
      # IMAGE_HOST is anchored on the URL scheme, so it has to be tested
      # against the full URL string; testing it against the bare host can
      # never succeed.
      #
      # @return [Boolean]
      def match?
        return false if parsed_url.nil?

        parsed_url.domain.in?(domains) || url.to_s.match?(IMAGE_HOST)
      end

      # The full-size image URL: derived directly from `url` when it is
      # already an image link, otherwise the first image found on the page.
      #
      # @return [String, nil]
      def image_url
        if url =~ IMAGE_HOST
          get_full_version(url)
        else
          image_urls.first
        end
      end

      # Full-size URLs of every image found on the post page.
      #
      # @return [Array<String>] empty when the page is unavailable
      def image_urls
        images = page&.search(".imgclasstag img")
        images.to_a.map { |img| get_full_version(img["src"]) }
      end

      # Rebuilds an image URL as https://host/path, dropping the query
      # string (e.g. the thumbnail/quality parameters of sample URLs).
      #
      # @param url [String] image URL
      # @return [String]
      def get_full_version(url)
        parsed = URI.parse(url)
        "https://#{parsed.host}#{parsed.path}"
      end

      # @return [String, nil] profile URL, or nil when no artist name is known
      def profile_url
        return nil if artist_name.blank?

        "https://#{artist_name}.lofter.com"
      end

      # @return [String, nil] canonical post URL, or nil when the post id or
      #   the profile URL cannot be determined
      def page_url
        return nil if illust_id.blank? || profile_url.blank?

        "#{profile_url}/post/#{illust_id}"
      end

      # Fetches the post page through `http` with a one-minute cache.
      #
      # @return [Object, nil] the parsed response body (presumably an HTML
      #   document supporting `search` - confirm against the HTTP client),
      #   or nil when there is no page URL or the status is not 200
      def page
        return nil if page_url.blank?

        response = http.cache(1.minute).get(page_url)
        response.parse if response.status == 200
      end

      # Tags of the post as [name, href] pairs.
      #
      # Tries the selectors used by several themes first (stripping a leading
      # "● " marker), then falls back to ".main .tags a" (stripping a leading
      # "#") when nothing was found.
      #
      # @return [Array<Array(String, String)>] empty when the page is unavailable
      def tags
        nodes = page&.search(".info .tag, .main .tag a, .tagarea, .m-info .tags .tag")

        # The mapped pairs must be kept; returning the raw node set would
        # hand callers nodes instead of [name, href] pairs.
        tags = nodes.to_a.map do |tag|
          [tag.text.gsub(/^● /, ""), tag.attr("href")]
        end

        if tags.blank?
          tags = page&.search(".main .tags a").to_a.map do |tag|
            [tag.text.gsub(/^#/, ""), tag.attr("href")]
          end
        end

        tags
      end

      # @return [String, nil] HTML of the first text block matched by the
      #   theme-specific selectors, or nil when none is found
      def artist_commentary_desc
        page&.search(".ct .text, .content .text, .posts .photo .text").to_a.compact.first&.to_html
      end

      # @return [String, nil] the canonical post URL
      def normalize_for_source
        page_url
      end

      # @return [String, nil] post id taken from the first of `urls` that
      #   matches PAGE_URL
      def illust_id
        urls.map { |u| u[PAGE_URL, :illust_id] }.compact.first
      end

      # @return [String, nil] artist subdomain taken from the first of `urls`
      #   that matches PROFILE_URL or PAGE_URL
      def artist_name
        urls.map { |u| u[PROFILE_URL, :artist_name] || u[PAGE_URL, :artist_name] }.compact.first
      end

      # @return [Integer] download timeout (presumably seconds - confirm
      #   against Base)
      def download_timeout
        60
      end
    end
  end
end