Files
danbooru/app/logical/source/extractor/hentai_foundry.rb
evazion c19fc16885 sources: don't escape Unicode characters in tag search URLs.
Fix it so that Unicode characters aren't unnecessarily percent-encoded when generating tag search
URLs. For example, generate URLs like this:

* https://www.pixiv.net/tags/オリジナル/artworks

Not like this:

* https://www.pixiv.net/tags/%E3%82%AA%E3%83%AA%E3%82%B8%E3%83%8A%E3%83%AB/artworks
2022-12-02 16:35:49 -06:00

75 lines
1.8 KiB
Ruby

# frozen_string_literal: true
# @see Source::URL::HentaiFoundry
module Source
  class Extractor
    # Extractor for Hentai Foundry. Builds the picture page URL from the
    # artist name and picture ID found in the URL (or the referer), fetches
    # that page, and reads image URLs, tags, and artist commentary from it.
    class HentaiFoundry < Source::Extractor
      # @return [Boolean] whether `parsed_url` is matched by
      #   `Source::URL::HentaiFoundry` (via `===`)
      def match?
        Source::URL::HentaiFoundry === parsed_url
      end

      # Collects the `src` of every `<img>` inside `#picBox` on the picture
      # page, resolved against the page URL so that relative sources become
      # absolute URLs.
      #
      # @return [Array<String>] absolute image URLs; empty when the page is
      #   unavailable
      def image_urls
        images = page&.search("#picBox img")
        return [] unless images

        base_url = page_url

        # Skip <img> elements with a missing or empty `src`: URI.join can't
        # resolve nil, and an empty reference would resolve to the page URL
        # itself rather than to an image.
        sources = images.to_a.map { |img| img["src"] }.reject(&:blank?)
        sources.map { |src| URI.join(base_url, src).to_s }
      end

      # @return [String, nil] the picture page URL, or nil when no picture ID
      #   is known. The short `/pic-<id>` form is used when the artist name
      #   is unknown.
      def page_url
        return nil if illust_id.blank?

        if artist_name.present?
          "https://www.hentai-foundry.com/pictures/user/#{artist_name}/#{illust_id}"
        else
          "https://www.hentai-foundry.com/pic-#{illust_id}"
        end
      end

      # Fetches and parses the picture page. The result is memoized (see
      # `memoize :page` at the bottom of the class).
      #
      # @return [Object, nil] the parsed response, or nil when there is no
      #   page URL or the response status isn't 200
      def page
        return nil if page_url.blank?

        # NOTE(review): `enterAgree=1` presumably skips the site's age
        # confirmation screen -- confirm against the site's behavior.
        response = http.cache(1.minute).get("#{page_url}?enterAgree=1")
        response.parse if response.status == 200
      end

      # @return [Array<Array(String, String)>] `[tag name, tag search URL]`
      #   pairs read from the `rel="tag"` elements inside `.boxbody`; empty
      #   when the page is unavailable
      def tags
        # `nil.to_a` is `[]`, so a missing page simply yields no tags.
        tag_names = page&.search(".boxbody [rel='tag']").to_a.map(&:text)

        tag_names.map do |tag|
          [tag, "https://www.hentai-foundry.com/pictures/tagged/#{Danbooru::URL.escape(tag)}"]
        end
      end

      # @return [String, nil] the username from `parsed_url`, falling back to
      #   the one from `parsed_referer`
      def artist_name
        parsed_url.username || parsed_referer&.username
      end

      # @return [String, nil] the artist's profile URL, or nil when the
      #   artist name is unknown
      def profile_url
        return nil if artist_name.blank?

        "https://www.hentai-foundry.com/user/#{artist_name}"
      end

      # @return [String, nil] the text of `#picBox .imageTitle`, or nil when
      #   the page is unavailable
      def artist_commentary_title
        page&.search("#picBox .imageTitle")&.text
      end

      # @return [String, nil] the HTML of `#descriptionBox .picDescript`, or
      #   nil when the page is unavailable
      def artist_commentary_desc
        page&.search("#descriptionBox .picDescript")&.to_html
      end

      # Converts the commentary HTML with `DText.from_html`, strips leading
      # and trailing whitespace, and collapses runs of newlines into a single
      # newline.
      #
      # @return [String]
      def dtext_artist_commentary_desc
        DText.from_html(artist_commentary_desc).gsub(/\A[[:space:]]+|[[:space:]]+\z/, "").gsub(/\n+/, "\n")
      end

      # @return [String, Integer, nil] the work ID from `parsed_url`, falling
      #   back to the one from `parsed_referer`
      def illust_id
        parsed_url.work_id || parsed_referer&.work_id
      end

      # `page` is called by several methods above; memoize it.
      memoize :page
    end
  end
end