Files
danbooru/app/logical/source/extractor/newgrounds.rb
2022-11-09 15:01:28 +01:00

113 lines
3.0 KiB
Ruby

# frozen_string_literal: true
# @see Source::URL::Newgrounds
module Source
class Extractor
class Newgrounds < Source::Extractor
def match?
Source::URL::Newgrounds === parsed_url
end
def image_urls
if parsed_url.full_image_url.present?
[parsed_url.full_image_url]
elsif parsed_url.image_url?
[url]
elsif video_data.present?
[video_data.dig("sources", "1080p", 0, "src")&.sub(".1080p.", ".")].compact
else
urls = []
urls += page&.css(".image img").to_a.pluck("src")
urls += page&.css("#author_comments img[data-user-image='1']").to_a.map { |img| img["data-smartload-src"] || img["src"] }
urls.compact
end
end
def page_url
parsed_url.page_url || parsed_referer&.page_url
end
def tags
page&.css("#sidestats .tags a").to_a.map do |tag|
[tag.text, "https://www.newgrounds.com/search/conduct/art?match=tags&tags=#{tag.text}"]
end
end
def normalize_tag(tag)
tag = tag.tr("-", "_")
super(tag)
end
def artist_name
name = page&.css(".item-user .item-details h4 a")&.text&.strip || user_name
name&.downcase
end
def other_names
[artist_name, user_name].compact.uniq
end
def profile_url
# user names are not mutable, artist names are.
# However we need the latest name for normalization
"https://#{artist_name}.newgrounds.com" if artist_name.present?
end
def artist_commentary_title
page&.css(".pod-head > [itemprop='name']")&.text
end
def artist_commentary_desc
return "" if page.nil?
page.dup.css("#author_comments").tap { _1.css("ul.itemlist").remove }.to_html
end
def dtext_artist_commentary_desc
DText.from_html(artist_commentary_desc).strip
end
def user_name
parsed_url.username || parsed_referer&.username
end
def illust_title
parsed_url.work_title || parsed_referer&.work_title
end
def video_id
parsed_url.video_id || parsed_referer&.video_id
end
def http
super.cookies(vmkIdu5l8m: Danbooru.config.newgrounds_session_cookie)
end
def page
return nil if page_url.blank?
response = http.cache(1.minute).get(page_url)
return nil if response.status == 404
response.parse
end
def video_data
# flash files return {"error"=>{"code"=>404, "msg"=>"The submission you are looking for does not have a video."}}
return {} unless video_id.present?
response = http.headers("X-Requested-With": "XMLHttpRequest").cache(1.minute).get("https://www.newgrounds.com/portal/video/#{video_id}")
return {} unless response.status == 200
JSON.parse(response).with_indifferent_access
rescue JSON::ParserError
{}
end
memoize :page, :video_data
end
end
end