Files
danbooru/app/logical/source/extractor/newgrounds.rb
2022-11-11 12:28:23 +01:00

115 lines
3.1 KiB
Ruby

# frozen_string_literal: true
# @see Source::URL::Newgrounds
module Source
class Extractor
class Newgrounds < Source::Extractor
def match?
Source::URL::Newgrounds === parsed_url
end
def image_urls
if parsed_url.full_image_url.present?
[parsed_url.full_image_url]
elsif parsed_url.image_url?
[url]
elsif video_data.present?
sample = video_data&.[]("sources")&.max_by { |k, _v| k.gsub(/p$/, "").to_i }&.dig(1, 0, "src")
final = [Source::URL.parse(sample)&.full_image_url, sample].compact.find { |u| http_exists?(u) }
[final].compact
else
urls = []
urls += page&.css(".image img").to_a.pluck("src")
urls += page&.css("#author_comments img[data-user-image='1']").to_a.map { |img| img["data-smartload-src"] || img["src"] }
urls.compact
end
end
def page_url
parsed_url.page_url || parsed_referer&.page_url
end
def tags
page&.css("#sidestats .tags a").to_a.map do |tag|
[tag.text, "https://www.newgrounds.com/search/conduct/art?match=tags&tags=#{tag.text}"]
end
end
def normalize_tag(tag)
tag = tag.tr("-", "_")
super(tag)
end
def artist_name
name = page&.css(".item-user .item-details h4 a")&.text&.strip || user_name
name&.downcase
end
def other_names
[artist_name, user_name].compact.uniq
end
def profile_url
# user names are not mutable, artist names are.
# However we need the latest name for normalization
"https://#{artist_name}.newgrounds.com" if artist_name.present?
end
def artist_commentary_title
page&.css(".pod-head > [itemprop='name']")&.text
end
def artist_commentary_desc
return "" if page.nil?
page.dup.css("#author_comments").tap { _1.css("ul.itemlist").remove }.to_html
end
def dtext_artist_commentary_desc
DText.from_html(artist_commentary_desc).strip
end
def user_name
parsed_url.username || parsed_referer&.username
end
def illust_title
parsed_url.work_title || parsed_referer&.work_title
end
def video_id
parsed_url.video_id || parsed_referer&.video_id
end
def http
super.cookies(vmkIdu5l8m: Danbooru.config.newgrounds_session_cookie)
end
def page
return nil if page_url.blank?
response = http.cache(1.minute).get(page_url)
return nil if response.status == 404
response.parse
end
def video_data
# flash files return {"error"=>{"code"=>404, "msg"=>"The submission you are looking for does not have a video."}}
return {} unless video_id.present?
response = http.headers("X-Requested-With": "XMLHttpRequest").cache(1.minute).get("https://www.newgrounds.com/portal/video/#{video_id}")
return {} unless response.status == 200
JSON.parse(response).with_indifferent_access
rescue JSON::ParserError
{}
end
memoize :page, :video_data
end
end
end