* `legacy_normalize` was introduced in c6012535 to work around an issue that is no longer a problem.
* `normalize_for_search` is only used for "[mass edit]" links
in artist entries. These links are a shortcut for performing a
`-artist_name source:<artist_url> -> artist_name` mass edit to tag
untagged artists, but this won't work for most sites these days.
97 lines
2.5 KiB
Ruby
97 lines
2.5 KiB
Ruby
# An external URL attached to an artist.
#
# Each record stores the URL itself (`url`, without any inactive prefix) and a
# canonical form (`normalized_url`) computed by ArtistUrl.normalize before
# validation. A URL submitted with a leading "-" is treated as inactive: the
# dash is stripped, `is_active` is set to false, and #to_s puts the dash back.
class ArtistUrl < ApplicationRecord
  # Callbacks run in declaration order: strip the "-" prefix first, seed
  # normalized_url on create, then overwrite it with the canonical form.
  before_validation :parse_prefix
  before_validation :initialize_normalized_url, on: :create
  before_validation :normalize
  validates :url, presence: true, uniqueness: { scope: :artist_id }
  validate :validate_url_format
  belongs_to :artist, touch: true

  # Removes every leading "-" from the given URL string.
  #
  # @param url [String]
  # @return [String] a copy of `url` without its leading dashes
  def self.strip_prefixes(url)
    # \A (not ^) so that only the very start of the string is considered,
    # even when the value contains embedded newlines.
    url.sub(/\A-+/, "")
  end

  # Tells whether a raw URL string is active, i.e. does not start with "-".
  #
  # @param url [String, nil]
  # @return [Boolean] true unless the string begins with a dash
  def self.is_active?(url)
    url !~ /\A-/
  end

  # Produces the canonical form of a URL used for `normalized_url`.
  #
  # The result always uses the http:// scheme, has a lowercased host, and ends
  # with exactly one trailing slash. A few site-specific rewrites are applied,
  # and the matching source strategy is asked for its own artist-finder
  # normalization when it offers one.
  #
  # @param url [String, nil]
  # @return [String, nil] the normalized URL, or nil when `url` is nil
  def self.normalize(url)
    return nil if url.nil?

    url = url.sub(%r{\Ahttps://}, "http://")
    # The block receives the whole match ("http://host"), which is lowercased.
    url = url.sub(%r{\Ahttp://[^/]+}i, &:downcase)

    # Collapse the numbered fc2 blog / image hosts onto a single blog.fc2 host.
    url = url.sub(%r{\Ahttp://blog\d+\.fc2}, "http://blog.fc2")
    url = url.sub(%r{\Ahttp://blog-imgs-\d+\.fc2}, "http://blog.fc2")
    url = url.sub(%r{\Ahttp://blog-imgs-\d+-\w+\.fc2}, "http://blog.fc2")
    # url = url.sub(%r!^(http://seiga.nicovideo.jp/user/illust/\d+)\?.+!, '\1/')
    url = url.sub(%r{\Ahttp://pictures\.hentai-foundry\.com//}, "http://pictures.hentai-foundry.com/")

    # The strategy won't always work for twitter because it looks for a status,
    # so twitter URLs are lowercased here as well.
    url = url.downcase if url =~ %r{\Ahttps?://(?:mobile\.)?twitter\.com}

    begin
      source = Sources::Strategies.find(url)

      if !source.normalized_for_artist_finder? && source.normalizable_for_artist_finder?
        url = source.normalize_for_artist_finder
      end
    rescue Net::OpenTimeout, PixivApiClient::Error
      # Best effort: outside the test environment a failed lookup is ignored
      # and the URL normalized so far is used as-is.
      raise if Rails.env.test?
    end

    # Strip trailing slashes, force http:// again in case the strategy handed
    # back an https URL, then append the single canonical trailing slash.
    url = url.gsub(/\/+\Z/, "")
    url = url.sub(%r{\Ahttps://}, "http://")
    url + "/"
  end

  # before_validation callback: interprets a leading "-" on `url` as an
  # "inactive" marker. Only the first dash is removed.
  def parse_prefix
    return unless url =~ /\A-/

    self.url = url[1..-1]
    self.is_active = false
  end

  # Ranks this URL by the site it points to, based on `normalized_url`.
  #
  # @return [Integer] 10, 15, 20 or 100 depending on which pattern matches
  def priority
    if normalized_url =~ /pixiv\.net\/member\.php/
      10
    elsif normalized_url =~ /seiga\.nicovideo\.jp\/user\/illust/
      10
    elsif normalized_url =~ /twitter\.com/ && normalized_url !~ /status/
      # Twitter URLs that contain "status" fall through to the later branches.
      15
    elsif normalized_url =~ /tumblr|patreon|deviantart|artstation/
      20
    else
      100
    end
  end

  # before_validation callback: recomputes `normalized_url` from `url`.
  def normalize
    self.normalized_url = self.class.normalize(url)
  end

  # before_validation callback (create only): seeds `normalized_url` with the
  # raw `url`.
  def initialize_normalized_url
    self.normalized_url = url
  end

  # Renders the URL the way it is entered: prefixed with "-" when inactive.
  #
  # @return [String]
  def to_s
    is_active? ? url : "-#{url}"
  end

  # Validation: the URL must parse and use the http or https scheme.
  #
  # Addressable::URI.parse returns nil for a nil URL, so the scheme is read
  # with safe navigation; a missing URL then yields a validation error here
  # (in addition to the presence error) instead of raising NoMethodError.
  def validate_url_format
    uri = Addressable::URI.parse(url)
    scheme = uri&.scheme
    errors[:url] << "#{uri} must begin with http:// or https://" unless %w[http https].include?(scheme)
  rescue Addressable::URI::InvalidURIError => error
    errors[:url] << "is malformed: #{error}"
  end
end