# frozen_string_literal: true

# Stateless helpers for parsing, encoding and rewriting URLs.
class UrlHelper

  # At the moment this handles invalid URLs that browser address bar accepts
  # where second # is not encoded
  #
  # Longer term we can add support of simpleidn and encode unicode domains
  #
  # Returns the parsed URI, or nil when +url+ is nil or cannot be parsed.
  def self.relaxed_parse(url)
    return if url.nil?

    base, fragment = url.split("#", 2)
    # URI.parse either returns a URI or raises a URI::Error (rescued below).
    uri = URI.parse(base)

    # Addressable::URI::CharacterClasses::UNRESERVED is used here because without it
    # the # in the fragment is not encoded
    if fragment&.include?("#")
      fragment = Addressable::URI.encode_component(fragment, Addressable::URI::CharacterClasses::UNRESERVED)
    end

    uri.fragment = fragment
    uri
  rescue URI::Error
    nil
  end

  # Encodes +url+ with Addressable and parses the result with URI.parse.
  # URI.parse errors are not rescued here.
  def self.encode_and_parse(url)
    URI.parse(Addressable::URI.encode(url))
  end

  # Delegates to Addressable::URI.encode.
  def self.encode(url)
    Addressable::URI.encode(url)
  end

  # Delegates to Addressable::URI.unencode.
  def self.unencode(url)
    Addressable::URI.unencode(url)
  end

  # Delegates to Addressable::URI.encode_component using its default
  # character class.
  def self.encode_component(url_component)
    Addressable::URI.encode_component(url_component)
  end

  # Whether +url+ points at this site: it is a known upload of the current
  # store, a static asset path under the base URI, or it starts with the
  # asset host (falling back to the site's base URL when no asset host is set).
  # Returns false for blank input.
  def self.is_local(url)
    url.present? && (
      Discourse.store.has_been_uploaded?(url) ||
      # The base URI is escaped so it is matched literally, and \A pins the
      # match to the very start of the string rather than the start of any line.
      url.match?(%r{\A#{Regexp.escape(Discourse.base_uri.to_s)}/(assets|plugins|images)/}) ||
      url.start_with?(Discourse.asset_host || Discourse.base_url_no_prefix)
    )
  end

  # Turns a root-relative path ("/foo", but not "//foo") into an absolute URL
  # by prefixing +cdn+, or the site's base URL when +cdn+ is nil.
  # A protocol-relative +cdn+ ("//host") is given an "https:" scheme first.
  # Anything that is not a root-relative path is returned unchanged.
  def self.absolute(url, cdn = Discourse.asset_host)
    cdn = "https:#{cdn}" if cdn&.start_with?("//")
    # \A (not ^) so only the start of the whole string is considered.
    url&.match?(%r{\A/[^/]}) ? (cdn || Discourse.base_url_no_prefix) + url : url
  end

  # Same as +absolute+, but always prefixes the site's base URL, never a CDN.
  def self.absolute_without_cdn(url)
    absolute(url, nil)
  end

  # Strips a leading "http:" (case-insensitive) so the URL becomes
  # protocol-relative. Other schemes, including "https:", are left alone.
  def self.schemaless(url)
    url.sub(/\Ahttp:/i, "")
  end

  # Maps an upload URL through Upload.secure_media_url_from_upload_url and
  # makes the result absolute against the site's base URL (no CDN).
  def self.secure_proxy_without_cdn(url)
    absolute(Upload.secure_media_url_from_upload_url(url), nil)
  end

  # Prevents double URL encode
  # https://stackoverflow.com/a/37599235
  #
  # The value is first unencoded, then HTML entities are unescaped, and only
  # then is it encoded again. S3 presigned URLs are returned untouched.
  def self.escape_uri(uri)
    return uri if s3_presigned_url?(uri)
    UrlHelper.encode_component(CGI.unescapeHTML(UrlHelper.unencode(uri)))
  end

  # True when +url+ contains an "x-amz-algorithm" or "x-amz-credential"
  # marker, compared case-insensitively.
  def self.s3_presigned_url?(url)
    url.match?(/x-amz-algorithm|x-amz-credential/i)
  end

  # Rewrites a local URL for use in cooked content.
  #
  # Non-local URLs are returned unchanged. With +secure+ the URL is routed
  # through the secure media proxy; otherwise it is made absolute and, unless
  # it is an attachment on a site that restricts downloads, passed through the
  # store's CDN. The result is protocol-relative when its scheme was "http:".
  # If a URI::Error is raised along the way, the URL as it stands at that
  # point is returned.
  def self.cook_url(url, secure: false)
    return url unless is_local(url)

    uri = URI.parse(url)
    filename = File.basename(uri.path)
    is_attachment = !FileHelper.is_supported_media?(filename)

    no_cdn = SiteSetting.login_required || SiteSetting.prevent_anons_from_downloading_files

    url = secure ? secure_proxy_without_cdn(url) : absolute_without_cdn(url)

    # we always want secure media to come from
    # Discourse.base_url_no_prefix/secure-media-uploads
    # to avoid asset_host mixups
    return schemaless(url) if secure

    unless is_attachment && no_cdn
      url = Discourse.store.cdn_url(url)
      url = local_cdn_url(url) if Discourse.store.external?
    end

    schemaless(url)
  rescue URI::Error
    url
  end

  # Points +url+ at the configured asset host. Returns +url+ unchanged when
  # no asset host is set. Paths under the store's upload path get the asset
  # host prepended; otherwise the first occurrence of the site's base URL is
  # replaced by the asset host.
  def self.local_cdn_url(url)
    return url if Discourse.asset_host.blank?

    if url.start_with?("/#{Discourse.store.upload_path}/")
      "#{Discourse.asset_host}#{url}"
    else
      url.sub(Discourse.base_url_no_prefix, Discourse.asset_host)
    end
  end

end
|