FIX: ignore canonical link to localhost (#13577)

This commit is contained in:
Arpit Jalan
2021-06-30 13:55:17 +05:30
committed by GitHub
parent 6986b36985
commit b63c9febe8
2 changed files with 18 additions and 1 deletion

View File

@@ -36,7 +36,7 @@ module Onebox
# prefer canonical link
canonical_link = doc.at('//link[@rel="canonical"]/@href')
canonical_uri = Addressable::URI.parse(canonical_link)
-if canonical_link && "#{canonical_uri.host}#{canonical_uri.path}" != "#{uri.host}#{uri.path}"
+if canonical_link && "#{canonical_uri.host}#{canonical_uri.path}" != "#{uri.host}#{uri.path}" && canonical_uri.host != "localhost"
response = (fetch_response(canonical_uri.to_s, headers: headers, body_cacher: body_cacher) rescue nil)
doc = Nokogiri::HTML(response) if response
end