# typed: true
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Homebrew
|
|
|
|
module Livecheck
|
|
|
|
module Strategy
|
2020-11-05 17:17:03 -05:00
|
|
|
# The {PageMatch} strategy fetches content at a URL and scans it for
# matching text using the provided regex.
#
# This strategy can be used in a `livecheck` block when no specific
# strategies apply to a given URL. Though {PageMatch} will technically
# match any HTTP URL, the strategy also requires a regex to function.
#
# The {find_versions} method is also used within other strategies,
# to handle the process of identifying version text in content.
#
# @api public
|
|
|
|
class PageMatch
|
2020-12-24 03:33:14 +01:00
|
|
|
extend T::Sig
|
|
|
|
|
2020-08-08 07:16:06 +05:30
|
|
|
# Human-readable name of the strategy.
NICE_NAME = "Page match"

# A priority of zero causes livecheck to skip the strategy. We do this
# for {PageMatch} so we can selectively apply it only when a regex is
# provided in a `livecheck` block.
PRIORITY = 0

# The `Regexp` used to determine if the strategy applies to the URL.
# It accepts an `http://` or `https://` prefix, case-insensitively.
URL_MATCH_REGEX = %r{^https?://}i.freeze
|
|
|
|
|
|
|
|
# Whether the strategy can be applied to the provided URL.
# {PageMatch} will technically match any HTTP URL but is only
# usable with a `livecheck` block containing a regex.
#
# @param url [String] the URL to match against
# @return [Boolean]
sig { params(url: String).returns(T::Boolean) }
|
2020-08-08 07:16:06 +05:30
|
|
|
def self.match?(url)
  # Applicability is decided purely by the URL prefix pattern held in
  # URL_MATCH_REGEX; `match?` returns a plain true/false.
  URL_MATCH_REGEX.match?(url)
end
|
|
|
|
|
2020-12-22 22:46:52 -05:00
|
|
|
# Uses the regex to match text in the content or, if a block is
# provided, passes the page content to the block to handle matching.
# With either approach, an array of unique matches is returned.
#
# @param content [String] the page content to check
# @param regex [Regexp] a regex used for matching versions in the
#   content
# @param block [Proc, nil] optional block that receives the content and
#   the regex and returns a string, an array of strings, or `nil`
# @return [Array<String>]
sig {
  params(
    content: String,
    regex: Regexp,
    block: T.nilable(
      T.proc.params(arg0: String, arg1: Regexp).returns(T.any(String, T::Array[String], NilClass)),
    ),
  ).returns(T::Array[String])
}
|
2021-08-10 11:09:55 -04:00
|
|
|
def self.versions_from_content(content, regex, &block)
  # A supplied block takes over matching entirely; whatever it returns is
  # handed to Strategy.handle_block_return and that result is returned.
  return Strategy.handle_block_return(block.call(content, regex)) if block

  # String#scan produces a String per match when the regex has no capture
  # groups and an Array of captures when it does. Only the first capture
  # is kept; a first capture that did not participate (nil) is removed by
  # `compact`, and duplicates are removed by `uniq`.
  content.scan(regex).map do |match|
    case match
    when String
      match
    when Array
      match.first
    end
  end.compact.uniq
end
|
|
|
|
|
|
|
|
# Checks the content at the URL for new versions, using the provided
# regex for matching.
#
# @param url [String] the URL of the content to check
# @param regex [Regexp] a regex used for matching versions
# @param provided_content [String, nil] page content to use in place of
#   fetching via Strategy.page_content
# @param _unused [Hash, nil] any other keyword arguments; accepted and
#   ignored
# @param block [Proc, nil] optional block that receives the content and
#   the regex and returns a string, an array of strings, or `nil`
# @return [Hash]
sig {
  params(
    url: String,
    regex: Regexp,
    provided_content: T.nilable(String),
    _unused: T.nilable(T::Hash[Symbol, T.untyped]),
    block: T.nilable(
      T.proc.params(arg0: String, arg1: Regexp).returns(T.any(String, T::Array[String], NilClass)),
    ),
  ).returns(T::Hash[Symbol, T.untyped])
}
|
2021-08-12 11:54:29 -04:00
|
|
|
def self.find_versions(url:, regex:, provided_content: nil, **_unused, &block)
  match_data = { matches: {}, regex: regex, url: url }
  # Bail out with the empty result when there is no URL, or when neither
  # a regex nor a block is available to do the matching.
  return match_data if url.blank? || (regex.blank? && block.blank?)

  content = if provided_content.is_a?(String)
    # Caller-supplied content is used as-is and the result is flagged.
    match_data[:cached] = true
    provided_content
  else
    # Everything Strategy.page_content returns is merged into the result;
    # the page body is then read back from the :content key.
    match_data.merge!(Strategy.page_content(url))
    match_data[:content]
  end
  return match_data if content.blank?

  # Key each matched string to a Version built from that same string.
  versions_from_content(content, regex, &block).each do |match_text|
    match_data[:matches][match_text] = Version.new(match_text)
  end

  match_data
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|