2021-07-28 13:20:12 -04:00
|
|
|
# typed: true
|
2020-08-08 07:16:06 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Homebrew
|
|
|
|
module Livecheck
|
|
|
|
module Strategy
|
2020-11-05 17:17:03 -05:00
|
|
|
# The {Apache} strategy identifies versions of software at apache.org
|
2020-08-08 07:16:06 +05:30
|
|
|
# by checking directory listing pages.
|
|
|
|
#
|
2021-10-23 22:54:20 -04:00
|
|
|
# Most Apache URLs start with `https://www.apache.org/dyn/` and include
|
2021-10-19 10:01:39 -04:00
|
|
|
# a `filename` or `path` query string parameter where the value is a
|
|
|
|
# path to a file. The path takes one of the following formats:
|
2020-11-05 17:17:03 -05:00
|
|
|
#
|
2020-08-08 07:16:06 +05:30
|
|
|
# * `example/1.2.3/example-1.2.3.tar.gz`
|
|
|
|
# * `example/example-1.2.3/example-1.2.3.tar.gz`
|
|
|
|
# * `example/example-1.2.3-bin.tar.gz`
|
|
|
|
#
|
2021-10-23 22:54:20 -04:00
|
|
|
# This strategy also handles a few common mirror/backup URLs where the
|
|
|
|
# path is provided outside of a query string parameter (e.g.
|
|
|
|
# `https://archive.apache.org/dist/example/1.2.3/example-1.2.3.tar.gz`).
|
|
|
|
#
|
2021-10-19 10:01:39 -04:00
|
|
|
# When the path contains a version directory (e.g. `/1.2.3/`,
|
2020-08-08 07:16:06 +05:30
|
|
|
# `/example-1.2.3/`, etc.), the default regex matches numeric versions
|
|
|
|
# in directory names. Otherwise, the default regex matches numeric
|
|
|
|
# versions in filenames.
|
|
|
|
#
|
|
|
|
# @api public
|
|
|
|
class Apache
|
2021-04-04 03:00:34 +02:00
|
|
|
extend T::Sig
|
|
|
|
|
2020-08-08 07:16:06 +05:30
|
|
|
# The `Regexp` used to determine if the strategy applies to the URL.
#
# The pattern is anchored with `\A` so the scheme has to appear at the
# very start of the string. (`^` would also match at the start of any
# later line of a multi-line string.) There is deliberately no end
# anchor: anything after the first version-like segment is ignored.
#
# The `path`, `prefix` and `suffix` named captures are read by
# `generate_input_values` to build the default URL and regex.
URL_MATCH_REGEX = %r{
  \Ahttps?://
  (?:www\.apache\.org/dyn/.+(?:path|filename)=/?|
  archive\.apache\.org/dist/|
  dlcdn\.apache\.org/|
  downloads\.apache\.org/)
  (?<path>.+?)/      # Path to directory of files or version directories
  (?<prefix>[^/]*?)  # Any text in filename or directory before version
  v?\d+(?:\.\d+)+    # The numeric version
  (?<suffix>/|[^/]*) # Any text in filename or directory after version
}ix.freeze
|
2020-08-08 07:16:06 +05:30
|
|
|
|
|
|
|
# Whether the strategy can be applied to the provided URL.
|
2020-11-05 17:17:03 -05:00
|
|
|
#
|
2020-08-08 07:16:06 +05:30
|
|
|
# @param url [String] the URL to match against
|
|
|
|
# @return [Boolean]
|
2021-08-10 18:24:51 -04:00
|
|
|
sig { params(url: String).returns(T::Boolean) }
|
2020-08-08 07:16:06 +05:30
|
|
|
def self.match?(url)
  # Only a yes/no answer is needed here, so use `match?` and skip
  # building a `MatchData` object.
  url.match?(URL_MATCH_REGEX)
end
|
|
|
|
|
2021-07-28 13:20:12 -04:00
|
|
|
# Extracts information from a provided URL and uses it to generate
|
|
|
|
# various input values used by the strategy to check for new versions.
|
|
|
|
# Some of these values act as defaults and can be overridden in a
|
|
|
|
# `livecheck` block.
|
|
|
|
#
|
|
|
|
# @param url [String] the URL used to generate values
|
|
|
|
# @return [Hash]
|
|
|
|
sig { params(url: String).returns(T::Hash[Symbol, T.untyped]) }
|
|
|
|
def self.generate_input_values(url)
  url_parts = url.match(URL_MATCH_REGEX)
  # Nothing can be derived from a URL the strategy doesn't recognise.
  return {} if url_parts.nil?

  # Turns literal URL text into regex source. `Regexp.escape` also
  # escapes hyphens, which is undone here so the generated regex stays
  # readable.
  literal = ->(text) { Regexp.escape(text || "").gsub("\\-", "-") }

  # Use `\.t` instead of specific tarball extensions (e.g. .tar.gz)
  generic_suffix = url_parts[:suffix]&.sub(Strategy::TARBALL_EXTENSION_REGEX, ".t")

  before_version = literal.call(url_parts[:prefix])
  after_version = literal.call(generic_suffix)

  {
    # Example URL: `https://archive.apache.org/dist/example/`
    url:   "https://archive.apache.org/dist/#{url_parts[:path]}/",
    # Example directory regex: `%r{href=["']?v?(\d+(?:\.\d+)+)/}i`
    # Example file regexes:
    # * `/href=["']?example-v?(\d+(?:\.\d+)+)\.t/i`
    # * `/href=["']?example-v?(\d+(?:\.\d+)+)-bin\.zip/i`
    regex: /href=["']?#{before_version}v?(\d+(?:\.\d+)+)#{after_version}/i,
  }
end
|
|
|
|
|
2020-08-08 07:16:06 +05:30
|
|
|
# Generates a URL and regex (if one isn't provided) and passes them
|
2020-11-05 17:17:03 -05:00
|
|
|
# to {PageMatch.find_versions} to identify versions in the content.
|
|
|
|
#
|
2020-08-08 07:16:06 +05:30
|
|
|
# @param url [String] the URL of the content to check
|
|
|
|
# @param regex [Regexp] a regex used for matching versions in content
|
|
|
|
# @return [Hash]
|
2021-04-04 03:00:34 +02:00
|
|
|
sig {
|
|
|
|
params(
|
2021-08-12 11:54:29 -04:00
|
|
|
url: String,
|
|
|
|
regex: T.nilable(Regexp),
|
|
|
|
unused: T.nilable(T::Hash[Symbol, T.untyped]),
|
Handle variable strategy block arguments
There are times where a regex isn't needed in a `strategy` block and
these changes explicitly handle that situation.
This allows the Symbol Proc format used in some `Sparkle` `livecheck`
blocks (e.g., `strategy :sparkle, &:version`) to continue working
instead of failing with a "wrong number of arguments (given 1,
expected 0)" error. This error would occur because a Symbol Proc only
expects one argument (e.g., an `Item`, not an `Item` and a
regex/nil).
There's an argument to be made for avoiding the Symbol Proc format
for `strategy` blocks but I haven't found a way of selectively
disabling the Style/SymbolProc cop only for a `strategy` DSL method
call. That is to say, if we don't use the Symbol Proc format, `brew
style` will give a "Pass &:version as an argument to strategy instead
of a block." offense.
Besides that, this also replaces the `block` type signatures in
livecheck strategies with `T.untyped`. Sorbet doesn't know how to
handle a `Proc` with a variable number of arguments and can't be
taught how (i.e., `T.any` with a `Proc` signature for each variation
doesn't work). The aforementioned changes cause Sorbet to complain
about there being both too many and too few arguments, so the only
way to win is not to play the game. Hopefully we can restore the
`block` type signatures in the future (if upstream resolves this
years-old issue) but `T.untyped` seems to be our only option for now.
2021-11-19 22:42:15 -05:00
|
|
|
block: T.untyped,
|
2021-04-04 03:00:34 +02:00
|
|
|
).returns(T::Hash[Symbol, T.untyped])
|
|
|
|
}
|
2021-08-12 11:54:29 -04:00
|
|
|
def self.find_versions(url:, regex: nil, **unused, &block)
  # Values derived from the URL; the generated regex is only a fallback
  # for when the caller does not pass one.
  defaults = generate_input_values(url)

  PageMatch.find_versions(
    url:   defaults[:url],
    regex: regex || defaults[:regex],
    **unused,
    &block
  )
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|