2020-10-10 14:16:11 +02:00
|
|
|
# typed: false
|
2020-08-08 07:16:06 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Homebrew
  module Livecheck
    module Strategy
      # The {Apache} strategy identifies versions of software at apache.org
      # by checking directory listing pages.
      #
      # Apache URLs start with `https://www.apache.org/dyn/closer.lua?path=`.
      # The `path` parameter takes one of the following formats:
      #
      # * `example/1.2.3/example-1.2.3.tar.gz`
      # * `example/example-1.2.3/example-1.2.3.tar.gz`
      # * `example/example-1.2.3-bin.tar.gz`
      #
      # When the `path` contains a version directory (e.g. `/1.2.3/`,
      # `/example-1.2.3/`, etc.), the default regex matches numeric versions
      # in directory names. Otherwise, the default regex matches numeric
      # versions in filenames.
      #
      # @api public
      class Apache
        extend T::Sig

        # The `Regexp` used to determine if the strategy applies to the URL.
        # Its named captures (`path`, `prefix`, `suffix`) are reused by
        # {find_versions} to build the listing page URL and the default regex.
        URL_MATCH_REGEX = %r{
          ^https?://www\.apache\.org
          /dyn/.+path=
          (?<path>.+?)/ # Path to directory of files or version directories
          (?<prefix>[^/]*?) # Any text in filename or directory before version
          v?\d+(?:\.\d+)+ # The numeric version
          (?<suffix>/|[^/]*) # Any text in filename or directory after version
        }ix.freeze

        # Whether the strategy can be applied to the provided URL.
        #
        # @param url [String] the URL to match against
        # @return [Boolean]
        def self.match?(url)
          URL_MATCH_REGEX.match?(url)
        end

        # Generates a URL and regex (if one isn't provided) and passes them
        # to {PageMatch.find_versions} to identify versions in the content.
        #
        # @param url [String] the URL of the content to check
        # @param regex [Regexp, nil] a regex used for matching versions in
        #   content; when `nil`, a default is generated from the URL
        # @param cask [Cask::Cask, nil] forwarded unchanged to
        #   {PageMatch.find_versions}
        # @param block [Proc, nil] forwarded unchanged to
        #   {PageMatch.find_versions}
        # @return [Hash] whatever {PageMatch.find_versions} returns
        # @raise [ArgumentError] if `url` does not match {URL_MATCH_REGEX}
        sig {
          params(
            url: String,
            regex: T.nilable(Regexp),
            cask: T.nilable(Cask::Cask),
            block: T.nilable(T.proc.params(arg0: String).returns(T.any(T::Array[String], String))),
          ).returns(T::Hash[Symbol, T.untyped])
        }
        def self.find_versions(url, regex = nil, cask: nil, &block)
          match = url.match(URL_MATCH_REGEX)

          # Without this guard a non-Apache URL would fail below with an
          # opaque `NoMethodError` on `nil` instead of a meaningful message.
          raise ArgumentError, "URL does not match the Apache strategy: #{url}" unless match

          # Use `\.t` instead of specific tarball extensions (e.g. .tar.gz).
          # The replacement string is the plain text `.t`; it only becomes
          # `\.t` once it is passed through `Regexp.escape` below.
          suffix = match[:suffix].sub(/\.t(?:ar\..+|[a-z0-9]+)$/i, "\.t")

          # Example URL: `https://archive.apache.org/dist/example/`
          page_url = "https://archive.apache.org/dist/#{match[:path]}/"

          # Example directory regex: `%r{href=["']?v?(\d+(?:\.\d+)+)/}i`
          # Example file regexes:
          # * `/href=["']?example-v?(\d+(?:\.\d+)+)\.t/i`
          # * `/href=["']?example-v?(\d+(?:\.\d+)+)-bin\.zip/i`
          regex ||= /href=["']?#{Regexp.escape(match[:prefix])}v?(\d+(?:\.\d+)+)#{Regexp.escape(suffix)}/i

          PageMatch.find_versions(page_url, regex, cask: cask, &block)
        end
      end
    end
  end
end
|