# typed: true
# frozen_string_literal: true

module Homebrew
  module Livecheck
    module Strategy
      # The {Apache} strategy identifies versions of software at apache.org
      # by checking directory listing pages.
      #
      # Most Apache URLs start with `https://www.apache.org/dyn/` and include
      # a `filename` or `path` query string parameter where the value is a
      # path to a file. The path takes one of the following formats:
      #
      # * `example/1.2.3/example-1.2.3.tar.gz`
      # * `example/example-1.2.3/example-1.2.3.tar.gz`
      # * `example/example-1.2.3-bin.tar.gz`
      #
      # This strategy also handles a few common mirror/backup URLs where the
      # path is provided outside of a query string parameter (e.g.
      # `https://archive.apache.org/dist/example/1.2.3/example-1.2.3.tar.gz`).
      #
      # When the path contains a version directory (e.g. `/1.2.3/`,
      # `/example-1.2.3/`, etc.), the default regex matches numeric versions
      # in directory names. Otherwise, the default regex matches numeric
      # versions in filenames.
      #
      # @api public
      class Apache
        extend T::Sig

        # The `Regexp` used to determine if the strategy applies to the URL.
        #
        # The named captures (`path`, `prefix`, `suffix`) are read by
        # {generate_input_values} to build the default URL and regex, so
        # their names must stay in sync with that method.
        URL_MATCH_REGEX = %r{
          ^https?://
          (?:www\.apache\.org/dyn/.+(?:path|filename)=/?|
          archive\.apache\.org/dist/|
          dlcdn\.apache\.org/|
          downloads\.apache\.org/)
          (?<path>.+?)/      # Path to directory of files or version directories
          (?<prefix>[^/]*?)  # Any text in filename or directory before version
          v?\d+(?:\.\d+)+    # The numeric version
          (?<suffix>/|[^/]*) # Any text in filename or directory after version
        }ix.freeze

        # Whether the strategy can be applied to the provided URL.
        #
        # @param url [String] the URL to match against
        # @return [Boolean]
        sig { params(url: String).returns(T::Boolean) }
        def self.match?(url)
          URL_MATCH_REGEX.match?(url)
        end

        # Extracts information from a provided URL and uses it to generate
        # various input values used by the strategy to check for new versions.
        # Some of these values act as defaults and can be overridden in a
        # `livecheck` block.
        #
        # @param url [String] the URL used to generate values
        # @return [Hash] a hash with `:url` and `:regex` keys, or an empty
        #   hash when the URL does not match {URL_MATCH_REGEX}
        sig { params(url: String).returns(T::Hash[Symbol, T.untyped]) }
        def self.generate_input_values(url)
          values = {}

          match = url.match(URL_MATCH_REGEX)
          return values if match.blank?

          # Example URL: `https://archive.apache.org/dist/example/`
          values[:url] = "https://archive.apache.org/dist/#{match[:path]}/"

          # `Regexp.escape` escapes hyphens, which is unnecessary outside of a
          # character class, so the escaping is undone to keep the regex tidy.
          regex_prefix = Regexp.escape(match[:prefix] || "").gsub("\\-", "-")

          # Use `\.t` instead of specific tarball extensions (e.g. .tar.gz)
          suffix = match[:suffix]&.sub(Strategy::TARBALL_EXTENSION_REGEX, ".t")
          regex_suffix = Regexp.escape(suffix || "").gsub("\\-", "-")

          # Example directory regex: `%r{href=["']?v?(\d+(?:\.\d+)+)/}i`
          # Example file regexes:
          # * `/href=["']?example-v?(\d+(?:\.\d+)+)\.t/i`
          # * `/href=["']?example-v?(\d+(?:\.\d+)+)-bin\.zip/i`
          values[:regex] = /href=["']?#{regex_prefix}v?(\d+(?:\.\d+)+)#{regex_suffix}/i

          values
        end

        # Generates a URL and regex (if one isn't provided) and passes them
        # to {PageMatch.find_versions} to identify versions in the content.
        #
        # @param url [String] the URL of the content to check
        # @param regex [Regexp, nil] a regex used for matching versions in
        #   content; the generated default regex is used when this is `nil`
        # @param unused [Hash] any other keyword arguments, forwarded as-is
        #   to {PageMatch.find_versions}
        # @param block [Proc, nil] an optional block, forwarded as-is to
        #   {PageMatch.find_versions}
        # @return [Hash]
        sig {
          params(
            url:    String,
            regex:  T.nilable(Regexp),
            unused: T.nilable(T::Hash[Symbol, T.untyped]),
            block:  T.untyped,
          ).returns(T::Hash[Symbol, T.untyped])
        }
        def self.find_versions(url:, regex: nil, **unused, &block)
          generated = generate_input_values(url)

          # The generated listing-page URL always replaces the provided URL,
          # whereas a caller-supplied regex takes priority over the default.
          T.unsafe(PageMatch).find_versions(
            url:   generated[:url],
            regex: regex || generated[:regex],
            **unused,
            &block
          )
        end
      end
    end
  end
end