# typed: false
# frozen_string_literal: true
module Homebrew
  module Livecheck
    module Strategy
      # The {Cpan} strategy identifies versions of software at
      # cpan.metacpan.org by checking directory listing pages.
      #
      # CPAN URLs take the following formats:
      #
      # * `https://cpan.metacpan.org/authors/id/H/HO/HOMEBREW/Brew-v1.2.3.tar.gz`
      # * `https://cpan.metacpan.org/authors/id/H/HO/HOMEBREW/brew/brew-v1.2.3.tar.gz`
      #
      # In these examples, `HOMEBREW` is the author name and the preceding `H`
      # and `HO` directories correspond to the first letter(s). Some authors
      # also store files in subdirectories, as in the second example above.
      #
      # @api public
      class Cpan
        extend T::Sig

        NICE_NAME = "CPAN"

        # The `Regexp` used to determine if the strategy applies to the URL.
        # Its named captures (`path`, `prefix`, `suffix`) are reused by
        # {find_versions} to build the listing page URL and default regex.
        URL_MATCH_REGEX = %r{
          ^https?://cpan\.metacpan\.org
          (?<path>/authors/id(?:/[^/]+){3,}/) # Path before the filename
          (?<prefix>[^/]+) # Filename text before the version
          -v?\d+(?:\.\d+)* # The numeric version
          (?<suffix>[^/]+) # Filename text after the version
        }ix.freeze

        # Whether the strategy can be applied to the provided URL.
        #
        # @param url [String] the URL to match against
        # @return [Boolean]
        sig { params(url: String).returns(T::Boolean) }
        def self.match?(url)
          URL_MATCH_REGEX.match?(url)
        end

        # Generates a URL and regex (if one isn't provided) and passes them
        # to {PageMatch.find_versions} to identify versions in the content.
        #
        # @param url [String] the URL of the content to check
        # @param regex [Regexp, nil] a regex used for matching versions in
        #   content; when `nil`, one is generated from the filename in `url`
        # @param cask [Cask::Cask, nil] passed through to
        #   {PageMatch.find_versions}
        # @param block [Proc, nil] passed through to
        #   {PageMatch.find_versions}
        # @return [Hash]
        # @raise [ArgumentError] if `url` does not match {URL_MATCH_REGEX}
        sig {
          params(
            url:   String,
            regex: T.nilable(Regexp),
            cask:  T.nilable(Cask::Cask),
            block: T.nilable(
              T.proc.params(arg0: String, arg1: Regexp).returns(T.any(String, T::Array[String], NilClass)),
            ),
          ).returns(T::Hash[Symbol, T.untyped])
        }
        def self.find_versions(url, regex, cask: nil, &block)
          match = url.match(URL_MATCH_REGEX)
          # Fail with a descriptive error instead of a `NoMethodError` on
          # `nil` when the URL is not a recognised CPAN archive URL.
          raise ArgumentError, "#{NICE_NAME} strategy cannot be applied to URL: #{url}" if match.nil?

          # Use `\.t` instead of specific tarball extensions (e.g. .tar.gz)
          suffix = match[:suffix].sub(/\.t(?:ar\..+|[a-z0-9]+)$/i, ".t")

          # The directory listing page where the archive files are found
          page_url = "https://cpan.metacpan.org#{match[:path]}"

          # The prefix comes straight from the filename, so escape it to
          # have any regex metacharacters it contains match literally.
          prefix = Regexp.escape(match[:prefix])

          # Example regex: `/href=.*?Brew[._-]v?(\d+(?:\.\d+)*)\.t/i`
          regex ||= /href=.*?#{prefix}[._-]v?(\d+(?:\.\d+)*)#{Regexp.escape(suffix)}/i

          PageMatch.find_versions(page_url, regex, cask: cask, &block)
        end
      end
    end
  end
end