2021-07-28 13:20:12 -04:00
|
|
|
# typed: true
|
2020-08-08 07:16:06 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Homebrew
|
|
|
|
module Livecheck
|
|
|
|
module Strategy
|
2020-11-05 17:17:03 -05:00
|
|
|
# The {Pypi} strategy identifies versions of software at pypi.org by
|
2020-08-08 07:16:06 +05:30
|
|
|
# checking project pages for archive files.
|
|
|
|
#
|
|
|
|
# PyPI URLs have a standard format but the hexadecimal text between
|
|
|
|
# `/packages/` and the filename varies:
|
2020-11-05 17:17:03 -05:00
|
|
|
#
|
2020-08-08 07:16:06 +05:30
|
|
|
# * `https://files.pythonhosted.org/packages/<hex>/<hex>/<long_hex>/example-1.2.3.tar.gz`
|
|
|
|
#
|
|
|
|
# As such, the default regex only targets the filename at the end of the
|
|
|
|
# URL.
|
|
|
|
#
|
|
|
|
# @api public
|
|
|
|
class Pypi
|
|
|
|
# Display-friendly spelling of the strategy name (presumably used in
# output; confirm against callers).
NICE_NAME = "PyPI"

# The `Regexp` used to extract the package name and suffix (e.g. file
# extension) from the URL basename.
#
# The literal uses the `x` flag, so whitespace and the inline comments are
# ignored; it must contain nothing except the pattern itself, as any stray
# `|` would add an empty alternative that matches every string.
FILENAME_REGEX = /
  (?<package_name>.+)- # The package name followed by a hyphen
  .*? # The version string
  (?<suffix>\.tar\.[a-z0-9]+|\.[a-z0-9]+)$ # Filename extension
/ix

# The `Regexp` used to determine if the strategy applies to the URL.
#
# The filename portion reuses the source of {FILENAME_REGEX}. `strip`
# removes the newline and indentation that surround the pattern in that
# literal, and since this literal also uses the `x` flag the embedded
# inline comments remain comments.
URL_MATCH_REGEX = %r{
  ^https?://files\.pythonhosted\.org
  /packages
  (?:/[^/]+)+ # The hexadecimal paths before the filename
  /#{FILENAME_REGEX.source.strip} # The filename
}ix
|
2020-08-08 07:16:06 +05:30
|
|
|
|
|
|
|
# Reports whether this strategy is applicable to the provided URL, i.e.
# whether the URL matches {URL_MATCH_REGEX}.
#
# @param url [String] the URL to test
# @return [Boolean] `true` if the URL matches, otherwise `false`
sig { params(url: String).returns(T::Boolean) }
def self.match?(url)
  url.match?(URL_MATCH_REGEX)
end
|
|
|
|
|
2021-07-28 13:20:12 -04:00
|
|
|
# Derives the strategy's input values from a provided URL: the PyPI
# project page to check and a regex that matches versions in the archive
# links found there. Some of these values act as defaults and can be
# overridden in a `livecheck` block.
#
# @param url [String] the URL used to generate values
# @return [Hash] the `:url` and `:regex` values, or an empty hash when the
#   URL's basename doesn't match {FILENAME_REGEX}
sig { params(url: String).returns(T::Hash[Symbol, T.untyped]) }
def self.generate_input_values(url)
  filename_match = FILENAME_REGEX.match(File.basename(url))
  return {} if filename_match.blank?

  package_name = T.must(filename_match[:package_name])

  # Use `\.t` instead of specific tarball extensions (e.g. .tar.gz)
  suffix = T.must(filename_match[:suffix]).sub(Strategy::TARBALL_EXTENSION_REGEX, ".t")

  # `Regexp.escape` escapes hyphens, so restore them to a plain `-`.
  regex_name = Regexp.escape(package_name).gsub("\\-", "-")
  regex_suffix = Regexp.escape(suffix).gsub("\\-", "-")

  # It's not technically necessary to have the `#files` fragment at the
  # end of the URL but it makes the debug output a bit more useful.
  project_url = "https://pypi.org/project/#{package_name.gsub(/%20|_/, "-")}/#files"

  # Example regex: `%r{href=.*?/packages.*?/example[._-]v?(\d+(?:\.\d+)*(?:[._-]post\d+)?)\.t}i`
  version_regex =
    %r{href=.*?/packages.*?/#{regex_name}[._-]v?(\d+(?:\.\d+)*(?:[._-]post\d+)?)#{regex_suffix}}i

  { url: project_url, regex: version_regex }
end
|
|
|
|
|
2020-08-08 07:16:06 +05:30
|
|
|
# Generates a URL and regex from the provided URL and passes them to
# {PageMatch.find_versions} to identify versions in the content. The
# generated regex is only used when one isn't provided, whereas the page
# that is checked is always the generated URL rather than `url` itself.
#
# @param url [String] the URL of the content to check
# @param regex [Regexp, nil] a regex used for matching versions in content
# @param unused [Hash] any other keyword arguments, which are forwarded
#   to {PageMatch.find_versions} unchanged
# @param block [Proc, nil] a block that is forwarded to
#   {PageMatch.find_versions}
# @return [Hash]
sig {
  params(
    url: String,
    regex: T.nilable(Regexp),
    unused: T.nilable(T::Hash[Symbol, T.untyped]),
    block: T.nilable(Proc),
  ).returns(T::Hash[Symbol, T.untyped])
}
def self.find_versions(url:, regex: nil, **unused, &block)
  defaults = generate_input_values(url)
  page_url = defaults[:url]
  version_regex = regex || defaults[:regex]

  PageMatch.find_versions(url: page_url, regex: version_regex, **unused, &block)
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|