2020-10-10 14:16:11 +02:00
|
|
|
# typed: false
|
2020-08-08 07:16:06 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Homebrew
|
|
|
|
module Livecheck
|
|
|
|
module Strategy
|
2020-11-05 17:17:03 -05:00
|
|
|
# The {Sourceforge} strategy identifies versions of software at
|
2020-08-08 07:16:06 +05:30
|
|
|
# sourceforge.net by checking a project's RSS feed.
|
|
|
|
#
|
|
|
|
# SourceForge URLs take a few different formats:
|
2020-11-05 17:17:03 -05:00
|
|
|
#
|
|
|
|
# * `https://downloads.sourceforge.net/project/example/example-1.2.3.tar.gz`
|
|
|
|
# * `https://svn.code.sf.net/p/example/code/trunk`
|
|
|
|
# * `:pserver:anonymous:@example.cvs.sourceforge.net:/cvsroot/example`
|
2020-08-08 07:16:06 +05:30
|
|
|
#
|
|
|
|
# The RSS feed for a project contains the most recent release archives
|
2020-11-05 17:17:03 -05:00
|
|
|
# and while this is fine for most projects, this approach has some
|
2020-08-08 07:16:06 +05:30
|
|
|
# shortcomings. Some project releases involve so many files that the one
|
|
|
|
# we're interested in isn't present in the feed content. Some projects
|
|
|
|
# contain additional software and the archive we're interested in is
|
|
|
|
# pushed out of the feed (especially if it hasn't been updated recently).
|
|
|
|
#
|
|
|
|
# Usually we address this situation by adding a `livecheck` block to
|
2021-01-11 17:12:48 -05:00
|
|
|
# the formula/cask that checks the page for the relevant directory in the
|
2020-08-08 07:16:06 +05:30
|
|
|
# project instead. In this situation, it's necessary to use
|
2020-11-05 17:17:03 -05:00
|
|
|
# `strategy :page_match` to prevent the {Sourceforge} strategy from
|
2020-08-08 07:16:06 +05:30
|
|
|
# being used.
|
|
|
|
#
|
|
|
|
# The default regex matches within `url` attributes in the RSS feed
|
|
|
|
# and identifies versions within directory names or filenames.
|
|
|
|
#
|
|
|
|
# @api public
|
|
|
|
class Sourceforge
  extend T::Sig

  NICE_NAME = "SourceForge"

  # The `Regexp` used to determine if the strategy applies to the URL.
  # The `project_name` named capture holds the project identifier, taken
  # from a `/project/<name>/` or `/projects/<name>/` path, a `/p/<name>/`
  # path, or the first path segment (optionally preceded by `:/cvsroot`).
  URL_MATCH_REGEX = %r{
    ^https?://(?:[^/]+?\.)*(?:sourceforge|sf)\.net
    (?:/projects?/(?<project_name>[^/]+)/
    |/p/(?<project_name>[^/]+)/
    |(?::/cvsroot)?/(?<project_name>[^/]+))
  }ix.freeze

  # Whether the strategy can be applied to the provided URL.
  #
  # @param url [String] the URL to match against
  # @return [Boolean]
  sig { params(url: String).returns(T::Boolean) }
  def self.match?(url)
    URL_MATCH_REGEX.match?(url)
  end

  # Generates a URL and regex (if one isn't provided) and passes them
  # to {PageMatch.find_versions} to identify versions in the content.
  #
  # If the URL doesn't match {URL_MATCH_REGEX}, no project name is
  # available to build the RSS feed URL or the default regex, so the
  # URL and regex are handed to {PageMatch.find_versions} as given
  # instead of failing on a `nil` match.
  #
  # @param url [String] the URL of the content to check
  # @param regex [Regexp, nil] a regex used for matching versions in
  #   content; a default is generated from the project name when omitted
  # @param unused [Hash] any other keyword arguments, forwarded untouched
  #   to {PageMatch.find_versions}
  # @param block [Proc, nil] an optional block, forwarded untouched to
  #   {PageMatch.find_versions}
  # @return [Hash]
  sig {
    params(
      url:    String,
      regex:  T.nilable(Regexp),
      unused: T.nilable(T::Hash[Symbol, T.untyped]),
      block:  T.nilable(
        T.proc.params(arg0: String, arg1: Regexp).returns(T.any(String, T::Array[String], NilClass)),
      ),
    ).returns(T::Hash[Symbol, T.untyped])
  }
  def self.find_versions(url:, regex: nil, **unused, &block)
    match = url.match(URL_MATCH_REGEX)

    # Without a match there is no `project_name` capture to work with.
    # Previously this raised `NoMethodError` on `nil`; now the arguments
    # are passed through unchanged.
    # NOTE(review): how PageMatch treats a `nil` regex isn't visible
    # here - confirm it reports that case sensibly.
    if match.nil?
      return PageMatch.find_versions(url: url, regex: regex, **unused, &block)
    end

    project_name = match[:project_name]

    # Don't generate a feed URL if the URL already points to the RSS feed.
    page_url = if url.match?(%r{/rss(?:/?$|\?)})
      url
    else
      "https://sourceforge.net/projects/#{project_name}/rss"
    end

    # It may be possible to improve the default regex but there's quite a
    # bit of variation between projects and it can be challenging to
    # create something that works for most URLs.
    regex ||= %r{url=.*?/#{Regexp.escape(project_name)}/files/.*?[-_/](\d+(?:[-.]\d+)+)[-_/%.]}i

    PageMatch.find_versions(url: page_url, regex: regex, **unused, &block)
  end
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|