From 631fb78db78a58216ca0340411b9bd2e43dc958e Mon Sep 17 00:00:00 2001 From: Scrub <72096833+ScrubN@users.noreply.github.com> Date: Fri, 19 Jul 2024 23:40:15 -0400 Subject: [PATCH] Improve ID parsing (#1158) * Annotate TwitchRegex.Match* with [return: MaybeNull] * Support URLs ending with / * Add tests * Move id parsing related functions to IdParse, TwitchRegexTests -> IdParseTests --- TwitchDownloaderCLI/Modes/DownloadChat.cs | 2 +- TwitchDownloaderCLI/Modes/DownloadClip.cs | 2 +- TwitchDownloaderCLI/Modes/DownloadVideo.cs | 2 +- .../ToolTests/IdParseTests.cs | 134 ++++++++++++++++++ TwitchDownloaderCore/Tools/IdParse.cs | 71 ++++++++++ TwitchDownloaderCore/Tools/TwitchRegex.cs | 54 ------- TwitchDownloaderWPF/PageChatDownload.xaml.cs | 2 +- TwitchDownloaderWPF/PageClipDownload.xaml.cs | 2 +- TwitchDownloaderWPF/PageVodDownload.xaml.cs | 2 +- 9 files changed, 211 insertions(+), 60 deletions(-) create mode 100644 TwitchDownloaderCore.Tests/ToolTests/IdParseTests.cs create mode 100644 TwitchDownloaderCore/Tools/IdParse.cs diff --git a/TwitchDownloaderCLI/Modes/DownloadChat.cs b/TwitchDownloaderCLI/Modes/DownloadChat.cs index 152cc780..07a8ba45 100644 --- a/TwitchDownloaderCLI/Modes/DownloadChat.cs +++ b/TwitchDownloaderCLI/Modes/DownloadChat.cs @@ -31,7 +31,7 @@ private static ChatDownloadOptions GetDownloadOptions(ChatDownloadArgs inputOpti Environment.Exit(1); } - var vodClipIdMatch = TwitchRegex.MatchVideoOrClipId(inputOptions.Id); + var vodClipIdMatch = IdParse.MatchVideoOrClipId(inputOptions.Id); if (vodClipIdMatch is not { Success: true }) { logger.LogError("Unable to parse Vod/Clip ID/URL."); diff --git a/TwitchDownloaderCLI/Modes/DownloadClip.cs b/TwitchDownloaderCLI/Modes/DownloadClip.cs index 24c44c26..a3e137a4 100644 --- a/TwitchDownloaderCLI/Modes/DownloadClip.cs +++ b/TwitchDownloaderCLI/Modes/DownloadClip.cs @@ -36,7 +36,7 @@ private static ClipDownloadOptions GetDownloadOptions(ClipDownloadArgs inputOpti Environment.Exit(1); } - var clipIdMatch = TwitchRegex.MatchClipId(inputOptions.Id); + var clipIdMatch = IdParse.MatchClipId(inputOptions.Id); if (clipIdMatch is not { Success: true }) { logger.LogError("Unable to parse Clip ID/URL."); diff --git a/TwitchDownloaderCLI/Modes/DownloadVideo.cs b/TwitchDownloaderCLI/Modes/DownloadVideo.cs index 4ab857b8..fe0043df 100644 --- a/TwitchDownloaderCLI/Modes/DownloadVideo.cs +++ b/TwitchDownloaderCLI/Modes/DownloadVideo.cs @@ -34,7 +34,7 @@ private static VideoDownloadOptions GetDownloadOptions(VideoDownloadArgs inputOp Environment.Exit(1); } - var vodIdMatch = TwitchRegex.MatchVideoId(inputOptions.Id); + var vodIdMatch = IdParse.MatchVideoId(inputOptions.Id); if (vodIdMatch is not { Success: true }) { logger.LogError("Unable to parse Vod ID/URL."); diff --git a/TwitchDownloaderCore.Tests/ToolTests/IdParseTests.cs b/TwitchDownloaderCore.Tests/ToolTests/IdParseTests.cs new file mode 100644 index 00000000..713ff682 --- /dev/null +++ b/TwitchDownloaderCore.Tests/ToolTests/IdParseTests.cs @@ -0,0 +1,134 @@ +using TwitchDownloaderCore.Tools; + +namespace TwitchDownloaderCore.Tests.ToolTests +{ + // ReSharper disable StringLiteralTypo + public class IdParseTests + { + [Theory] + [InlineData("41546181")] // Oldest VODs - 8 + [InlineData("982306410")] // Old VODs - 9 + [InlineData("6834869128")] // Current VODs - 10 + [InlineData("11987163407")] // Future VODs - 11 + public void CorrectlyParsesVodId(string id) + { + var match = IdParse.MatchVideoId(id); + + Assert.NotNull(match); + Assert.Equal(id, match.Value); + } + + [Theory] + [InlineData("https://www.twitch.tv/videos/41546181", "41546181")] // Oldest VODs - 8 + [InlineData("https://www.twitch.tv/videos/982306410", "982306410")] // Old VODs - 9 + [InlineData("https://www.twitch.tv/videos/6834869128", "6834869128")] // Current VODs - 10 + [InlineData("https://www.twitch.tv/videos/11987163407", "11987163407")] // Future VODs - 11 + [InlineData("https://www.twitch.tv/kitboga/video/2865132173", "2865132173")] // Alternate highlight URL + [InlineData("https://www.twitch.tv/kitboga/v/2865132173", "2865132173")] // Alternate highlight URL + [InlineData("https://www.twitch.tv/videos/4894164023/", "4894164023")] + public void CorrectlyParsesVodLink(string link, string expectedId) + { + var match = IdParse.MatchVideoId(link); + + Assert.NotNull(match); + Assert.Equal(expectedId, match.Value); + } + + [Theory] + [InlineData("SpineyPieTwitchRPGNurturing")] + [InlineData("FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + public void CorrectlyParsesClipId(string id) + { + var match = IdParse.MatchClipId(id); + + Assert.NotNull(match); + Assert.Equal(id, match.Value); + } + + [Theory] + [InlineData("https://www.twitch.tv/streamer8/clip/SpineyPieTwitchRPGNurturing", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://www.twitch.tv/streamer8/clip/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://www.twitch.tv/streamer8/clip/SpineyPieTwitchRPGNurturing?featured=false&filter=clips&range=all&sort=time", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://www.twitch.tv/streamer8/clip/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf?featured=false&filter=clips&range=all&sort=time", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://clips.twitch.tv/SpineyPieTwitchRPGNurturing", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://clips.twitch.tv/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://clips.twitch.tv/SpineyPieTwitchRPGNurturing/", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://clips.twitch.tv/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf/", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + public void CorrectlyParsesClipLink(string link, string expectedId) + { + var match = IdParse.MatchClipId(link); + + Assert.NotNull(match); + Assert.Equal(expectedId, match.Value); + } + + [Theory] + [InlineData("41546181")] // Oldest VODs - 8 + [InlineData("982306410")] // Old VODs - 9 + [InlineData("6834869128")] // Current VODs - 10 + [InlineData("11987163407")] // Future VODs - 11 + [InlineData("SpineyPieTwitchRPGNurturing")] + [InlineData("FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + public void CorrectlyParsesVodOrClipId(string id) + { + var match = IdParse.MatchVideoOrClipId(id); + + Assert.NotNull(match); + Assert.Equal(id, match.Value); + } + + [Theory] + [InlineData("https://www.twitch.tv/videos/41546181", "41546181")] // Oldest VODs - 8 + [InlineData("https://www.twitch.tv/videos/982306410", "982306410")] // Old VODs - 9 + [InlineData("https://www.twitch.tv/videos/6834869128", "6834869128")] // Current VODs - 10 + [InlineData("https://www.twitch.tv/videos/11987163407", "11987163407")] // Future VODs - 11 + [InlineData("https://www.twitch.tv/kitboga/video/2865132173", "2865132173")] // Alternate highlight URL + [InlineData("https://www.twitch.tv/kitboga/v/2865132173", "2865132173")] // Alternate VOD URL + [InlineData("https://www.twitch.tv/videos/4894164023/", "4894164023")] + [InlineData("https://www.twitch.tv/streamer8/clip/SpineyPieTwitchRPGNurturing", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://www.twitch.tv/streamer8/clip/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://www.twitch.tv/streamer8/clip/SpineyPieTwitchRPGNurturing?featured=false&filter=clips&range=all&sort=time", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://www.twitch.tv/streamer8/clip/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf?featured=false&filter=clips&range=all&sort=time", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://clips.twitch.tv/SpineyPieTwitchRPGNurturing", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://clips.twitch.tv/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + [InlineData("https://clips.twitch.tv/SpineyPieTwitchRPGNurturing/", "SpineyPieTwitchRPGNurturing")] + [InlineData("https://clips.twitch.tv/FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf/", "FuriousFlaccidTireArgieB8-NHbTiYQlzwHVvv_Vf")] + public void CorrectlyParsesVodOrClipLink(string link, string expectedId) + { + var match = IdParse.MatchVideoOrClipId(link); + + Assert.NotNull(match); + Assert.Equal(expectedId, match.Value); + } + + [Fact] + public void DoesNotParseGarbageVodId() + { + const string GARBAGE = "SORRY FOR THE TRAFFIC NaM"; + + var match = IdParse.MatchVideoId(GARBAGE); + + Assert.Null(match); + } + + [Fact] + public void DoesNotParseGarbageClipId() + { + const string GARBAGE = "SORRY FOR THE TRAFFIC NaM"; + + var match = IdParse.MatchClipId(GARBAGE); + + Assert.Null(match); + } + + [Fact] + public void DoesNotParseGarbageVodOrClipId() + { + const string GARBAGE = "SORRY FOR THE TRAFFIC NaM"; + + var match = IdParse.MatchVideoOrClipId(GARBAGE); + + Assert.Null(match); + } + } +} \ No newline at end of file diff --git a/TwitchDownloaderCore/Tools/IdParse.cs b/TwitchDownloaderCore/Tools/IdParse.cs new file mode 100644 index 00000000..485f4efc --- /dev/null +++ b/TwitchDownloaderCore/Tools/IdParse.cs @@ -0,0 +1,71 @@ +using System.Diagnostics.CodeAnalysis; +using System.Linq; +using System.Text.RegularExpressions; + +namespace TwitchDownloaderCore.Tools +{ + public static class IdParse + { + // TODO: Use source generators when .NET7 + private static readonly Regex VideoId = new(@"(?<=^|twitch\.tv\/videos\/)\d+(?=\/?(?:$|\?))", RegexOptions.Compiled); + private static readonly Regex HighlightId = new(@"(?<=^|twitch\.tv\/\w+\/v(?:ideo)?\/)\d+(?=\/?(?:$|\?))", RegexOptions.Compiled); + private static readonly Regex ClipId = new(@"(?<=^|(?:clips\.)?twitch\.tv\/(?:\w+\/clip\/)?)[\w-]+?(?=\/?(?:$|\?))", RegexOptions.Compiled); + + /// A of the video's id or . + [return: MaybeNull] + public static Match MatchVideoId(string text) + { + text = text.Trim(); + + var videoIdMatch = VideoId.Match(text); + if (videoIdMatch.Success) + { + return videoIdMatch; + } + + var highlightIdMatch = HighlightId.Match(text); + if (highlightIdMatch.Success) + { + return highlightIdMatch; + } + + return null; + } + + /// A of the clip's id or . + [return: MaybeNull] + public static Match MatchClipId(string text) + { + text = text.Trim(); + + var clipIdMatch = ClipId.Match(text); + if (clipIdMatch.Success && !clipIdMatch.Value.All(char.IsDigit)) + { + return clipIdMatch; + } + + return null; + } + + /// A of the video/clip's id or . + [return: MaybeNull] + public static Match MatchVideoOrClipId(string text) + { + text = text.Trim(); + + var videoIdMatch = MatchVideoId(text); + if (videoIdMatch is { Success: true }) + { + return videoIdMatch; + } + + var clipIdMatch = MatchClipId(text); + if (clipIdMatch is { Success: true }) + { + return clipIdMatch; + } + + return null; + } + } +} \ No newline at end of file diff --git a/TwitchDownloaderCore/Tools/TwitchRegex.cs b/TwitchDownloaderCore/Tools/TwitchRegex.cs index fa5f718c..6f2e4f8b 100644 --- a/TwitchDownloaderCore/Tools/TwitchRegex.cs +++ b/TwitchDownloaderCore/Tools/TwitchRegex.cs @@ -1,66 +1,12 @@ -using System.Linq; using System.Text.RegularExpressions; namespace TwitchDownloaderCore.Tools { public static class TwitchRegex { - // TODO: Use source generators when .NET7 - private static readonly Regex VideoId = new(@"(?<=^|twitch\.tv\/videos\/)\d+(?=$|\?|\s)", RegexOptions.Compiled); - private static readonly Regex HighlightId = new(@"(?<=^|twitch\.tv\/\w+\/v(?:ideo)?\/)\d+(?=$|\?|\s)", RegexOptions.Compiled); - private static readonly Regex ClipId = new(@"(?<=^|(?:clips\.)?twitch\.tv\/(?:\w+\/clip\/)?)[\w-]+?(?=$|\?|\s)", RegexOptions.Compiled); - public static readonly Regex UrlTimeCode = new(@"(?<=(?:\?|&)t=)\d+h\d+m\d+s(?=$|\?|\s)", RegexOptions.Compiled); public static readonly Regex BitsRegex = new( @"(?<=(?:\s|^)(?:4Head|Anon|Bi(?:bleThumb|tBoss)|bday|C(?:h(?:eer|arity)|orgo)|cheerwal|D(?:ansGame|oodleCheer)|EleGiggle|F(?:rankerZ|ailFish)|Goal|H(?:eyGuys|olidayCheer)|K(?:appa|reygasm)|M(?:rDestructoid|uxy)|NotLikeThis|P(?:arty|ride|JSalt)|RIPCheer|S(?:coops|h(?:owLove|amrock)|eemsGood|wiftRage|treamlabs)|TriHard|uni|VoHiYo))[1-9]\d{0,6}(?=\s|$)", RegexOptions.Compiled); - - /// A of the video's id or . - public static Match MatchVideoId(string text) - { - var videoIdMatch = VideoId.Match(text); - if (videoIdMatch.Success) - { - return videoIdMatch; - } - - var highlightIdMatch = HighlightId.Match(text); - if (highlightIdMatch.Success) - { - return highlightIdMatch; - } - - return null; - } - - /// A of the clip's id or . - public static Match MatchClipId(string text) - { - var clipIdMatch = ClipId.Match(text); - if (clipIdMatch.Success && !clipIdMatch.Value.All(char.IsDigit)) - { - return clipIdMatch; - } - - return null; - } - - /// A of the video/clip's id or . - public static Match MatchVideoOrClipId(string text) - { - var videoIdMatch = MatchVideoId(text); - if (videoIdMatch is { Success: true }) - { - return videoIdMatch; - } - - var clipIdMatch = MatchClipId(text); - if (clipIdMatch is { Success: true }) - { - return clipIdMatch; - } - - return null; - } } } \ No newline at end of file diff --git a/TwitchDownloaderWPF/PageChatDownload.xaml.cs b/TwitchDownloaderWPF/PageChatDownload.xaml.cs index e6913302..9fcf5861 100644 --- a/TwitchDownloaderWPF/PageChatDownload.xaml.cs +++ b/TwitchDownloaderWPF/PageChatDownload.xaml.cs @@ -225,7 +225,7 @@ private void UpdateActionButtons(bool isDownloading) public static string ValidateUrl(string text) { - var vodClipIdMatch = TwitchRegex.MatchVideoOrClipId(text); + var vodClipIdMatch = IdParse.MatchVideoOrClipId(text); return vodClipIdMatch is { Success: true } ? vodClipIdMatch.Value : null; diff --git a/TwitchDownloaderWPF/PageClipDownload.xaml.cs b/TwitchDownloaderWPF/PageClipDownload.xaml.cs index 06b7770d..596e23cb 100644 --- a/TwitchDownloaderWPF/PageClipDownload.xaml.cs +++ b/TwitchDownloaderWPF/PageClipDownload.xaml.cs @@ -113,7 +113,7 @@ private void UpdateActionButtons(bool isDownloading) private static string ValidateUrl(string text) { - var clipIdMatch = TwitchRegex.MatchClipId(text); + var clipIdMatch = IdParse.MatchClipId(text); return clipIdMatch is { Success: true } ? clipIdMatch.Value : null; diff --git a/TwitchDownloaderWPF/PageVodDownload.xaml.cs b/TwitchDownloaderWPF/PageVodDownload.xaml.cs index bb8732e1..1202a5e2 100644 --- a/TwitchDownloaderWPF/PageVodDownload.xaml.cs +++ b/TwitchDownloaderWPF/PageVodDownload.xaml.cs @@ -285,7 +285,7 @@ public void SetImage(string imageUri, bool isGif) private static long ValidateUrl(string text) { - var vodIdMatch = TwitchRegex.MatchVideoId(text); + var vodIdMatch = IdParse.MatchVideoId(text); if (vodIdMatch is {Success: true} && long.TryParse(vodIdMatch.ValueSpan, out var vodId)) { return vodId;