feat: harden sanitize_url host parsing

This commit is contained in:
2025-12-22 17:37:37 +01:00
parent 3369b018e3
commit 0228cd9c9d

View File

@@ -1,6 +1,7 @@
package Urupam::Utils; package Urupam::Utils;
use Mojo::Base -base; use Mojo::Base -base;
use Mojo::URL;
use Mojo::Util qw(url_unescape); use Mojo::Util qw(url_unescape);
sub sanitize_input { sub sanitize_input {
@@ -12,7 +13,9 @@ sub sanitize_input {
sub get_error_status { sub get_error_status {
my ($err) = @_; my ($err) = @_;
return $err =~ /SSL certificate|Cannot reach|DNS resolution|server error/i ? 422 : 400; return $err =~ /SSL certificate|Cannot reach|DNS resolution|server error/i
? 422
: 400;
} }
sub sanitize_error_message { sub sanitize_error_message {
@@ -22,7 +25,10 @@ sub sanitize_error_message {
$sanitized =~ s/[^\w\s\.\-\:\/]//g; $sanitized =~ s/[^\w\s\.\-\:\/]//g;
$sanitized =~ s/\s+/ /g; $sanitized =~ s/\s+/ /g;
$sanitized =~ s/^\s+|\s+$//g; $sanitized =~ s/^\s+|\s+$//g;
return length($sanitized) > 200 ? substr($sanitized, 0, 200) . '...' : $sanitized; return
length($sanitized) > 200
? substr( $sanitized, 0, 200 ) . '...'
: $sanitized;
} }
sub sanitize_url { sub sanitize_url {
@@ -32,17 +38,48 @@ sub sanitize_url {
$url =~ s/^\s+|\s+$//g; $url =~ s/^\s+|\s+$//g;
return undef if length($url) == 0; return undef if length($url) == 0;
if ( $url =~ /%[0-9a-f]{2}/i ) {
$url = url_unescape($url);
}
unless ( $url =~ m{^https?://}i ) { unless ( $url =~ m{^https?://}i ) {
return undef if $url =~ /[\@:]/; return undef if $url =~ /[\@:]/;
$url = 'http://' . $url; $url = 'http://' . $url;
} }
my ($authority) = $url =~ m{^https?://([^/?#]*)}i;
if ( defined $authority ) {
return undef if $authority =~ /\@/;
return undef if $authority =~ /[\s\x00-\x1F\x7F]/;
my $hostport = ( split /\@/, $authority )[-1];
my $host_raw;
if ( $hostport =~ /^\[(.+)\](?::\d+)?$/ ) {
$host_raw = $1;
}
else {
$host_raw = $hostport;
$host_raw =~ s/:(\d+)$//;
}
if ( $hostport =~ /[\[\]]/ ) {
return undef
unless $hostport =~ /^\[[0-9a-fA-F:.]+\](?::\d+)?$/;
}
return undef if $host_raw =~ /%[0-9a-f]{2}/i;
}
my $parsed = Mojo::URL->new($url);
if ( $url =~ /%[0-9a-f]{2}/i ) {
my $path = url_unescape( $parsed->path->to_string );
$parsed->path($path);
my $query = $parsed->query->to_string;
$parsed->query( url_unescape($query) ) if length $query;
my $fragment = $parsed->fragment;
$parsed->fragment( url_unescape($fragment) ) if defined $fragment;
$url = $parsed->to_string;
}
return $url; return $url;
} }
1; 1;