1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163
|
package Mail::DMARC::Report::URI;
use strict;
use warnings;
our $VERSION = '1.20240314';
use Carp;
use URI;
sub new {
my $class = shift;
return bless {}, $class;
}
sub parse {
my $self = shift;
my $str = shift or croak "URI string is required!";
my @valids = ();
foreach my $raw ( split /,/, $str ) {
# warn "raw: $raw\n";
my ( $u, $size_f ) = split /!/, $raw;
my $bytes = $self->get_size_limit($size_f);
my $uri = URI->new($u) or do {
carp "can't parse URI from $u";
next;
};
my $scheme = $uri->scheme or next;
if ( $scheme eq 'mailto' && lc substr( $u, 0, 7 ) eq 'mailto:' ) {
push @valids, { max_bytes => $bytes, uri => $uri };
next;
}
if ( $scheme =~ /^http(s)?/x && lc substr( $u, 0, 4 ) eq 'http' ) {
push @valids, { max_bytes => $bytes, uri => $uri };
next;
}
# print "invalid URI scheme: $scheme in $u\n";
# 12.1 Discovery - URI schemes found in "rua" tag that are not implemented by
# a Mail Receiver MUST be ignored.
}
return \@valids;
}
sub get_size_limit {
my ( $self, $size ) = @_;
return 0 if !defined $size; # no limit
return $size if $size =~ /^\d+$/; # no units, raw byte count
# 6.3 Formal Definition
# units are considered to be powers of two; a kilobyte is 2^10, a megabyte is 2^20,
my $unit = lc chop $size;
return $size * ( 2**10 ) if 'k' eq $unit;
return $size * ( 2**20 ) if 'm' eq $unit;
return $size * ( 2**30 ) if 'g' eq $unit;
return $size * ( 2**40 ) if 't' eq $unit;
croak "unrecognized unit ($unit) in size ($size)";
}
1;
__END__
=pod
=head1 NAME
Mail::DMARC::Report::URI - a DMARC report URI
=head1 VERSION
version 1.20240314
=head1 SYNOPSIS
use Mail::DMARC::URI;
my $duri = Mail::DMARC::URI->new;
my $uri_ref = $duri->parse('mailto:rua@example.com,mailto:rua@external.otherdomain.com');
foreach my $u ( @$uri_ref ) {
my $method = $u->{uri};
my $max = $u->{max_bytes};
... do some URI stuff ...
};
=head1 DESCRIPTION
defines a generic syntax for identifying a resource. The DMARC
mechanism uses this as the format by which a Domain Owner specifies
the destination for the two report types that are supported.
The place such URIs are specified (see Section 6.2) allows a list of
these to be provided. A report is to be sent to each listed URI.
Mail Receivers MAY impose a limit on the number of URIs that receive
reports, but MUST support at least two. The list of URIs is
separated by commas (ASCII 0x2C).
Each URI can have associated with it a maximum report size that may
be sent to it. This is accomplished by appending an exclamation
point (ASCII 0x21), followed by a maximum size indication, before a
separating comma or terminating semi-colon.
Thus, a DMARC URI is a URI within which any commas or exclamation
points are percent-encoded per [URI], followed by an OPTIONAL
exclamation point and a maximum size specification, and, if there are
additional reporting URIs in the list, a comma and the next URI.
For example, the URI "mailto:reports@example.com!50m" would request a
report be sent via email to "reports@example.com" so long as the
report payload does not exceed 50 megabytes.
A formal definition is provided in Section 6.3.
=head1 ABNF
dmarc-uri = URI [ "!" 1*DIGIT [ "k" / "m" / "g" / "t" ] ]
; "URI" is imported from [URI]; commas (ASCII 0x2c)
; and exclamation points (ASCII 0x21) MUST be encoded
URI is imported from RFC 3986: https://www.ietf.org/rfc/rfc3986.txt
Only mailto, http, and https URIs are currently supported, examples:
https://www.ietf.org/rfc/rfc3986.txt
mailto:John.Doe@example.com
With an optional size limit (see SIZE LIMIT).
=head1 SIZE LIMIT
A size limitation in a dmarc-uri, if provided, is interpreted as a
count of units followed by an OPTIONAL unit size ("k" for kilobytes,
"m" for megabytes, "g" for gigabytes, "t" for terabytes). Without a
unit, the number is presumed to be a basic byte count. Note that the
units are considered to be powers of two; a kilobyte is 2^10, a
megabyte is 2^20, etc.
=head1 AUTHORS
=over 4
=item *
Matt Simerson <msimerson@cpan.org>
=item *
Davide Migliavacca <shari@cpan.org>
=item *
Marc Bradshaw <marc@marcbradshaw.net>
=back
=head1 COPYRIGHT AND LICENSE
This software is copyright (c) 2024 by Matt Simerson.
This is free software; you can redistribute it and/or modify it under
the same terms as the Perl 5 programming language system itself.
=cut
|