# ex:ts=8 sw=4: # $OpenBSD: PackageRepository.pm,v 1.68 2009/10/13 11:49:25 espie Exp $ # # Copyright (c) 2003-2007 Marc Espie # # Permission to use, copy, modify, and distribute this software for any # purpose with or without fee is hereby granted, provided that the above # copyright notice and this permission notice appear in all copies. # # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. use strict; use warnings; # XXX load extra class, grab match from Base class, and tweak inheritance # to get all methods. use OpenBSD::PackageRepository::Installed; $OpenBSD::PackageRepository::Installed::ISA=(qw(OpenBSD::PackageRepository)); package OpenBSD::PackageRepository; our @ISA=(qw(OpenBSD::PackageRepositoryBase)); use OpenBSD::PackageLocation; use OpenBSD::Paths; sub _new { my ($class, $path, $host) = @_; $path .= '/' unless $path =~ m/\/$/; bless { host => $host, path => $path }, $class; } sub baseurl { my $self = shift; return $self->{path}; } sub new { my ($class, $baseurl) = @_; my $o = $class->parse(\$baseurl); return $o; } sub strip_urlscheme { my ($class, $r) = @_; if ($$r =~ m/^(.*?)\:(.*)$/) { my $scheme = lc($1); if ($scheme eq $class->urlscheme) { $$r = $2; return 1; } } return 0; } sub parse_local_url { my ($class, $r, @args) = @_; my $o; if ($$r =~ m/^(.*?)\:(.*)/) { $o = $class->_new($1, @args); $$r = $2; } else { $o = $class->_new($$r, @args); $$r = ''; } return $o; } sub parse_url { &parse_local_url; } sub parse_fullurl { my ($class, $r) = @_; $class->strip_urlscheme($r) or return undef; return $class->parse_url($r); } sub parse { my ($class, $ref) = @_; my $_ = $$ref; return undef if $_ eq ''; if (m/^ftp\:/io) { return OpenBSD::PackageRepository::FTP->parse_fullurl($ref); } elsif (m/^http\:/io) { return OpenBSD::PackageRepository::HTTP->parse_fullurl($ref); } elsif (m/^https\:/io) { return OpenBSD::PackageRepository::HTTPS->parse_fullurl($ref); } elsif (m/^scp\:/io) { require OpenBSD::PackageRepository::SCP; return OpenBSD::PackageRepository::SCP->parse_fullurl($ref); } elsif (m/^src\:/io) { require OpenBSD::PackageRepository::Source; return OpenBSD::PackageRepository::Source->parse_fullurl($ref); } elsif (m/^file\:/io) { return OpenBSD::PackageRepository::Local->parse_fullurl($ref); } elsif (m/^inst\:$/io) { return OpenBSD::PackageRepository::Installed->parse_fullurl($ref); } else { return OpenBSD::PackageRepository::Local->parse_fullurl($ref); } } sub available { my $self = shift; return @{$self->list}; } sub stemlist { my $self = shift; if (!defined $self->{stemlist}) { require OpenBSD::PackageName; $self->{stemlist} = OpenBSD::PackageName::avail2stems($self->available); } return $self->{stemlist}; } sub wipe_info { my ($self, $pkg) = @_; require File::Path; my $dir = $pkg->{dir}; if (defined $dir) { File::Path::rmtree($dir); delete $pkg->{dir}; } } # by default, all objects may exist sub may_exist { return 1; } # by default, we don't track opened files for this key sub opened { undef; } # hint: 0 premature close, 1 real error. undef, normal ! sub close { my ($self, $object, $hint) = @_; close($object->{fh}) if defined $object->{fh}; if (defined $object->{pid2}) { local $SIG{ALRM} = sub { kill HUP => $object->{pid2}; }; alarm(30); waitpid($object->{pid2}, 0); alarm(0); } $self->parse_problems($object->{errors}, $hint, $object) if defined $object->{errors}; undef $object->{errors}; $object->deref; } sub make_room { my $self = shift; # kill old files if too many my $already = $self->opened; if (defined $already) { # gc old objects if (@$already >= $self->maxcount) { @$already = grep { defined $_->{fh} } @$already; } while (@$already >= $self->maxcount) { my $o = shift @$already; $self->close_now($o); } } return $already; } # open method that tracks opened files per-host. sub open { my ($self, $object) = @_; return unless $self->may_exist($object->{name}); # kill old files if too many my $already = $self->make_room; my $fh = $self->open_pipe($object); if (!defined $fh) { return; } $object->{fh} = $fh; if (defined $already) { push @$already, $object; } return $fh; } sub find { my ($repository, $name, $arch) = @_; my $self = $repository->new_location($name, $arch); if ($self->contents) { return $self; } } sub grabPlist { my ($repository, $name, $arch, $code) = @_; my $self = $repository->new_location($name, $arch); return $self->grabPlist($code); } sub parse_problems { my ($self, $filename, $hint, $object) = @_; unlink $filename; } sub cleanup { # nothing to do } sub relative_url { my ($self, $name) = @_; if (defined $name) { return $self->baseurl.$name.".tgz"; } else { return $self->baseurl; } } package OpenBSD::PackageRepository::Local; our @ISA=qw(OpenBSD::PackageRepository); use OpenBSD::Error; sub urlscheme { return 'file'; } sub parse_fullurl { my ($class, $r) = @_; $class->strip_urlscheme($r); return $class->parse_local_url($r); } # wrapper around copy, that sometimes does not copy sub may_copy { my ($self, $object, $destdir) = @_; my $src = $self->relative_url($object->{name}); require File::Spec; my (undef, undef, $base) = File::Spec->splitpath($src); my $dest = File::Spec->catfile($destdir, $base); if (File::Spec->canonpath($dest) eq File::Spec->canonpath($src)) { return; } if (-f $dest) { my ($ddev, $dino) = (stat $dest)[0,1]; my ($sdev, $sino) = (stat $src)[0, 1]; if ($ddev == $sdev and $sino == $dino) { return; } } Copy($src, $destdir); } sub open_pipe { my ($self, $object) = @_; if (defined $ENV{'PKG_CACHE'}) { $self->may_copy($object, $ENV{'PKG_CACHE'}); } my $pid = open(my $fh, "-|"); if (!defined $pid) { die "Cannot fork: $!"; } if ($pid) { return $fh; } else { open STDERR, ">/dev/null"; exec {OpenBSD::Paths->gzip} "gzip", "-d", "-c", "-q", "-f", $self->relative_url($object->{name}) or die "Can't run gzip"; } } sub may_exist { my ($self, $name) = @_; return -r $self->relative_url($name); } sub list { my $self = shift; my $l = []; my $dname = $self->baseurl; opendir(my $dir, $dname) or return $l; while (my $e = readdir $dir) { next unless $e =~ m/^(.*)\.tgz$/o; next unless -f "$dname/$e"; push(@$l, $1); } close($dir); return $l; } package OpenBSD::PackageRepository::Local::Pipe; our @ISA=qw(OpenBSD::PackageRepository::Local); sub urlscheme { return 'pipe'; } sub relative_url { return ''; } sub may_exist { return 1; } sub open_pipe { my ($self, $object) = @_; my $pid = open(my $fh, "-|"); if (!defined $pid) { die "Cannot fork: $!"; } if ($pid) { return $fh; } else { open STDERR, ">/dev/null"; exec {OpenBSD::Paths->gzip} "gzip", "-d", "-c", "-q", "-f", "-" or die "can't run gzip"; } } package OpenBSD::PackageRepository::Distant; our @ISA=qw(OpenBSD::PackageRepository); sub baseurl { my $self = shift; return "//$self->{host}$self->{path}"; } sub parse_url { &parse_distant_url; } sub parse_distant_url { my ($class, $r) = @_; # same heuristics as ftp(1): # find host part, rest is parsed as a local url if ($$r =~ m/^\/\/(.*?)(\/.*)$/) { my $host = $1; $$r = $2; return $class->parse_local_url($r, $host); } else { return undef; } } my $buffsize = 2 * 1024 * 1024; sub pkg_copy { my ($self, $in, $object) = @_; require OpenBSD::Temp; my $name = $object->{name}; my $dir = $object->{cache_dir}; my ($copy, $filename) = OpenBSD::Temp::permanent_file($dir, $name) or die "Can't write copy to cache"; chmod 0644, $filename; $object->{tempname} = $filename; my $handler = sub { my ($sig) = @_; unlink $filename; close($in); $SIG{$sig} = 'DEFAULT'; kill $sig, $$; }; my $nonempty = 0; my $error = 0; { local $SIG{'PIPE'} = $handler; local $SIG{'INT'} = $handler; local $SIG{'HUP'} = $handler; local $SIG{'QUIT'} = $handler; local $SIG{'KILL'} = $handler; local $SIG{'TERM'} = $handler; my ($buffer, $n); # copy stuff over do { $n = sysread($in, $buffer, $buffsize); if (!defined $n) { die "Error reading: $!"; } if ($n > 0) { $nonempty = 1; } if (!$error) { my $r = syswrite $copy, $buffer; if (!defined $r || $r < $n) { $error = 1; } } syswrite STDOUT, $buffer; } while ($n != 0); close($copy); } if ($nonempty && !$error) { rename $filename, "$dir/$name.tgz"; } else { unlink $filename; } close($in); } sub open_pipe { require OpenBSD::Temp; my ($self, $object) = @_; $object->{errors} = OpenBSD::Temp->file; $object->{cache_dir} = $ENV{'PKG_CACHE'}; $object->{parent} = $$; my ($rdfh, $wrfh); pipe($rdfh, $wrfh); my $pid = open(my $fh, "-|"); if (!defined $pid) { die "Cannot fork: $!"; } if ($pid) { $object->{pid} = $pid; } else { open(STDIN, '<&', $rdfh) or die "Bad dup"; close($rdfh); close($wrfh); exec {OpenBSD::Paths->gzip} "gzip", "-d", "-c", "-q", "-" or die "can't run gzip"; } my $pid2 = fork(); if (!defined $pid2) { die "Cannot fork: $!"; } if ($pid2) { $object->{pid2} = $pid2; } else { open STDERR, '>', $object->{errors}; open(STDOUT, '>&', $wrfh) or die "Bad dup"; close($rdfh); close($wrfh); close($fh); if (defined $object->{cache_dir}) { my $pid3 = open(my $in, "-|"); if (!defined $pid3) { die "Cannot fork: $!"; } if ($pid3) { $self->pkg_copy($in, $object); } else { $self->grab_object($object); } } else { $self->grab_object($object); } exit(0); } close($rdfh); close($wrfh); return $fh; } sub finish_and_close { my ($self, $object) = @_; if (defined $object->{cache_dir}) { while (defined $object->_next) { } } $self->SUPER::finish_and_close($object); } package OpenBSD::PackageRepository::HTTPorFTP; our @ISA=qw(OpenBSD::PackageRepository::Distant); our %distant = (); sub grab_object { my ($self, $object) = @_; my ($ftp, @extra) = split(/\s+/, OpenBSD::Paths->ftp); exec {$ftp} $ftp, @extra, "-o", "-", $self->url($object->{name}) or die "can't run ".OpenBSD::Paths->ftp; } sub maxcount { return 1; } sub opened { my $self = $_[0]; my $k = $self->{host}; if (!defined $distant{$k}) { $distant{$k} = []; } return $distant{$k}; } sub should_have { my ($self, $pkgname) = @_; if (defined $self->{lasterror} && $self->{lasterror} == 421) { return (defined $self->{list}) && grep { $_ eq $pkgname } @{$self->{list}}; } else { return 0; } } sub try_until_success { my ($self, $pkgname, $code) = @_; for (my $retry = 5; $retry <= 160; $retry *= 2) { undef $self->{lasterror}; my $o = &$code; if (defined $o) { return $o; } if (defined $self->{lasterror} && $self->{lasterror} == 550) { last; } if ($self->should_have($pkgname)) { print STDERR "Temporary error, sleeping $retry seconds\n"; sleep($retry); } } return undef; } sub find { my ($self, $pkgname, @extra) = @_; return $self->try_until_success($pkgname, sub { return $self->SUPER::find($pkgname, @extra); }); } sub grabPlist { my ($self, $pkgname, @extra) = @_; return $self->try_until_success($pkgname, sub { return $self->SUPER::grabPlist($pkgname, @extra); }); } sub parse_problems { my ($self, $filename, $hint, $object) = @_; CORE::open(my $fh, '<', $filename) or return; my $baseurl = $self->url; my $url = $baseurl; if (defined $object) { $url = $object->url; } my $_; my $notyet = 1; while(<$fh>) { next if m/^(?:200|220|221|226|229|230|227|250|331|500|150)[\s\-]/o; next if m/^EPSV command not understood/o; next if m/^Trying [\da-f\.\:]+\.\.\./o; next if m/^Requesting \Q$baseurl\E/; next if m/^Remote system type is\s+/o; next if m/^Connected to\s+/o; next if m/^remote\:\s+/o; next if m/^Using binary mode to transfer files/o; next if m/^Retrieving\s+/o; next if m/^Success?fully retrieved file/o; next if m/^\d+\s+bytes\s+received\s+in/o; next if m/^ftp: connect to address.*: No route to host/o; if (defined $hint && $hint == 0) { next if m/^ftp: -: short write/o; next if m/^ftp: Writing -: Broken pipe/o; next if m/^421\s+/o; } if ($notyet) { print STDERR "Error from $url:\n" if $notyet; $notyet = 0; } if (m/^421\s+/o || m/^ftp: connect: Connection timed out/o || m/^ftp: Can't connect or login to host/o) { $self->{lasterror} = 421; } if (m/^550\s+/o) { $self->{lasterror} = 550; } print STDERR $_; } CORE::close($fh); $self->SUPER::parse_problems($filename, $hint, $object); } sub list { my ($self) = @_; if (!defined $self->{list}) { $self->make_room; my $error = OpenBSD::Temp->file; $self->{list} = $self->obtain_list($error); $self->parse_problems($error); if ($self->{no_such_dir}) { print STDERR $self->{path}, ": Directory does not exist on ", $self->{host}, "\n"; $self->{lasterror} = 404; } } return $self->{list}; } sub get_http_list { my ($self, $error) = @_; my $fullname = $self->url; my $l = []; my $_; open(my $fh, '-|', OpenBSD::Paths->ftp." -o - $fullname 2>$error") or return; while(<$fh>) { chomp; for my $pkg (m/\/gio) { $pkg = $1 if $pkg =~ m|^.*/(.*)$|; # decode uri-encoding; from URI::Escape $pkg =~ s/%([0-9A-Fa-f]{2})/chr(hex($1))/eg; push(@$l, $pkg); } } close($fh); return $l; } package OpenBSD::PackageRepository::HTTP; our @ISA=qw(OpenBSD::PackageRepository::HTTPorFTP); sub urlscheme { return 'http'; } sub obtain_list { my ($self, $error) = @_; return $self->get_http_list($error); } package OpenBSD::PackageRepository::HTTPS; our @ISA=qw(OpenBSD::PackageRepository::HTTP); sub urlscheme { return 'https'; } package OpenBSD::PackageRepository::FTP; our @ISA=qw(OpenBSD::PackageRepository::HTTPorFTP); sub urlscheme { return 'ftp'; } sub _list { my ($self, $cmd) = @_; my $l =[]; my $_; open(my $fh, '-|', "$cmd") or return; while(<$fh>) { chomp; next if m/^\d\d\d\s+\S/; if (m/No such file or directory|Failed to change directory/i) { $self->{no_such_dir} = 1; } next unless m/^(?:\.\/)?(\S+)\.tgz\s*$/; push(@$l, $1); } close($fh); return $l; } sub get_ftp_list { my ($self, $error) = @_; my $fullname = $self->url; return $self->_list("echo 'nlist'| ".OpenBSD::Paths->ftp ." $fullname 2>$error"); } sub obtain_list { my ($self, $error) = @_; if (defined $ENV{'ftp_proxy'}) { return $self->get_http_list($error); } else { return $self->get_ftp_list($error); } } 1;