/usr/lib/perl5/PDL/DiskCache.pm is in pdl 1:2.4.7+dfsg-2ubuntu5.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 | =head1 NAME
PDL::DiskCache -- Non-memory-resident array object
=head1 SYNOPSIS
NON-OO:
use PDL::DiskCache;
tie @a,'PDL::DiskCache', \@files, \%options;
imag $a[3];
OO:
use PDL::DiskCache;
$a = diskcache(\@files,\%options);
imag $a->[3];
or
use PDL::DiskCache;
$a = new PDL::DiskCache(\@files,\%options);
imag $a->[4];
=over 3
=item \@files
an array ref containing a list of file names
=item \%options
a hash ref containing options for the PDL::DiskCache object (see "TIEARRAY"
below for details)
=back
=head1 DESCRIPTION
A PDL::DiskCache object is a perl L<"tied array"|perltie> that is useful
for operations where you have to look at a large collection of PDLs one
or a few at a time (such as tracking features through an image sequence).
You can write prototype code that uses a perl list of a few PDLs, then
scale up to millions of PDLs simply by handing the prototype code
a DiskCache tied array instead of a native perl array. The individual
PDLs are stored on disk and a few of them are swapped into memory on a
FIFO basis. You can set whether the data are read-only or writeable.
By default, PDL::DiskCache uses FITS files to represent the PDLs, but
you can use any sort of file at all -- the read/write routines are the
only place where it examines the underlying data, and you can specify
the routines to use at construction time (or, of course, subclass
PDL::DiskCache).
Items are swapped out on a FIFO basis, so if you have 10 slots
and an expression with 10 items in it then you're OK (but you probably
want more slots than that); but if you use more items in an expression than
there are slots, thrashing will occur!
The hash ref interface is kept for historical reasons; you can access
the sync() and purge() method calls directly from the returned array ref.
=head1 Shortcomings & caveats
There's no file locking, so you could really hose yourself by having two of
these things going at once on the same files.
Since this is a tied array, things like Dumper traverse it transparently.
That is sort-of good but also sort-of dangerous. You wouldn't want to
PDL::Dumper::sdump() a large PDL::DiskCache, for example -- that would defeat
the purpose of using a PDL::DiskCache in the first place.
=head1 Author, license, no warranty
Copyright 2001, Craig DeForest
This code may be distributed under the same terms as Perl itself
(license available at L<http://www.perl.org>). Copying, reverse engineering,
distribution, and modification are explicitly allowed so long as this notice
is preserved intact and modified versions are clearly marked as such.
If you modify the code and it's useful, please send a copy of the modified
version to cdeforest@solar.stanford.edu.
This package comes with NO WARRANTY.
=head1 FUNCTIONS
=cut
######################################################################
# Package initialization
#
# The version number is assigned directly to the fully qualified
# package variable.
$PDL::DiskCache::VERSION = 1.1;
# Enforce strict variable/reference checking for the code below.
use strict;
# Carp supplies carp() and croak(), used for caller-relative diagnostics.
use Carp;
=head2 diskcache
Object constructor.
=for usage
$a = diskcache(\@f,\%options);
Options
=over 3
=item
See the TIEARRAY options, below.
=back
=cut
# diskcache -- function-style constructor.
#
#   first argument  - array ref of file names
#   second argument - hash ref of options
#
# Both arguments are forwarded unchanged to PDL::DiskCache::new, with the
# class name fixed to 'PDL::DiskCache'.  The caller's context is passed
# through to new(), so the result is whatever new() returns in that
# context.
sub diskcache {
    my $files   = shift;
    my $options = shift;
    return PDL::DiskCache::new('PDL::DiskCache', $files, $options);
}
# new -- build a tied array and hand back a reference to it.
#
#   $class - package providing the tie interface (TIEARRAY and friends)
#   $f     - array ref of file names, passed straight to tie
#   $opt   - options hash ref, passed straight to tie; its "bless" entry
#            is also examined here
#
# Scalar context: returns the array ref, blessed into $class when
# $opt->{bless} is true.
# List context: returns that array ref followed by the object returned by
# tie, (re-)blessed into $class.
sub PDL::DiskCache::new {
    my ($class, $f, $opt) = @_;

    my $array_ref = [];
    my $tie_obj   = tie @$array_ref, $class, $f, $opt;

    bless($array_ref, $class) if $opt->{bless};

    return wantarray
        ? ($array_ref, bless($tie_obj, $class))
        : $array_ref;
}
# Typeglob assignment: make PDL::DiskCache::diskcache an alias for the
# diskcache symbol defined above, so the constructor can also be reached
# by its fully qualified name.
*PDL::DiskCache::diskcache = *diskcache;
=head2 TIEARRAY
=for ref
Tied-array constructor; invoked by perl during object construction.
=for usage
TIEARRAY(class,\@f,\%options)
Options
=over 3
=item ro (default 0)
If set, treat the files as read-only (modifications
to the tied array will only persist until the changed elements are
swapped out)
=item rw (default 1)
If set, allow reading and writing to the files.
Because there's currently no way to determine reliably whether a PDL
has been modified, rw files are always written to disk when they're
swapped out -- this causes a slight performance hit.
=item mem (default 20)
Number of files to be cached in memory at once.
=item read (default \&rfits)
A function ref pointing to code that will read
list objects from disk. The function must have the same syntax as
rfits: $object = rfits(filename).
=item write (default \&wfits)
A function ref pointing to code that will
write list objects to disk. The function must have the same syntax as
wfits: func(object,filename).
=item bless (default 0)
If set to a nonzero value, then the array ref gets
blessed into the DiskCache class for easier access to the "purge"
and "sync" methods. This means that you can say C<< $a->sync >> instead
of the more complex C<< (tied @$a)->sync >>, but C<ref $a> will return
"PDL::DiskCache" instead of "ARRAY", which could break some code.
=item verbose (default 0)
Get chatty.
=back
=cut
# TIEARRAY -- construct the object behind the tied array.
#
#   $class - class to bless the new object into
#   $f     - array ref of file names (anything else is a fatal error)
#   $opt   - hash ref of options; every key is copied into the object's
#            "opt" hash for later reference
#
# Returns the blessed hash holding the cache bookkeeping.  Note that the
# read/write flag is derived solely from the "ro" option; the "rw" option
# is not consulted here.
sub PDL::DiskCache::TIEARRAY {
    my ($class, $f, $opt) = @_;

    if (ref $f ne 'ARRAY') {
        croak "PDL::DiskCache needs array ref as 2nd arg (did you pass an array instead?)\n";
    }

    my %state = (
        files      => $f,                               # file list
        n          => scalar(@{$f}),                    # number of elements
        write      => $opt->{write} || \&main::wfits,   # write routine
        read       => $opt->{read}  || \&main::rfits,   # read routine
        mem        => $opt->{mem}   || 20,              # number of memory slots
        rw         => (!($opt->{ro})),                  # writeable unless "ro" is set
        fdex       => [],   # file index held in each slot, by slot
        slot       => [],   # slot holding each file, by file index
        cache      => [],   # the cached objects themselves, by slot
        opt        => {},   # copy of the caller's options
        cache_next => 0,    # next cache slot to be used
    );

    # Shallow-copy the options so later lookups do not depend on the
    # caller's hash.
    $state{opt}->{$_} = $opt->{$_} for keys %{$opt};

    return bless(\%state, $class);
}
=head2 purge
Remove an item from the oldest slot in the cache, writing to disk as necessary.
You can also pass the number of slots to purge (default 1; passing -1 purges
everything).
For most uses, a nice MODIFIED flag in the data structure could save
some hassle here. But PDLs can get modified out from under us
with slicing and .= -- so for now we always assume everything is tainted
and must be written to disk.
=cut
# purge -- evict cached items, starting at the slot named by cache_next.
#
#   $me - the tied object, or an array ref blessed into PDL::DiskCache
#         (in which case the object tied to that array is used)
#   $n  - number of slots to visit (default 1); a negative value means
#         every slot ($me->{mem} of them)
#
# For a read/write cache each evicted item is handed to the write routine
# first; a write failure is reported with a printed warning and does not
# abort the purge.  Slots that hold nothing are skipped, so they are
# neither written nor allowed to disturb another item's bookkeeping.
sub PDL::DiskCache::purge {
    my ($me, $n) = @_;

    # Apply the documented default of one slot.  (Appending ",1" to the
    # list assignment does not do this: assignment binds tighter than the
    # comma operator, so the 1 would simply be discarded.)
    $n = 1 unless defined $n;

    $me = (tied @{$me}) if("$me" =~ m/^PDL\:\:DiskCache\=ARRAY/);
    $n = $me->{mem} if($n<0);

    my $verbose = $me->{opt}->{verbose};
    print "purging $n items..." if($verbose);

    my($dex) = $me->{cache_next};

    local($_);
    for(1..$n) {
        my $item = $me->{fdex}->[$dex];    # file index held in this slot

        # An empty slot has nothing to write or forget.  Treating its
        # undefined index as 0 would clobber the entries for item 0.
        if(defined $item) {
            my $file = $me->{files}->[$item];

            if($me->{rw}) {
                print "writing $file: " if($verbose);

                eval { $me->{write}->($me->{cache}->[$dex], $file); };
                print "WARNING: PDL::DiskCache::purge: problems with write of ".$file.", item $item from slot $dex: `$@' (".$me->{opt}->{varname}.") \n" if($@);
                $@ = 0;    # keep the error from leaking to later code

                print "ok.\n" if($verbose);
            }

            print "Purging item $dex (file $item)...\n" if($verbose);
            undef $me->{slot}->[$item];    # Purge from slot location list
            undef $me->{fdex}->[$dex];     # Purge from slot fdex list
            undef $me->{cache}->[$dex];    # Purge from memory
        }

        # Advance circularly through the slots.
        $dex++;
        $dex %= $me->{mem};
    }
    print "...done with purge.\n" if($verbose);
}
# FETCH -- tied-array read hook: return element $i, loading it if needed.
#
#   $me - the tied object
#   $i  - element (file) index
#
# An index outside 0 .. n-1 produces a carp() warning and undef.  A cached
# element is returned straight from memory.  Otherwise the slot named by
# cache_next is used: if it is occupied one item is purged first, then
# the read routine is called on the element's file name inside an eval
# (so a failing read yields undef rather than an exception), the
# bookkeeping is updated and the freshly read value is returned.
sub PDL::DiskCache::FETCH {
    my ($me, $i) = @_;
    my $verbose = $me->{opt}->{verbose};

    if ($i < 0 || $i >= $me->{n}) {
        carp("PDL::DiskCache: Element $i is outside range of 0-",$me->{n}-1,"\n");
        return undef;
    }

    # Cache hit: nothing to read.
    my $cached_slot = $me->{slot}->[$i];
    if (defined $cached_slot) {
        print "Item $i is in the cache...\n" if $verbose;
        return ($me->{cache}->[$cached_slot]);
    }

    # Cache miss: the item has to come from disk.
    print "Item $i ($me->{files}->[$i]) not present. Retrieving..." if $verbose;

    if (defined($me->{fdex}->[ $me->{cache_next} ])) {
        print "cache full..." if $verbose;
        $me->purge(1);
    }

    my $target = $me->{cache_next};
    $me->{cache}->[$target] = eval { $me->{read}->($me->{files}->[$i]) };
    undef $@;    # keep a read error from leaking to later code

    print "result is ",(defined $me->{cache}->[$target] ? "" : "un")."defined.\n"
        if $verbose;

    # Record where the item lives and advance the circular slot pointer.
    $me->{slot}->[$i] = $me->{cache_next};
    $me->{fdex}->[ $me->{cache_next} ] = $i;
    $me->{cache_next} = ($me->{cache_next} + 1) % $me->{mem};

    return $me->{cache}->[$target];
}
# STORE -- tied-array write hook: put $val into element $i.
#
#   $me  - the tied object
#   $i   - element (file) index
#   $val - value to cache for that element
#
# If the element is already cached its slot is overwritten in place;
# otherwise the slot named by cache_next is claimed for it (purging one
# item first when that slot is occupied).  sync() is called in both cases.
# Returns the stored value.
#
# NOTE(review): sync() runs before the new value is placed in the cache,
# so the flush it performs does not include $val -- confirm whether the
# intent was to sync after storing.
sub PDL::DiskCache::STORE {
    my($me, $i, $val) = @_;

    # Test with defined(), not truth: slot number 0 is a perfectly valid
    # location, and treating it as "not cached" would give the item a
    # second slot while a stale copy stays registered in slot 0.
    if( defined $me->{slot}->[$i] ) {
        print "Storing index $i, in cache\n" if($me->{opt}->{verbose});
        $me->sync;
        return $me->{cache}->[$me->{slot}->[$i]] = $val;
    }

    print "Storing index $i, not in cache\n" if($me->{opt}->{verbose});
    if(defined ($me->{fdex}->[$me->{cache_next}])) {
        print "cache full..." if($me->{opt}->{verbose});
        $me->purge(1);
    }

    # Claim the next slot and advance the circular slot pointer.
    my($slot) = $me->{cache_next};
    $me->{slot}->[$i] = $slot;
    $me->{fdex}->[$slot] = $i;
    $me->{cache_next}++;
    $me->{cache_next} %= $me->{mem};

    $me->sync;
    return $me->{cache}->[$slot] = $val;
}
# FETCHSIZE -- tied-array hook reporting the number of elements, as
# recorded in the object's "n" field.
sub PDL::DiskCache::FETCHSIZE {
    my ($me) = @_;
    return $me->{n};
}
# STORESIZE -- tied-array hook for changing the array length.
#
#   $me      - the tied object
#   $newsize - requested number of elements
#
# Growing the array is not supported and croaks.  When shrinking, every
# element at index $newsize or above that is currently cached is written
# out (read/write caches only; write errors are swallowed) and its cache
# slot is released.  The slot and file lists are then truncated and the
# element count updated.  Returns the new size.
sub PDL::DiskCache::STORESIZE {
    my($me,$newsize) = @_;

    if($newsize > $me->{n}) {
        croak("PDL::DiskCache: Can't augment array size (yet)!\n");
    }

    # Only elements that are being dropped are visited.  Element
    # $newsize-1 survives the truncation and must keep its cache slot,
    # so the walk starts at $newsize.
    for my $i ($newsize .. $me->{n}-1) {
        my $slot = $me->{slot}->[$i];
        next unless defined $slot;

        if($me->{rw}) {
            # $i is already the file index; fdex is indexed by slot.
            print "Writing $me->{files}->[$i]\n"
                if($me->{opt}->{verbose});
            eval { $me->{write}->($me->{cache}->[$slot],
                                  $me->{files}->[$i]);
                 };
            $@ = 0; # Keep from hanging anything else
        }

        undef $me->{fdex}->[$slot];     # mark the slot as free
        undef $me->{cache}->[$slot];    # and let go of the cached object
    }

    $#{$me->{slot}}  = $newsize-1;
    $#{$me->{files}} = $newsize-1;
    $me->{n} = $newsize;
}
=head2 sync
In a rw cache, flush all items out to disk but retain them in the cache.
This is useful primarily for cache protection and could be slow. Because
we have no way of knowing what's modified and what's not in the cache,
all elements are always flushed from an rw cache. For ro caches,
this is a not-too-slow (but safe) no-op.
=cut
# sync -- write every cached item back to its file, keeping it cached.
#
#   $me - the tied object, or an array ref blessed into PDL::DiskCache
#         (in which case the object tied to that array is used)
#
# Nothing is written unless the object's "rw" flag is true.  Each occupied
# slot is passed to the write routine inside an eval, and any error it
# raises is discarded.
sub PDL::DiskCache::sync {
    my ($me) = shift;

    # Called on the blessed array ref?  Switch to the underlying object.
    if ("$me" =~ m/^PDL\:\:DiskCache\=ARRAY/) {
        $me = (tied @{$me});
    }

    my $verbose = $me->{opt}->{verbose};
    print "PDL::DiskCache::sync\n" if $verbose;

    if ($me->{rw}) {
        for my $slot (0 .. $me->{mem} - 1) {
            my $item = $me->{fdex}->[$slot];
            next unless defined $item;    # empty slot

            print "  writing $me->{files}->[$item]...\n" if $verbose;
            eval {
                $me->{write}->($me->{cache}->[$slot], $me->{files}->[$item]);
            };
            $@ = 0;    # keep from hanging anything else
        }
    }
}
=head2 DESTROY
This is the perl hook for object destruction. It just makes a call to
"sync", to flush the cache out to disk. Destructor calls from perl don't
happen at a guaranteed time, so be sure to call "sync" if you need to
ensure that the files get flushed out, e.g. to use 'em somewhere else.
=cut
# DESTROY -- destructor hook: flush the cache by calling the object's
# sync method.
sub PDL::DiskCache::DESTROY {
    my ($me) = @_;
    $me->sync;
}
# A file loaded with use/require must finish by evaluating to a true
# value; this is that value.
1;
|