The Perl Toolchain Summit needs more sponsors. If your company depends on Perl, please support this very important event.
# NOTE: this file tests how large files (>2GB) work with perlio (stdio/sfio).
# sysopen(), sysseek(), syswrite(), sysread() are tested in t/lib/syslfs.t.
# If you modify/add tests here, remember to update also ext/Fcntl/t/syslfs.t.

use Config;

BEGIN {
	# Don't bother if there are no quad offsets.
	if (config_value('lseeksize') +< 8) {
		print $^STDOUT, "1..0 # Skip: no 64-bit file offsets\n";
		exit(0);
	}
}

our @s;
our $fail;
my $big;

sub zap {
    close($big);
    unlink("big");
    unlink("big1");
    unlink("big2");
}

sub bye {
    zap();	
    exit(0);
}

my $explained;

sub explain {
    unless ($explained++) {
	print $^STDOUT, <<EOM;
#
# If the lfs (large file support: large meaning larger than two
# gigabytes) tests are skipped or fail, it may mean either that your
# process (or process group) is not allowed to write large files
# (resource limits) or that the file system (the network filesystem?)
# you are running the tests on doesn't let your user/group have large
# files (quota) or the filesystem simply doesn't support large files.
# You may even need to reconfigure your kernel.  (This is all very
# operating system and site-dependent.)
#
# Perl may still be able to support large files, once you have
# such a process, enough quota, and such a (file) system.
# It is just that the test failed now.
#
EOM
    }
    print $^STDOUT, "1..0 # Skip: $(join ' ',@_)\n" if (nelems @_);
}

$^OUTPUT_AUTOFLUSH = 1;

print $^STDOUT, "# checking whether we have sparse files...\n";

# Known have-nots.
if ($^OS_NAME eq 'MSWin32' || $^OS_NAME eq 'NetWare' || $^OS_NAME eq 'VMS') {
    print $^STDOUT, "1..0 # Skip: no sparse files in $^OS_NAME\n";
    bye();
}

# Known haves that have problems running this test
# (for example because they do not support sparse files, like UNICOS)
if ($^OS_NAME eq 'unicos') {
    print $^STDOUT, "1..0 # Skip: no sparse files in $^OS_NAME, unable to test large files\n";
    bye();
}

# Then try to heuristically deduce whether we have sparse files.

# Let's not depend on Fcntl or any other extension.

my @($SEEK_SET, $SEEK_CUR, $SEEK_END) = @(0, 1, 2);

# We'll start off by creating a one megabyte file which has
# only three "true" bytes.  If we have sparseness, we should
# consume less blocks than one megabyte (assuming nobody has
# one megabyte blocks...)

open($big, ">", "big1") or
    do { warn "open big1 failed: $^OS_ERROR\n"; bye };
binmode($big) or
    do { warn "binmode big1 failed: $^OS_ERROR\n"; bye };
seek($big, 1_000_000, $SEEK_SET) or
    do { warn "seek big1 failed: $^OS_ERROR\n"; bye };
print $big, "big" or
    do { warn "print big1 failed: $^OS_ERROR\n"; bye };
close($big) or
    do { warn "close big1 failed: $^OS_ERROR\n"; bye };

my @s1 = @( stat("big1") );

print $^STDOUT, "# s1 = $(join ' ',@s1)\n";

open($big, ">", "big2") or
    do { warn "open big2 failed: $^OS_ERROR\n"; bye };
binmode($big) or
    do { warn "binmode big2 failed: $^OS_ERROR\n"; bye };
seek($big, 2_000_000, $SEEK_SET) or
    do { warn "seek big2 failed; $^OS_ERROR\n"; bye };
print $big, "big" or
    do { warn "print big2 failed; $^OS_ERROR\n"; bye };
close($big) or
    do { warn "close big2 failed; $^OS_ERROR\n"; bye };

my @s2 = @( stat("big2") );

print $^STDOUT, "# s2 = $(join ' ',@s2)\n";

zap();

unless (@s1[7] == 1_000_003 && @s2[7] == 2_000_003 &&
	@s1[11] == @s2[11] && @s1[12] == @s2[12]) {
	print $^STDOUT, "1..0 # Skip: no sparse files?\n";
	bye;
}

print $^STDOUT, "# we seem to have sparse files...\n";

# By now we better be sure that we do have sparse files:
# if we are not, the following will hog 5 gigabytes of disk.  Ooops.
# This may fail by producing some signal; run in a subprocess first for safety

env::var('LC_ALL' ) = "C";

my $r = system '../perl', '-e', <<'EOF';
open(my $big, ">", "big");
seek($big, 5_000_000_000, 0);
print $big, "big";
exit 0;
EOF

open($big, ">", "big") or do { warn "open failed: $^OS_ERROR\n"; bye };
binmode $big;
if ($r or not seek($big, 5_000_000_000, $SEEK_SET)) {
    my $err = $r ?? 'signal '.($r ^&^ 0x7f) !! $^OS_ERROR;
    explain("seeking past 2GB failed: $err");
    bye();
}

# Either the print or (more likely, thanks to buffering) the close will
# fail if there are are filesize limitations (process or fs).
my $print = print $big, "big";
print $^STDOUT, "# print failed: $^OS_ERROR\n" unless $print;
my $close = close $big;
print $^STDOUT, "# close failed: $^OS_ERROR\n" unless $close;
unless ($print && $close) {
    if ($^OS_ERROR =~m/too large/i) {
	explain("writing past 2GB failed: process limits?");
    } elsif ($^OS_ERROR =~ m/quota/i) {
	explain("filesystem quota limits?");
    } else {
	explain("error: $^OS_ERROR");
    }
    bye();
}

@s = @( stat("big") );

print $^STDOUT, "# $(join ' ',@s)\n";

unless (@s[7] == 5_000_000_003) {
    explain("kernel/fs not configured to use large files?");
    bye();
}

sub fail () {
    print $^STDOUT, "not ";
    $fail++;
}

sub offset($offset_will_be, $offset_want) {
    my $offset_is = eval $offset_will_be;
    unless ($offset_is == $offset_want) {
        print $^STDOUT, "# bad offset $offset_is, want $offset_want\n";
	my @($offset_func) = @($offset_will_be =~ m/^(\w+)/);
	if (unpack("L", pack("L", $offset_want)) == $offset_is) {
	    print $^STDOUT, "# 32-bit wraparound suspected in $offset_func() since\n";
	    print $^STDOUT, "# $offset_want cast into 32 bits equals $offset_is.\n";
	} elsif ($offset_want - unpack("L", pack("L", $offset_want)) - 1
	         == $offset_is) {
	    print $^STDOUT, "# 32-bit wraparound suspected in $offset_func() since\n";
	    printf $^STDOUT, "# \%s - unpack('L', pack('L', \%s)) - 1 equals \%s.\n",
	        $offset_want,
	        $offset_want,
	        $offset_is;
        }
        fail;
    }
}

print $^STDOUT, "1..17\n";

$fail = 0;

fail unless @s[7] == 5_000_000_003;	# exercizes pp_stat
print $^STDOUT, "ok 1\n";

fail unless -s "big" == 5_000_000_003;	# exercizes pp_ftsize
print $^STDOUT, "ok 2\n";

fail unless -e "big";
print $^STDOUT, "ok 3\n";

fail unless -f "big";
print $^STDOUT, "ok 4\n";

open($big, "<", "big") or do { warn "open failed: $^OS_ERROR\n"; bye };
binmode $big;

fail unless seek($big, 4_500_000_000, $SEEK_SET);
print $^STDOUT, "ok 5\n";

offset('tell($big)', 4_500_000_000);
print $^STDOUT, "ok 6\n";

fail unless seek($big, 1, $SEEK_CUR);
print $^STDOUT, "ok 7\n";

# If you get 205_032_705 from here it means that
# your tell() is returning 32-bit values since (I32)4_500_000_001
# is exactly 205_032_705.
offset('tell($big)', 4_500_000_001);
print $^STDOUT, "ok 8\n";

fail unless seek($big, -1, $SEEK_CUR);
print $^STDOUT, "ok 9\n";

offset('tell($big)', 4_500_000_000);
print $^STDOUT, "ok 10\n";

fail unless seek($big, -3, $SEEK_END);
print $^STDOUT, "ok 11\n";

offset('tell($big)', 5_000_000_000);
print $^STDOUT, "ok 12\n";

my $big_str;

fail unless read($big, $big_str, 3) == 3;
print $^STDOUT, "ok 13\n";

fail unless $big_str eq "big";
print $^STDOUT, "ok 14\n";

# 705_032_704 = (I32)5_000_000_000
# See that we don't have "big" in the 705_... spot:
# that would mean that we have a wraparound.
fail unless seek($big, 705_032_704, $SEEK_SET);
print $^STDOUT, "ok 15\n";

my $zero;

fail unless read($big, $zero, 3) == 3;
print $^STDOUT, "ok 16\n";

fail unless $zero eq "\0\0\0";
print $^STDOUT, "ok 17\n";

explain() if $fail;

bye(); # does the necessary cleanup

END {
    # unlink may fail if applied directly to a large file
    # be paranoid about leaving 5 gig files lying around
    open($big, ">", "big"); # truncate
    close($big);
    1 while unlink "big"; # standard portable idiom
}

# eof