perkeep/server/tester/bs-test.pl

431 lines
13 KiB
Perl
Executable File

#!/usr/bin/perl
#
# Test script to run against a Camli blobserver to test its compliance
# with the spec.
use strict;
use Getopt::Long;
use LWP;
use Test::More;
my $user;
my $password;
my $implopt;
GetOptions("user" => \$user,
"password" => \$password,
"impl=s" => \$implopt,
) or usage();
my $impl;
my %args = (user => $user, password => $password);
if ($implopt eq "go") {
$impl = Impl::Go->new(%args);
} elsif ($implopt eq "appengine") {
$impl = Impl::AppEngine->new(%args);
} else {
die "The --impl flag must be 'go' or 'appengine'.\n";
}
ok($impl->start, "Server started");
$impl->verify_no_blobs; # also tests some of enumerate
$impl->test_stat_and_upload;
$impl->test_upload_corrupt_blob; # blobref digest doesn't match
# TODO: test multiple uploads in a batch
# TODO: test uploads in serial (using each response's next uploadUrl)
# TODO: test enumerate boundaries
# TODO: interrupt a POST upload in the middle; verify no straggler on
# disk in subsequent GET
# ....
# test auth works on bogus password? (auth still undefined)
# TODO: test stat with both GET and POST (currently just POST)
done_testing();
sub usage {
die "Usage: bs-test.pl [--user= --password=] --impl={go,appengine}\n";
}
package Impl;
use HTTP::Request::Common;
use LWP::UserAgent;
use JSON::Any;
use Test::More;
use Digest::SHA1 qw(sha1_hex);
use URI::URL ();
use Data::Dumper;
sub new {
my ($class, %args) = @_;
return bless \%args, $class;
}
sub post {
my ($self, $path, $form) = @_;
$path ||= "";
$form ||= {};
return POST($self->path($path),
"Authorization" => "Basic dGVzdDp0ZXN0", # test:test
Content => $form);
}
sub upload_request {
my ($self, $upload_url, $blobref_to_blob_map) = @_;
my @content;
my $n = 0;
foreach my $key (sort keys %$blobref_to_blob_map) {
$n++;
# TODO: the App Engine client refused to work unless the Content-Type
# is set. This should be clarified in the docs (MUST?) and update the
# test suite and Go server accordingly (to fail if not present).
push @content, $key => [
undef, "filename$n",
"Content-Type" => "application/octet-stream",
Content => $blobref_to_blob_map->{$key},
];
}
return POST($upload_url,
"Content_Type" => 'form-data',
"Authorization" => "Basic dGVzdDp0ZXN0", # test:test
Content => \@content);
}
sub get {
my ($self, $path, $form) = @_;
$path ||= "";
$form ||= {};
return GET($self->path($path),
"Authorization" => "Basic dGVzdDp0ZXN0", # test:test
%$form);
}
sub head {
my ($self, $path, $form) = @_;
$path ||= "";
$form ||= {};
return HEAD($self->path($path),
"Authorization" => "Basic dGVzdDp0ZXN0", # test:test
%$form);
}
sub ua {
my $self = shift;
return ($self->{_ua} ||= LWP::UserAgent->new(agent => "camli/blobserver-tester"));
}
sub root {
my $self= shift;
return $self->{root} or die "No 'root' for $self";
}
sub path {
my $self = shift;
my $path = shift || "";
return $self->root . $path;
}
sub get_json {
my ($self, $req, $msg, $opts) = @_;
$opts ||= {};
my $res = $self->ua->request($req);
ok(defined($res), "got response for HTTP request '$msg'");
if ($res->code =~ m!^30[123]$! && $opts->{follow_redirect}) {
my $location = $res->header("Location");
if ($res->code == "303") {
$req->method("GET");
}
my $new_uri = URI::URL->new($location, $req->uri)->abs;
diag("Old URI was " . $req->uri);
diag("New is " . $new_uri);
diag("Redirecting HTTP request '$msg' to $location ($new_uri)");
$req->uri($new_uri);
$res = $self->ua->request($req);
ok(defined($res), "got redirected response for HTTP request '$msg'");
}
ok($res->is_success, "successful response for HTTP request '$msg'")
or diag("Status was: " . $res->status_line);
my $json = JSON::Any->jsonToObj($res->content);
is("HASH", ref($json), "JSON parsed for HTTP request '$msg'")
or BAIL_OUT("expected JSON response");
return $json;
}
sub get_upload_json {
my ($self, $req) = @_;
return $self->get_json($req, "upload", { follow_redirect => 1 })
}
sub verify_no_blobs {
my $self = shift;
my $req = $self->get("/camli/enumerate-blobs", {
"after" => "",
"limit" => 10,
});
my $json = $self->get_json($req, "enumerate empty blobs");
ok(defined($json->{'blobs'}), "enumerate has a 'blobs' key");
is("ARRAY", ref($json->{'blobs'}), "enumerate's blobs key is an array");
is(0, scalar @{$json->{'blobs'}}, "no blobs on server");
}
sub test_stat_and_upload {
my $self = shift;
my ($req, $res);
my $blob = "This is a line.\r\nWith mixed newlines\rFoo\nAnd binary\0data.\0\n\r.";
my $blobref = "sha1-" . sha1_hex($blob);
# Bogus method.
$req = $self->head("/camli/stat", {
"camliversion" => 1,
"blob1" => $blobref,
});
$res = $self->ua->request($req);
ok(!$res->is_success, "returns failure for HEAD on /camli/stat");
# Correct method, but missing camliVersion.
$req = $self->post("/camli/stat", {
"blob1" => $blobref,
});
$res = $self->ua->request($req);
ok(!$res->is_success, "returns failure for missing camliVersion param on stat");
# Valid pre-upload
$req = $self->post("/camli/stat", {
"camliversion" => 1,
"blob1" => $blobref,
});
my $jres = $self->get_json($req, "valid stat");
diag("stat response: " . Dumper($jres));
ok($jres, "valid stat JSON response");
for my $f (qw(stat maxUploadSize uploadUrl uploadUrlExpirationSeconds)) {
ok(defined($jres->{$f}), "required field '$f' present");
}
is(scalar(keys %$jres), 4, "Exactly 4 JSON keys returned");
my $statList = $jres->{stat};
is(ref($statList), "ARRAY", "stat is an array");
is(scalar(@$statList), 0, "server doesn't have this blob yet.");
like($jres->{uploadUrlExpirationSeconds}, qr/^\d+$/, "uploadUrlExpirationSeconds is numeric");
my $upload_url = URI::URL->new($jres->{uploadUrl}, $self->root)->abs;
ok($upload_url, "valid uploadUrl");
# TODO: test & clarify in spec: are relative URLs allowed in uploadUrl?
# App Engine seems to do it already, and makes it easier, so probably
# best to clarify that they're relative.
# Do the actual upload
my $upreq = $self->upload_request($upload_url, {
$blobref => $blob,
});
diag("upload request: " . $upreq->as_string);
my $upres = $self->get_upload_json($upreq);
ok($upres, "Upload was success");
print STDERR "# upload response: ", Dumper($upres);
for my $f (qw(uploadUrlExpirationSeconds uploadUrl maxUploadSize received)) {
ok(defined($upres->{$f}), "required upload response field '$f' present");
}
is(scalar(keys %$upres), 4, "Exactly 4 JSON keys returned");
like($upres->{uploadUrlExpirationSeconds}, qr/^\d+$/, "uploadUrlExpirationSeconds is numeric");
is(ref($upres->{received}), "ARRAY", "'received' is an array")
or BAIL_OUT();
my $got = $upres->{received};
is(scalar(@$got), 1, "got one file");
is($got->[0]{blobRef}, $blobref, "received[0] 'blobRef' matches");
is($got->[0]{size}, length($blob), "received[0] 'size' matches");
# TODO: do a get request, verify that we get it back.
}
sub test_upload_corrupt_blob {
my $self = shift;
my ($req, $res);
my $blob = "A blob, pre-corruption.";
my $blobref = "sha1-" . sha1_hex($blob);
$blob .= "OIEWUROIEWURLKJDSLKj CORRUPT";
$req = $self->post("/camli/stat", {
"camliversion" => 1,
"blob1" => $blobref,
});
my $jres = $self->get_json($req, "valid stat");
my $upload_url = URI::URL->new($jres->{uploadUrl}, $self->root)->abs;
# TODO: test & clarify in spec: are relative URLs allowed in uploadUrl?
# App Engine seems to do it already, and makes it easier, so probably
# best to clarify that they're relative.
# Do the actual upload
my $upreq = $self->upload_request($upload_url, {
$blobref => $blob,
});
diag("corrupt upload request: " . $upreq->as_string);
my $upres = $self->get_upload_json($upreq);
my $got = $upres->{received};
is(ref($got), "ARRAY", "corrupt upload returned a 'received' array");
is(scalar(@$got), 0, "didn't get any files (it was corrupt)");
}
package Impl::Go;
use base 'Impl';
use FindBin;
use LWP::UserAgent;
use HTTP::Request;
use Fcntl;
use File::Temp ();
sub start {
my $self = shift;
$self->{_tmpdir_obj} = File::Temp->newdir();
my $tmpdir = $self->{_tmpdir_obj}->dirname;
die "Failed to create temporary directory." unless -d $tmpdir;
system("$FindBin::Bin/../../build.pl", "server/go/blobserver")
and die "Failed to build Go blobserver.";
my $bindir = "$FindBin::Bin/../go/blobserver/";
my $binary = "$bindir/blobserver";
chdir($bindir) or die "filed to chdir to $bindir: $!";
system("make") and die "failed to run make in $bindir";
my ($port_rd, $port_wr, $exit_rd, $exit_wr);
my $flags;
pipe $port_rd, $port_wr;
pipe $exit_rd, $exit_wr;
$flags = fcntl($port_wr, F_GETFD, 0);
fcntl($port_wr, F_SETFD, $flags & ~FD_CLOEXEC);
$flags = fcntl($exit_rd, F_GETFD, 0);
fcntl($exit_rd, F_SETFD, $flags & ~FD_CLOEXEC);
$ENV{TESTING_PORT_WRITE_FD} = fileno($port_wr);
$ENV{TESTING_CONTROL_READ_FD} = fileno($exit_rd);
$ENV{CAMLI_PASSWORD} = "test";
die "Binary $binary doesn't exist\n" unless -x $binary;
my $pid = fork;
die "Failed to fork" unless defined($pid);
if ($pid == 0) {
# child
my @args = ($binary, "-listen=:0", "-root=$tmpdir");
print STDERR "# Running: [@args]\n";
exec @args;
die "failed to exec: $!\n";
}
close($exit_rd); # child owns this side
close($port_wr); # child owns this side
print "Waiting for Go server to start...\n";
my $line = <$port_rd>;
close($port_rd);
# Parse the port line out
chomp $line;
# print "Got port line: $line\n";
die "Failed to start, no port info." unless $line =~ /:(\d+)$/;
$self->{port} = $1;
$self->{root} = "http://localhost:$self->{port}";
print STDERR "# Running on $self->{root} ...\n";
# Keep a reference to this to write "EXIT\n" to in order
# to cleanly shutdown the child perkeepd process.
# If we close it, the child also dies, though.
$self->{_exit_wr} = $exit_wr;
return 1;
}
sub DESTROY {
my $self = shift;
syswrite($self->{_exit_wr}, "EXIT\n");
}
package Impl::AppEngine;
use base 'Impl';
use IO::Socket::INET;
use Time::HiRes ();
sub start {
my $self = shift;
my $dev_appserver = `which dev_appserver.py`;
chomp $dev_appserver;
unless ($dev_appserver && -x $dev_appserver) {
$dev_appserver = "$ENV{HOME}/sdk/google_appengine/dev_appserver.py";
unless (-x $dev_appserver) {
die "No dev_appserver.py in \$PATH nor in \$HOME/sdk/google_appengine/dev_appserver.py\n";
}
}
$self->{_tempdir_blobstore_obj} = File::Temp->newdir();
$self->{_tempdir_datastore_obj} = File::Temp->newdir();
my $datapath = $self->{_tempdir_blobstore_obj}->dirname . "/datastore-file";
my $blobdir = $self->{_tempdir_datastore_obj}->dirname;
my $port;
while (1) {
$port = int(rand(30000) + 1024);
my $sock = IO::Socket::INET->new(Listen => 5,
LocalAddr => '127.0.0.1',
LocalPort => $port,
ReuseAddr => 1,
Proto => 'tcp');
if ($sock) {
last;
}
}
$self->{port} = $port;
$self->{root} = "http://localhost:$self->{port}";
my $pid = fork;
die "Failed to fork" unless defined($pid);
if ($pid == 0) {
my $appdir = "$FindBin::Bin/../appengine/blobserver";
# child
my @args = ($dev_appserver,
"--clear_datastore", # kinda redundant as we made a temp dir
"--datastore_path=$datapath",
"--blobstore_path=$blobdir",
"--port=$port",
$appdir);
print STDERR "# Running: [@args]\n";
exec @args;
die "failed to exec: $!\n";
}
$self->{pid} = $pid;
my $last_print = 0;
for (1..15) {
my $now = time();
if ($now != $last_print) {
print STDERR "# Waiting for appengine app to start...\n";
$last_print = $now;
}
my $res = $self->ua->request($self->get("/"));
if ($res && $res->is_success) {
print STDERR "# Up.";
last;
}
Time::HiRes::sleep(0.1);
}
return 1;
}
sub DESTROY {
my $self = shift;
kill 3, $self->{pid} if $self->{pid};
}
1;