# -------------------------------------------------------------------------------------------------------
# Copyright (C) Microsoft. All rights reserved.
# Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
# -------------------------------------------------------------------------------------------------------
#
# Script used for perf testing against individual benchmarks. This script supports "official" mode, which
# dumps an XML file filled with all the data for analysis or exporting into Excel.
#
use strict;
use warnings;
# The legacy data flow deliberately relies on undef-as-zero (latency slots that only
# some tests populate, baseline hashes that are empty on -baseline runs), so only the
# "uninitialized" warning class is disabled.
no warnings 'uninitialized';

use File::Basename;
use File::Spec;

# ----- configuration / state (set by parse_args) -----
my $defaultIter = 35;           # default iteration count; benchmark switches may lower it
my $iter = $defaultIter;
my @testlist = ();              # test names (no .js extension)
my @testlistSwitches = ();      # unused legacy array, kept for the commented-out code in runtest()
my @variants = ("native");      # which engine modes to run
my %switches = ("interpreted" => "-NoNative", "native" => "");
my $other_switches = "";        # extra switches passed to every invocation
my $official_name;
my $OFFICIAL;                   # filehandle for the official-mode XML report
my $is_official = 0;
my $is_baseline = 0;
my $basefile = "perfbase.txt";
my $testfile = "perftest.txt";
my $binary = "";
my $dir = "";
my $skipCheckSwitch = 0;        # use with non-chakra hosts
my $highprecisiondate = 1;
my $args;
my $parse_scores = 0;           # benchmark reports "### SCORE:" lines
my $parse_time = 1;             # benchmark reports "### TIME:" lines
my $parse_latency = 0;          # benchmark reports "### LATENCY:" lines (Octane)
my $is_dynamicProfileRun = 1;
my $profileFile = "dynamicProfileInfo.dpl";
my $perlScriptDir = dirname(__FILE__);
my $testDescription = "";

# measured_data: test -> variant -> metric -> [per-iteration samples]
# measured/variances: test -> variant -> metric -> aggregated value
# baseline/baseline_variances: same shape, loaded from $basefile
my %measured_data;
my %measured;
my %variances;
my %baseline;
my %baseline_variances;

parse_args();

if ($dir) {
    $testDescription = $dir;
}
else {
    print "Specify one of the benchmark octane, sunspider, kraken or jetsream\n";
    print "or specify a directory of perf benchmark\n";
    print "and rerun this script with -baseline.\n";
    print "perl perftest.pl -? for more options. \n";
    die();
}

# make sure the baseline file exists
if ($is_baseline == 0 && !-e $basefile) {
    print "Baseline file $basefile not found. \nRerun this script with -baseline switch.\n";
    print "Provide a binary path for ch.exe as well (-binary:\\ch.exe).\n";
    die();
}

check_switch();

$other_switches .= " -dynamicProfileCache:$profileFile" if $is_dynamicProfileRun;

print "NOTE: Baseline Run\n" if $is_baseline;
print "NOTE: Official Run\n" if $is_official;
print "Baseline file: $basefile\n";
print "Binary: $binary\n";
print "Iterations: $iter\n";
print "High Precision Date not used!\n" if !$highprecisiondate;
print "Switches: $other_switches\n" unless ($other_switches eq "");

$other_switches .= " -highprecisiondate" if $highprecisiondate;

if ($is_baseline) {
    # A baseline run regenerates the baseline file from scratch.
    delete_file($basefile);
}
else {
    # Load the baseline. Three line formats are accepted:
    #   name(variant) time timevar score scorevar   -- full record
    #   name(variant) time timevar                  -- time-only record
    #   name(variant)   score scorevar              -- score-only record (3 spaces, latency lines)
    open(my $IN, '<', $basefile) or die "Couldn't open $basefile for reading.";
    while (<$IN>) {
        if (/^([\w\-\\\.]+)\((\w+)\)\s([-+]?[0-9]*\.?[0-9]+)\s([-+]?[0-9]*\.?[0-9]+)\s([-+]?[0-9]*\.?[0-9]+)\s([-+]?[0-9]*\.?[0-9]+)$/) {
            $baseline{$1}{$2}{"time"} = $3;
            $baseline{$1}{$2}{"score"} = $5;
            $baseline_variances{$1}{$2}{"time"} = $4;
            $baseline_variances{$1}{$2}{"score"} = $6;
        }
        elsif (/^([\w\-\\\.]+)\((\w+)\)\s([-+]?[0-9]*\.?[0-9]+)\s([-+]?[0-9]*\.?[0-9]+)\s*$/) {
            $baseline{$1}{$2}{"time"} = $3;
            $baseline{$1}{$2}{"score"} = 0;
            $baseline_variances{$1}{$2}{"time"} = $4;
            $baseline_variances{$1}{$2}{"score"} = 0;
        }
        elsif (/^([\w\-\\\.]+)\((\w+)\)\s\s\s([-+]?[0-9]*\.?[0-9]+)\s([-+]?[0-9]*\.?[0-9]+)\s*$/) {
            $baseline{$1}{$2}{"time"} = 0;
            $baseline{$1}{$2}{"score"} = $3;
            $baseline_variances{$1}{$2}{"time"} = 0;
            $baseline_variances{$1}{$2}{"score"} = $4;
        }
        else {
            die "Couldn't match baseline file line: $_";
        }
    }
    close($IN);
    delete_file($testfile);
}

# run the benchmark tests
print "Running $testDescription...\n";

foreach my $variant (@variants) {
    print("\n");
    if (!$is_baseline) {
        # FIX: was "RATIO(%)" (invalid printf conversion) with a stray extra argument.
        printf("TEST - %-10s BASE TEST DIFF RATIO(%%)\n", uc($variant));
        print("---------------------------------------------------------------------------\n");
    }
    else {
        printf("Running %s tests...\n", uc($variant));
    }

    # FIX: these were written as "= { ... }" (a hashref assigned to a hash), which
    # stored a stringified reference under a junk key and silently dropped the
    # intended zero initializations. List syntax is required here.
    my %totalVariance = ("time" => 0, "score" => 0);
    my %totalBaseVariance = ("time" => 0, "score" => 0);
    my %basesum = ("time" => 0, "score" => 0);
    my %measuredsum = ("time" => 0, "score" => 0);

    foreach my $test (@testlist) {
        my $testLatency = $test . "Latency";
        if ($is_baseline) {
            print "Running $test...\n";
        }
        delete_profile();
        for (my $i = 0; $i < $iter; ++$i) {
            # store each data point
            my %result = runtest($test, $variant);
            if ($parse_time == 1) {
                $measured_data{$test}{$variant}{"time"}[$i] = $result{"time"};
            }
            if ($parse_scores == 1) {
                $measured_data{$test}{$variant}{"score"}[$i] = $result{"score"};
            }
            if ($parse_latency == 1) {
                # Store Latency score as a separate test - This is used as one of the
                # components in calculating the final GM score.
                $measured_data{$testLatency}{$variant}{"score"}[$i] = $result{"latency"};
            }
        }

        if ($parse_time == 1) {
            # process the time result
            my $testName = $test;
            if ($parse_scores == 1) {
                $testName = $testName . " (time)";
            }
            my %result = processResult($testName, $baseline{$test}{$variant}{"time"}, $baseline_variances{$test}{$variant}{"time"}, $measured_data{$test}{$variant}{"time"}, 0);
            $measured{$test}{$variant}{"time"} = $result{"measured"};
            $variances{$test}{$variant}{"time"} = $result{"variance"};
            # Accumulate absolute variances (variance is a percentage of the value).
            $totalBaseVariance{"time"} += ($baseline{$test}{$variant}{"time"} * $baseline_variances{$test}{$variant}{"time"}) / 100;
            $basesum{"time"} += $baseline{$test}{$variant}{"time"};
            $totalVariance{"time"} += ($measured{$test}{$variant}{"time"} * $variances{$test}{$variant}{"time"}) / 100;
            $measuredsum{"time"} += $measured{$test}{$variant}{"time"};
        }

        if ($parse_scores == 1) {
            # process the score result
            my $testName = $test;
            if ($parse_time == 1) {
                $testName = $testName . " (score)";
            }
            my %result = processResult($testName, $baseline{$test}{$variant}{"score"}, $baseline_variances{$test}{$variant}{"score"}, $measured_data{$test}{$variant}{"score"}, 1);
            $measured{$test}{$variant}{"score"} = $result{"measured"};
            $variances{$test}{$variant}{"score"} = $result{"variance"};
        }

        if ($parse_latency == 1) {
            # Check if this test has a Latency score available
            # (Only Mandreel and Splay has latency scores as of 11/08/2013)
            if ($measured_data{$testLatency}{$variant}{"score"}[0] != 0) {
                my $testName = $testLatency;
                my %result = processResult($testName, $baseline{$testLatency}{$variant}{"score"}, $baseline_variances{$testLatency}{$variant}{"score"}, $measured_data{$testLatency}{$variant}{"score"}, 1);
                $measured{$testLatency}{$variant}{"score"} = $result{"measured"};
                $variances{$testLatency}{$variant}{"score"} = $result{"variance"};
            }
        }
    }

    # generate the geometric means
    if ($parse_scores == 1) {
        my $measuredlog = 0;
        my $variancelog = 0;
        my $baselog = 0;
        my $basevariancelog = 0;
        foreach my $test (@testlist) {
            my $testLatency = $test . "Latency";
            if (!$is_baseline) {
                $baselog += log($baseline{$test}{$variant}{"score"});
                $basevariancelog += log(($baseline{$test}{$variant}{"score"} * $baseline_variances{$test}{$variant}{"score"}) / 100);
                if ($parse_latency == 1) {
                    if (exists $baseline{$testLatency}) {
                        $baselog += log($baseline{$testLatency}{$variant}{"score"});
                        $basevariancelog += log(($baseline{$testLatency}{$variant}{"score"} * $baseline_variances{$testLatency}{$variant}{"score"}) / 100);
                    }
                }
            }
            $measuredlog += log($measured{$test}{$variant}{"score"});
            $variancelog += log(($measured{$test}{$variant}{"score"} * $variances{$test}{$variant}{"score"}) / 100);
            if ($parse_latency == 1) {
                if (exists $measured{$testLatency}) {
                    $measuredlog += log($measured{$testLatency}{$variant}{"score"});
                    $variancelog += log(($measured{$testLatency}{$variant}{"score"} * $variances{$testLatency}{$variant}{"score"}) / 100);
                }
            }
        }
        # %measured contains one key per test plus one per latency entry, matching
        # the terms summed into the logs above.
        my $count = keys(%measured);
        $measuredsum{"score"} = exp($measuredlog / $count);
        $totalVariance{"score"} = exp($variancelog / $count);
        $basesum{"score"} = exp($baselog / $count);
        $totalBaseVariance{"score"} = exp($basevariancelog / $count);
    }

    print("---------------------------------------------------------------------------\n");

    # print the total only if it is not a baseline run.
    if (!$is_baseline) {
        if ($parse_time == 1) {
            my $base_variance = ($totalBaseVariance{"time"} / $basesum{"time"}) * 100;
            my $test_variance = ($totalVariance{"time"} / $measuredsum{"time"}) * 100;
            my $diff = $measuredsum{"time"} - $basesum{"time"};
            my $ratio = ($measuredsum{"time"} / $basesum{"time"} - 1) * 100.0;
            my $investigate = "";
            # Only flag a delta that exceeds the noise on both sides.
            # For time, bigger is worse.
            if ($test_variance < abs($ratio) && $base_variance < abs($ratio)) {
                if ($ratio > 4) {
                    $investigate = "<-CHECK";
                }
                if ($ratio < -4) {
                    $investigate = "<-IMPROVED";
                }
            }
            printf("%-24.24s %6.1f +-%2.1f%%\t%6.1f +-%2.1f%%\t%6.1f\t%5.1f%% %s\n", "TOTAL TIME", $basesum{"time"}, $base_variance, $measuredsum{"time"}, $test_variance, $diff, $ratio, $investigate);
        }
        if ($parse_scores == 1) {
            my $base_variance = ($totalBaseVariance{"score"} / $basesum{"score"}) * 100;
            my $test_variance = ($totalVariance{"score"} / $measuredsum{"score"}) * 100;
            my $diff = $measuredsum{"score"} - $basesum{"score"};
            my $ratio = ($measuredsum{"score"} / $basesum{"score"} - 1) * 100.0;
            my $investigate = "";
            # For scores, bigger is better, so the flags are inverted vs. time.
            if ($test_variance < abs($ratio) && $base_variance < abs($ratio)) {
                if ($ratio > 4) {
                    $investigate = "<-IMPROVED";
                }
                if ($ratio < -4) {
                    $investigate = "<-CHECK";
                }
            }
            printf("%-24.24s %6.1f +-%2.1f%%\t%6.1f +-%2.1f%%\t%6.1f\t%5.1f%% %s\n", "MEAN SCORE", $basesum{"score"}, $base_variance, $measuredsum{"score"}, $test_variance, $diff, $ratio, $investigate);
        }
        print("\n");
    }
}

# handle the official run: dump every raw data point into the XML report.
if ($is_official) {
    official_header();
    # record each test
    foreach my $test (@testlist) {
        official_start_test($test);
        foreach my $variant (@variants) {
            official_start_variant($variant);
            for (my $i = 0; $i < $iter; ++$i) {
                official_record($measured_data{$test}{$variant}{"time"}[$i]);
            }
            official_end_variant($variant);
        }
        official_end_test($test);
    }
    # record the total
    official_start_test("TOTAL");
    foreach my $variant (@variants) {
        official_start_variant($variant);
        for (my $i = 0; $i < $iter; ++$i) {
            my $sum = 0;
            # for each iteration, sum across all tests
            foreach my $test (@testlist) {
                $sum += $measured_data{$test}{$variant}{"time"}[$i];
            }
            official_record($sum);
        }
        official_end_variant($variant);
    }
    official_end_test("TOTAL");
    official_footer();
    exit(0);
}

# output to the baseline file or test result file and exit
saveResult($is_baseline ? $basefile : $testfile);

# saveResult($result_file)
# Writes the aggregated results in the baseline-file format and exits the script.
# FIX: dropped the useless () prototype (the sub takes an argument).
sub saveResult {
    my $result_file = shift;
    open(my $OUT, '>', $result_file) or die "Couldn't open $result_file for writing.";
    foreach my $test (@testlist) {
        foreach my $variant (@variants) {
            print $OUT "$test($variant) $measured{$test}{$variant}{'time'} $variances{$test}{$variant}{'time'} $measured{$test}{$variant}{'score'} $variances{$test}{$variant}{'score'}\n";
            my $testLatency = $test . "Latency";
            if (exists $measured{$testLatency}) {
                # Note: There are extra spaces in this output - which is deliberately
                # added to match the regex (to read from the baseline file)
                print $OUT "$testLatency($variant)   $measured{$testLatency}{$variant}{'score'} $variances{$testLatency}{$variant}{'score'}\n";
            }
        }
    }
    close($OUT);
    exit(0);
}

# processResult($test, $baseline, $baseline_variance, \@data, $bigger_is_better)
# Aggregates the raw samples for one test/metric: sorts them (best first), drops the
# worst 10%, and returns ("measured" => mean, "variance" => stddev as a % of mean).
# On non-baseline runs it also prints the comparison row against the baseline.
sub processResult {
    my $test = shift;
    my $baseline = shift;
    my $baseline_variance = shift;
    my $data = shift;
    my $bigger_is_better = shift;

    my $value = 0;
    my $variance = 0;
    # FIX: was "= { ... }" (hashref assigned to a hash) - see the totals above.
    my %result = ("measured" => 0, "variance" => 0);

    # sort the timings, best values first
    if ($bigger_is_better == 1) {
        @{$data} = sort { $b <=> $a } @{$data};
    }
    else {
        @{$data} = sort { $a <=> $b } @{$data};
    }

    # discard the worst 10% of samples (keeps the best 90% after the sort above)
    my $count = @{$data};
    if ($count >= 10) {
        $count = int($count * 9 / 10);
    }
    for (my $i = 0; $i < $count; ++$i) {
        $value += @{$data}[$i];
    }
    # FIX: was "my $value = $value / $count;", which shadowed the accumulator and
    # only worked by accident of Perl's my-scoping rules.
    $value = $value / $count;
    if ($value > 0) {
        for (my $i = 0; $i < $count; ++$i) {
            $variance += (@{$data}[$i] - $value) * (@{$data}[$i] - $value);
        }
        # relative standard deviation, as a percentage of the mean
        $variance = (sqrt($variance / $count) / $value) * 100;
        if ($variance == 0) {
            $variance = 0.0001; # to avoid divide by zero and ln(0) errors
        }
    }
    else {
        $variance = 0.0001; # to avoid divide by zero and ln(0) errors
    }

    # print the results only if it is not a baseline run.
    if (!$is_baseline) {
        my $diff = $value - $baseline;
        my $ratio = 0;
        if ($baseline > 0) {
            $ratio = ($diff / $baseline) * 100.0;
        }
        else {
            # prevent divide by zero. the lack of precision is acceptable if the
            # tests are taking <1ms
            $ratio = ($diff / 1) * 100.0;
        }
        my $investigate = "";
        if ($variance < abs($ratio) && $baseline_variance < abs($ratio)) {
            if ($ratio > 4) {
                if ($bigger_is_better == 1) {
                    $investigate = "<-IMPROVED";
                }
                else {
                    $investigate = "<-CHECK";
                }
            }
            if ($ratio < -4) {
                if ($bigger_is_better == 1) {
                    $investigate = "<-CHECK";
                }
                else {
                    $investigate = "<-IMPROVED";
                }
            }
        }
        printf("%-24.24s %6.1f +-%2.1f%%\t%6.1f +-%2.1f%%\t%6.1f\t%5.1f%% %s\n", $test, $baseline, $baseline_variance, $value, $variance, $diff, $ratio, $investigate);
    }
    $result{"measured"} = $value;
    $result{"variance"} = $variance;
    return %result;
}

# runtest($testcasename, $variant)
# Runs one iteration of one test under the given variant, parsing the
# "### TIME/SCORE/LATENCY" markers from the redirected output.
# Returns a hash with "time"/"score" (-1 when absent) and optionally "latency".
sub runtest {
    my $testcasename = shift;
    my $variant = shift;
    my %results = ("time" => -1, "score" => -1);

    #TODO investigate what was meant to go here, other than adding whitespace on the end
    #This is a hash slice syntax on an array which is empty, so makes no sense at all
    #$other_switches .= " " . @testlistSwitches{$testcasename};

    if (!$dir) {
        system("$binary $switches{$variant} $other_switches $testcasename.js > _time.txt");
    }
    else {
        my $testpath = File::Spec->catfile($dir, $testcasename);
        system("$binary $switches{$variant} $other_switches $testpath.js > _time.txt");
    }
    open(my $IN, '<', "_time.txt") or die;
    while (<$IN>) {
        if (/###\sTIME:\s(\d+(\.\d+)*)\sms/) {
            $results{"time"} = $1;
        }
        if (/###\sSCORE:\s(\d+)/) {
            $results{"score"} = $1;
        }
        if (/###\sLATENCY:\s(\d+)/) {
            $results{"latency"} = $1;
        }
    }
    close $IN;

    # FIX: was "==" (numeric compare), which is 0 == 0 and therefore always true,
    # so the invalid-output check below was bypassed for every benchmark, not just
    # -file: runs. "eq" restores the intended behavior.
    if ($testDescription eq "custom") {
        # custom runs accept either a time or a score
        if ($results{"time"} != -1 || $results{"score"} != -1) {
            return %results;
        }
    }
    if (($parse_time == 1 && $results{"time"} == -1) || ($parse_scores == 1 && $results{"score"} == -1)) {
        print "ERROR: test produced invalid output while running $testcasename.js\n";
        exit(1);
    }
    return %results;
}

# Dies on an invalid switch combination (e.g. -baseline together with -official).
sub badswitch {
    die "invalid switch combination";
}

# Prints command-line help.
# NOTE(review): the <...> placeholders were stripped from the original source by the
# same corruption that destroyed the whitespace; they are reconstructed here from the
# parse_args() regexes. The iteration default was also corrected from 11 to 35.
sub usage {
    print "Usage: perftest.pl [options]\n";
    print "Options:\n";
    print "  -baseline                Generates a baseline, updating your local baseline file.\n";
    print "                           NOTE: use only with base binary with clean clone from the Chakracore repo\n";
    print "  -basefile:<file>         Uses <file> as your perf baseline (default: perfbase.txt)\n";
    print "  -testfile:<file>         Uses <file> to save your perf test result (default: perftest.txt)\n";
    print "  -dir:<dir>               Uses the test files in the <dir>.\n";
    print "  -binary:<path>           Uses <path> to run the JS files.\n";
    print "  -skipCheckSwitch         Skip checking binary command line switches (use with non-chakra hosts)\n";
    print "  -iterations:<n>          Number of iterations to run tests (default: 35)\n";
    print "  -official:<name>         Generates an official report into results-<name>.xml\n";
    print "  -native                  Only run -native variation (default)\n";
    print "  -interpreted             Only run -interpreted variation\n";
    print "  -nativeAndinterpreted    Run -interpreted along with -native variation\n";
    print "  -nodynamicProfile        Run without dynamic profile info\n";
    print "  -dynamicProfile          Force Run with dynamic profile info\n";
    print "  -sunspider               Run the sunspider 1.0.2 benchmark\n";
    print "  -kraken                  Run the kraken benchmark\n";
    print "  -octane                  Run the Octane 2.0 benchmark\n";
    print "  -jetstream               Run the JetStream benchmark (only non octane and sunspider tests)\n";
    print "  -file:<test>.js          Run the specified js file\n";
    print "  -args:<args>             Other arguments to ch.exe\n";
    print "  -score                   Test output scores\n";
}

# Parses @ARGV into the file-scoped configuration variables. Dies on unknown
# switches or when -binary: is missing.
sub parse_args {
    my $forceDynamicProfileOn;
    my $forceDynamicProfileOff;
    if (@ARGV == 1 && $ARGV[0] =~ /[-\/]\?/) {
        usage();
        exit(0);
    }
    for (my $i = 0; $i < @ARGV; ++$i) {
        if ($ARGV[$i] =~ /[-\/]baseline/) {
            $is_baseline = 1;
            badswitch() if $is_official;
        }
        elsif ($ARGV[$i] =~ /[-\/]basefile:(.*)$/) {
            $basefile = $1;
            badswitch() if $is_official;
        }
        elsif ($ARGV[$i] =~ /[-\/]testfile:(.*)$/) {
            $testfile = $1;
            badswitch() if $is_official;
        }
        elsif ($ARGV[$i] =~ /[-\/]binary:(.*)$/) {
            $binary = $1;
        }
        elsif ($ARGV[$i] =~ /[-\/]skipCheckSwitch/) {
            $skipCheckSwitch = 1;
        }
        elsif ($ARGV[$i] =~ /[-\/]dir:(.*)$/) {
            if ($1) {
                $dir = $1;
                print "dir = $1\n";
            }
            else {
                $dir = ".";
                print "dir = $1\n";
            }
            # opens the directory and reads the .js test files in it
            # FIX: lexical dir handle instead of a bareword; the extension match and
            # strip were "/.js/" and "s/(.*).js/$1/" with unescaped/unanchored dots,
            # which also matched names like "fooxjs".
            opendir(my $dirHandle, $dir) || die("Cannot open directory");
            @testlist = grep (/\.js$/, readdir($dirHandle));
            closedir($dirHandle);
            for (@testlist) {
                s/\.js$//;
            }
            $is_dynamicProfileRun = 0;
        }
        elsif ($ARGV[$i] =~ /[-\/]iterations:(\d+)$/) {
            $iter = $1;
        }
        elsif ($ARGV[$i] =~ /[-\/]official:(.*)$/) {
            $is_official = 1;
            $official_name = $1;
            open($OFFICIAL, '>', "results-$official_name.xml") or die "Cannot open official results XML file for writing";
            badswitch() if $is_baseline;
        }
        # FIX: -nativeAndInterpreted must be tested before -native; the unanchored
        # /[-\/]native/ also matches "-nativeAndInterpreted", which made the
        # dual-variant branch unreachable in the original ordering.
        elsif ($ARGV[$i] =~ /[-\/]nativeAndInterpreted/) {
            @variants = ("native", "interpreted");
        }
        elsif ($ARGV[$i] =~ /[-\/]native/) {
            @variants = ("native");
        }
        elsif ($ARGV[$i] =~ /[-\/]interpreted/) {
            @variants = ("interpreted");
        }
        elsif ($ARGV[$i] =~ /[-\/]octane/) {
            if ($iter == $defaultIter) {
                $iter = 10;
            }
            @testlist = ("box2d", "code-load", "crypto", "deltablue", "earley-boyer", "gbemu", "mandreel", "navier-stokes", "pdfjs", "raytrace", "regexp", "richards", "splay", "typescript", "zlib");
            $testDescription = "octane 2.0 benchmark";
            $parse_time = 0;
            $parse_scores = 1;
            $parse_latency = 1;
            $dir = "Octane";
            $basefile = "perfbase$dir.txt";
            $testfile = "perftest$dir.txt";
            $is_dynamicProfileRun = 0; # Currently octane dyna-pogo info is not avialable in the browser - remove this when it is.
        }
        elsif ($ARGV[$i] =~ /[-\/]jetstream/) {
            if ($iter == $defaultIter) {
                $iter = 5;
            }
            @testlist = ("bigfib.cpp", "container.cpp", "dry.c", "float-mm.c", "gcc-loops.cpp", "hash-map", "n-body.c", "quicksort.c", "towers.c", "cdjs");
            $testDescription = "JetStream benchmark";
            $parse_time = 0;
            $parse_scores = 1;
            $parse_latency = 0;
            $dir = "jetstream";
            $basefile = "perfbase$dir.txt";
            $testfile = "perftest$dir.txt";
            $is_dynamicProfileRun = 0; # Currently dyna-pogo info is not avialable in the browser - remove this when it is.
        }
        elsif ($ARGV[$i] =~ /[-\/]kraken/i) {
            if ($iter == $defaultIter) {
                $iter = 10;
            }
            @testlist = ("ai-astar", "audio-beat-detection", "audio-dft", "audio-fft", "audio-oscillator", "imaging-darkroom", "imaging-desaturate", "imaging-gaussian-blur", "json-parse-financial", "json-stringify-tinderbox", "stanford-crypto-aes", "stanford-crypto-ccm", "stanford-crypto-pbkdf2", "stanford-crypto-sha256-iterative");
            $testDescription = "kraken benchmark";
            $dir = "Kraken";
            $basefile = "perfbase$dir.txt";
            $testfile = "perftest$dir.txt";
            $highprecisiondate = 0;
        }
        elsif ($ARGV[$i] =~ /[-\/]sunspider/i) {
            @testlist = ("3d-cube", "3d-morph", "3d-raytrace", "access-binary-trees", "access-fannkuch", "access-nbody", "access-nsieve", "bitops-3bit-bits-in-byte", "bitops-bits-in-byte", "bitops-bitwise-and", "bitops-nsieve-bits", "controlflow-recursive", "crypto-aes", "crypto-md5", "crypto-sha1", "date-format-tofte", "date-format-xparb", "math-cordic", "math-partial-sums", "math-spectral-norm", "regexp-dna", "string-base64", "string-fasta", "string-tagcloud", "string-unpack-code", "string-validate-input");
            $dir = "SunSpider";
            $basefile = "perfbase$dir.txt";
            $testfile = "perftest$dir.txt";
            $is_dynamicProfileRun = 1;
        }
        elsif ($ARGV[$i] =~ /[-\/]file:(.*)\.js$/i) {
            # only supports octane, add additional support here for jetstream
            my %scoreTests = ("box2d" => 1, "code-load" => 1, "crypto" => 1, "deltablue" => 1, "earley-boyer" => 1, "gbemu" => 1, "mandreel" => 1, "navier-stokes" => 1, "pdfjs" => 1, "raytrace" => 1, "regexp" => 1, "richards" => 1, "splay" => 1, "zlib" => 1, "typescript" => 1);
            @testlist = ($1);
            my $test = lc $1;
            if (exists $scoreTests{$test}) {
                $parse_scores = 1;
                $parse_time = 0;
                $is_dynamicProfileRun = 0; # Currently octane dyna-pogo info is not avialable in the browser - remove this when it is.
                if ($iter == $defaultIter) {
                    $iter = 10;
                }
            }
            $testDescription = "custom";
        }
        elsif ($ARGV[$i] =~ /[-\/]score/i) {
            $parse_scores = 1;
            $parse_time = 0;
        }
        elsif ($ARGV[$i] =~ /[-\/]Off:(.*)$/i) {
            $other_switches .= " -Off:" . $1;
        }
        elsif ($ARGV[$i] =~ /[-\/]On:(.*)$/i) {
            $other_switches .= " -On:" . $1;
        }
        elsif ($ARGV[$i] =~ /[-\/]args:(.*)$/i) {
            $other_switches .= " " . $1;
        }
        elsif ($ARGV[$i] =~ /[-\/]noDynamicProfile/i) {
            $forceDynamicProfileOff = 1;
        }
        elsif ($ARGV[$i] =~ /[-\/]dynamicProfile/i) {
            $forceDynamicProfileOn = 1;
        }
        else {
            print "ERROR: Invalid argument $ARGV[$i] to script\n";
            die;
        }
    }
    # explicit switches override whatever the benchmark presets chose
    if ($forceDynamicProfileOff) {
        $is_dynamicProfileRun = 0;
    }
    if ($forceDynamicProfileOn) {
        $is_dynamicProfileRun = 1;
    }
    if ($binary eq "") {
        print "ERROR: Provide a binary path for ch.exe (-binary:\\ch.exe).\n";
        die;
    }
}

# ----- official-mode XML report helpers -----
# NOTE(review): the XML element text inside these prints was lost from the original
# source (only the print/tab/newline skeleton survived the corruption). The tag
# names below are a plausible reconstruction that preserves the surviving
# indentation -- verify against a previously generated results-<name>.xml.

sub official_header {
    print $OFFICIAL "<results>\n";
}

sub official_footer {
    print $OFFICIAL "</results>\n";
    close($OFFICIAL);
}

sub official_start_test {
    my $testname = shift;
    print $OFFICIAL "<test name=\"$testname\">\n";
}

sub official_end_test {
    print $OFFICIAL "</test>\n";
}

sub official_start_variant {
    my $variant = shift;
    print $OFFICIAL "\t<variant name=\"$variant\">\n";
}

sub official_end_variant {
    print $OFFICIAL "\t</variant>\n";
}

sub official_record {
    my $time = shift;
    print $OFFICIAL "\t\t<iteration time=\"$time\"/>\n";
}

# Probes the binary's -? output to learn whether it supports the
# HighPrecisionDate and DynamicProfileCache switches, downgrading the
# corresponding options when it does not.
sub check_switch {
    # Use -skipCheckSwitch to avoid checking command line switches with
    # non-chakra hosts (Following "... -?" may enter host command loop.)
    if ($skipCheckSwitch) {
        return;
    }
    system("$binary -? > _time.txt");
    open(my $IN, '<', "_time.txt") or die;
    my $dynamicProfileSupported = 0;
    my $highprecisiondateSupported = 0;
    while (<$IN>) {
        if (/\sHighPrecisionDate/) {
            $highprecisiondateSupported = 1;
        }
        if (/\sDynamicProfileCache/) {
            $dynamicProfileSupported = 1;
        }
    }
    close($IN);
    if ($is_dynamicProfileRun && !$dynamicProfileSupported) {
        print "Warning: Persistent Dynamic profile is not supported! \n";
        $is_dynamicProfileRun = 0;
    }
    if (!$highprecisiondateSupported) {
        $highprecisiondate = 0;
    }
}

# Deletes the dynamic profile cache so each test starts cold.
sub delete_profile {
    if ($is_dynamicProfileRun) {
        delete_file($profileFile);
    }
}

# delete_file($f)
# Removes $f if it exists; dies if the file is still present afterwards.
# FIX: dropped the useless () prototype (the sub takes an argument).
sub delete_file {
    my $f = shift;
    if (-e $f) {
        unlink($f);
        if (-e $f) {
            print "File could not be deleted: $f\n";
            die();
        }
    }
}