AlphaServer DS10

From: John Henning (henning@perfom.zko.dec.com)
Date: Wed May 26 1999 - 09:15:04 CDT


Hi John,

Here's the AlphaServer DS10. Please add this (and the XP1000, sent
earlier in the week) to your page?

Thanks
   - john

PS. I had encouraged HP to send you results for the N4000.
    Glad to see they did. Who was the submitter?

Script started on Fri May 21 12:23:22 1999
% cat tryit.csh
#!/bin/csh
set verbose
unlimit

cat rpcc.c
cc -c rpcc.c

sleep 2

diff stream_d.f_as_at_ftp_site_22may97 tryit.f

sleep 2

f90 -non_shared -fast -O5 -unroll 8 -arch ev6 \
-assume nounderscore rpcc.o tryit.f

sleep 2

./a.out
% ./tryit.csh
unlimit

cat rpcc.c
/* rpcc.c j.henning hacked from example by d.grunwald*/

#include <c_asm.h>
#include <sys/sysinfo.h>
#include <machine/hal_sysinfo.h>
#include <unistd.h>
#include <sys/resource.h>
#include <sys/types.h>
 
static double scale = -1;
static pid_t mypid = -1;
 
/* fix_rpcc adds the two halves of the register (bias & offset), since
   some tools return it w/o this fixup */

unsigned long
fix_rpcc(unsigned long rpcc)
{
    unsigned long fixed;
    unsigned long offset = (rpcc >> 32) & 0xffffffff;
    unsigned long cycles = (rpcc & 0xffffffff);
    fixed = (unsigned long) offset + (unsigned long) cycles;
    /* printf ("%8lx %8lx %8lx ", offset, cycles, fixed); */
    return fixed;
}
 
/* Compute time in *seconds* (note that Grunwald's original version
   did microseconds) given two fixedup RPCCs */

double
rpcc_delta(unsigned long ul_start, unsigned long ul_stop)
{
    double retval;
 
    if ( scale == -1 ) {
          int err;
          double freq;
          struct cpu_info cpubuf ;
 
          err = getsysinfo(GSI_CPU_INFO, &cpubuf, sizeof(cpubuf));
          /*printf ("err= %d freq = %d current_cpu = %d\n",
               err, cpubuf.mhz, cpubuf.current_cpu);*/
          if (err < 0) {
              freq = 300;
          } else {
              freq = cpubuf.mhz;
          }
          freq *= 1000000;
          /*
           * Scale is the 1 over the clock frequency
           */
          scale = 1/(double) freq;
    }
 
    if (ul_stop < ul_start) {
        retval = ((0xffffffff - ul_start) + ul_stop) * scale;
        }
    else {
        retval = (ul_stop - ul_start) * scale;
        }

    /* printf ("%f\n", retval); */
 
    return retval;
}
 
unsigned long
fixed_rpcc(void)
{
  unsigned long i;

  i = asm("rpcc %v0");
  return fix_rpcc(i);
}
 
 
cc -c rpcc.c

sleep 2

diff stream_d.f_as_at_ftp_site_22may97 tryit.f
53c53,54
< PARAMETER (n=2000000,offset=0,ndim=n+offset,ntimes=10)

---
>       PARAMETER (n = 1000063 ,offset=0)
>       PARAMETER (ndim=n+offset,ntimes=10)
334a336,359
>       END
> 
>       DOUBLE PRECISION FUNCTION SECOND
> *
> *     Assume we will be called often enough so that rpcc counter
> *     doesn't overflow!
> *
>       INTEGER*8 TICK, PREV_TICK
>       DOUBLE PRECISION RPCC_DELTA, PREV_SEC 
>       INTEGER*8 FIXED_RPCC 
>       EXTERNAL FIXED_RPCC, RPCC_DELTA
> 
>       DATA PREV_TICK /0/
> 
>       TICK = FIXED_RPCC()
>       IF (PREV_TICK .EQ. 0) THEN
>            SECOND = 0D0
>       ELSE
>            SECOND = PREV_SEC + RPCC_DELTA (%VAL(PREV_TICK), %VAL(TICK))
>       END IF
> 
>       PREV_SEC = SECOND
>       PREV_TICK   =  TICK
>       RETURN

sleep 2

f90 -non_shared -fast -O5 -unroll 8 -arch ev6 -assume nounderscore rpcc.o tryit.f

sleep 2

./a.out ---------------------------------------------- Double precision appears to have 16 digits of accuracy Assuming 8 bytes per DOUBLE PRECISION word ---------------------------------------------- Array size = 1000063 Offset = 0 The total memory requirement is 22 MB You are running each test 10 times The *best* time for each test is used ---------------------------------------------------- Your clock granularity appears to be less than one microsecond Your clock granularity/precision appears to be 1 microseconds The tests below will each take a time on the order of 16817 microseconds (= 16817 clock ticks) Increase the size of the arrays if this shows that you are not getting at least 20 clock ticks per test. ---------------------------------------------------- WARNING -- The above is only a rough guideline. For best results, please be sure you know the precision of your system timer. ---------------------------------------------------- Function Rate (MB/s) RMS time Min time Max time Copy: 881.1317 0.0185 0.0182 0.0197 Scale: 929.8878 0.0174 0.0172 0.0174 Add: 839.8763 0.0289 0.0286 0.0290 Triad: 900.9164 0.0268 0.0266 0.0279 Sum of a is = 1.153373439229264E+018 Sum of b is = 2.306746878435012E+017 Sum of c is = 3.075662504592511E+017 % exit % script done on Fri May 21 12:23:43 1999



This archive was generated by hypermail 2b29 : Tue Apr 18 2000 - 05:23:08 CDT