Changeset 415


Ignore:
Timestamp:
08/31/10 21:16:24 (14 years ago)
Author:
lnalod
Message:

MATLAB script for the noise ("bruit").

Location:
trunk/examples/nardi/shallow_performanceMeasurement
Files:
2 added
5 edited

Legend:

Unmodified
Added
Removed
  • trunk/examples/nardi/shallow_performanceMeasurement/2shalw_100x100.h

    r414 r415  
    487487} 
    488488} 
     489 
    489490endForward=my_gettimeofday(); 
    490  
    491491         return(0); 
    492492} 
     
    509509         Yvsmatt (YNBS_Vfil, YNBI_Vfil, YMAX_JAC_NBI, &YG1Y_Vfil, Yjac[0], Ytbeta); 
    510510         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     511         #pragma omp atomic 
    511512         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     513         #pragma omp atomic 
    512514         YG1_Vphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    513515         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    518520         Yvsmatt (YNBS_Ufil, YNBI_Ufil, YMAX_JAC_NBI, &YG1Y_Ufil, Yjac[0], Ytbeta); 
    519521         YG1_Ufil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     522         #pragma omp atomic 
    520523         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     524         #pragma omp atomic 
    521525         YG1_Uphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    522526         Yting[0]=YS1_Hfil( Yi, Yj, YTemps-1); 
     
    527531         Yvsmatt (YNBS_Hfil, YNBI_Hfil, YMAX_JAC_NBI, &YG1Y_Hfil, Yjac[0], Ytbeta); 
    528532         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     533         #pragma omp atomic 
    529534         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     535         #pragma omp atomic 
    530536         YG1_Hphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    531537         Yting[0]=YS1_Vfil( Yi, Yj, YTemps-1); 
     
    552558         Yvsmatt (YNBS_Vphy, YNBI_Vphy, YMAX_JAC_NBI, &YG1Y_Vphy, Yjac[0], Ytbeta); 
    553559         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     560         #pragma omp atomic 
    554561         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    555562         if (1==0 || Yj-1<0){}  
    556563         else  
     564         #pragma omp atomic 
    557565         YG1_Hphy( Yi, Yj-1, YTemps-1) += Ytbeta[2]; 
    558566         if (1==0 || Yi-1<0 || Yj-1<0){}  
     
    566574         if (1==0 || Yj-1<0){}  
    567575         else  
     576         #pragma omp atomic 
    568577         YG1_Uphy( Yi, Yj-1, YTemps-1) += Ytbeta[5]; 
     578         #pragma omp atomic 
    569579         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[6]; 
    570580         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    595605         #pragma omp atomic 
    596606         YG1_Hphy( Yi+1, Yj, YTemps-1) += Ytbeta[1]; 
     607         #pragma omp atomic 
    597608         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[2]; 
     609         #pragma omp atomic 
    598610         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[3]; 
    599611         if (1==0 || Yj+1>YA2_Soce-1){}  
    600612         else  
     613         #pragma omp atomic 
    601614         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[4]; 
    602615         if (1==0 || Yi+1>YA1_Soce-1){}  
     
    623636         Yvsmatt (YNBS_Hphy, YNBI_Hphy, YMAX_JAC_NBI, &YG1Y_Hphy, Yjac[0], Ytbeta); 
    624637         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     638         #pragma omp atomic 
    625639         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    626640         if (1==0 || Yi-1<0){}  
     
    630644         if (1==0 || Yj+1>YA2_Soce-1){}  
    631645         else  
     646         #pragma omp atomic 
    632647         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[3]; 
     648         #pragma omp atomic 
    633649         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[4]; 
    634650 
     
    646662  printf("Average %f\n", (differenceForward + differenceBackward) / counter ); 
    647663  printf("\n############################################################################\n\n"); 
     664 
    648665 
    649666 
  • trunk/examples/nardi/shallow_performanceMeasurement/2shalw_200x200.h

    r414 r415  
    508508         Yvsmatt (YNBS_Vfil, YNBI_Vfil, YMAX_JAC_NBI, &YG1Y_Vfil, Yjac[0], Ytbeta); 
    509509         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     510         #pragma omp atomic 
    510511         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     512         #pragma omp atomic 
    511513         YG1_Vphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    512514         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    517519         Yvsmatt (YNBS_Ufil, YNBI_Ufil, YMAX_JAC_NBI, &YG1Y_Ufil, Yjac[0], Ytbeta); 
    518520         YG1_Ufil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     521         #pragma omp atomic 
    519522         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     523         #pragma omp atomic 
    520524         YG1_Uphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    521525         Yting[0]=YS1_Hfil( Yi, Yj, YTemps-1); 
     
    526530         Yvsmatt (YNBS_Hfil, YNBI_Hfil, YMAX_JAC_NBI, &YG1Y_Hfil, Yjac[0], Ytbeta); 
    527531         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     532         #pragma omp atomic 
    528533         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     534         #pragma omp atomic 
    529535         YG1_Hphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    530536         Yting[0]=YS1_Vfil( Yi, Yj, YTemps-1); 
     
    551557         Yvsmatt (YNBS_Vphy, YNBI_Vphy, YMAX_JAC_NBI, &YG1Y_Vphy, Yjac[0], Ytbeta); 
    552558         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     559         #pragma omp atomic 
    553560         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    554561         if (1==0 || Yj-1<0){}  
    555562         else  
     563         #pragma omp atomic 
    556564         YG1_Hphy( Yi, Yj-1, YTemps-1) += Ytbeta[2]; 
    557565         if (1==0 || Yi-1<0 || Yj-1<0){}  
     
    565573         if (1==0 || Yj-1<0){}  
    566574         else  
     575         #pragma omp atomic 
    567576         YG1_Uphy( Yi, Yj-1, YTemps-1) += Ytbeta[5]; 
     577         #pragma omp atomic 
    568578         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[6]; 
    569579         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    594604         #pragma omp atomic 
    595605         YG1_Hphy( Yi+1, Yj, YTemps-1) += Ytbeta[1]; 
     606         #pragma omp atomic 
    596607         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[2]; 
     608         #pragma omp atomic 
    597609         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[3]; 
    598610         if (1==0 || Yj+1>YA2_Soce-1){}  
    599611         else  
     612         #pragma omp atomic 
    600613         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[4]; 
    601614         if (1==0 || Yi+1>YA1_Soce-1){}  
     
    622635         Yvsmatt (YNBS_Hphy, YNBI_Hphy, YMAX_JAC_NBI, &YG1Y_Hphy, Yjac[0], Ytbeta); 
    623636         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     637         #pragma omp atomic 
    624638         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    625639         if (1==0 || Yi-1<0){}  
     
    629643         if (1==0 || Yj+1>YA2_Soce-1){}  
    630644         else  
     645         #pragma omp atomic 
    631646         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[3]; 
     647         #pragma omp atomic 
    632648         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[4]; 
    633649 
  • trunk/examples/nardi/shallow_performanceMeasurement/2shalw_50x50.h

    r414 r415  
    509509         Yvsmatt (YNBS_Vfil, YNBI_Vfil, YMAX_JAC_NBI, &YG1Y_Vfil, Yjac[0], Ytbeta); 
    510510         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     511         #pragma omp atomic 
    511512         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     513         #pragma omp atomic 
    512514         YG1_Vphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    513515         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    518520         Yvsmatt (YNBS_Ufil, YNBI_Ufil, YMAX_JAC_NBI, &YG1Y_Ufil, Yjac[0], Ytbeta); 
    519521         YG1_Ufil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     522         #pragma omp atomic 
    520523         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     524         #pragma omp atomic 
    521525         YG1_Uphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    522526         Yting[0]=YS1_Hfil( Yi, Yj, YTemps-1); 
     
    527531         Yvsmatt (YNBS_Hfil, YNBI_Hfil, YMAX_JAC_NBI, &YG1Y_Hfil, Yjac[0], Ytbeta); 
    528532         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     533         #pragma omp atomic 
    529534         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
     535         #pragma omp atomic 
    530536         YG1_Hphy( Yi, Yj, YTemps) += Ytbeta[2]; 
    531537         Yting[0]=YS1_Vfil( Yi, Yj, YTemps-1); 
     
    552558         Yvsmatt (YNBS_Vphy, YNBI_Vphy, YMAX_JAC_NBI, &YG1Y_Vphy, Yjac[0], Ytbeta); 
    553559         YG1_Vfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     560         #pragma omp atomic 
    554561         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    555562         if (1==0 || Yj-1<0){}  
    556563         else  
     564         #pragma omp atomic 
    557565         YG1_Hphy( Yi, Yj-1, YTemps-1) += Ytbeta[2]; 
    558566         if (1==0 || Yi-1<0 || Yj-1<0){}  
     
    566574         if (1==0 || Yj-1<0){}  
    567575         else  
     576         #pragma omp atomic 
    568577         YG1_Uphy( Yi, Yj-1, YTemps-1) += Ytbeta[5]; 
     578         #pragma omp atomic 
    569579         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[6]; 
    570580         Yting[0]=YS1_Ufil( Yi, Yj, YTemps-1); 
     
    595605         #pragma omp atomic 
    596606         YG1_Hphy( Yi+1, Yj, YTemps-1) += Ytbeta[1]; 
     607         #pragma omp atomic 
    597608         YG1_Hphy( Yi, Yj, YTemps-1) += Ytbeta[2]; 
     609         #pragma omp atomic 
    598610         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[3]; 
    599611         if (1==0 || Yj+1>YA2_Soce-1){}  
    600612         else  
     613         #pragma omp atomic 
    601614         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[4]; 
    602615         if (1==0 || Yi+1>YA1_Soce-1){}  
     
    623636         Yvsmatt (YNBS_Hphy, YNBI_Hphy, YMAX_JAC_NBI, &YG1Y_Hphy, Yjac[0], Ytbeta); 
    624637         YG1_Hfil( Yi, Yj, YTemps-1) += Ytbeta[0]; 
     638         #pragma omp atomic 
    625639         YG1_Uphy( Yi, Yj, YTemps-1) += Ytbeta[1]; 
    626640         if (1==0 || Yi-1<0){}  
     
    630644         if (1==0 || Yj+1>YA2_Soce-1){}  
    631645         else  
     646         #pragma omp atomic 
    632647         YG1_Vphy( Yi, Yj+1, YTemps-1) += Ytbeta[3]; 
     648         #pragma omp atomic 
    633649         YG1_Vphy( Yi, Yj, YTemps-1) += Ytbeta[4]; 
    634650 
  • trunk/examples/nardi/shallow_performanceMeasurement/scriptPerformance.sh

    r414 r415  
    1313# Serial execution 
    1414echo num threads: serial... 
    15 ./shalw_50x50 > resultNotParallelFile_50x50.txt 
     15time ./shalw_50x50 > resultNotParallelFile_50x50.txt 
    1616 
    1717YaoI -p +O3 shalw_50x50 
    1818# 1 thread execution 
    1919echo num threads: 1 
    20 OMP_NUM_THREADS=1 ./shalw_50x50 > resultParallelFile_1thread_50x50.txt 
     20OMP_NUM_THREADS=1 time ./shalw_50x50 > resultParallelFile_1thread_50x50.txt 
    2121 
    2222# 2 thread execution 
    2323echo num threads: 2 
    24 OMP_NUM_THREADS=2 ./shalw_50x50 > resultParallelFile_2thread_50x50.txt 
     24OMP_NUM_THREADS=2 time ./shalw_50x50 > resultParallelFile_2thread_50x50.txt 
    2525 
    2626# 4 thread execution 
    2727echo num threads: 4 
    28 OMP_NUM_THREADS=4 ./shalw_50x50 > resultParallelFile_4thread_50x50.txt 
     28OMP_NUM_THREADS=4 time ./shalw_50x50 > resultParallelFile_4thread_50x50.txt 
    2929 
    3030# 8 thread execution 
    3131echo num threads: 8 
    32 OMP_NUM_THREADS=8 ./shalw_50x50 > resultParallelFile_8thread_50x50.txt 
     32OMP_NUM_THREADS=8 time ./shalw_50x50 > resultParallelFile_8thread_50x50.txt 
    3333 
    3434 
     
    4040# Serial execution 
    4141echo num threads: serial... 
    42 ./shalw_100x100 > resultNotParallelFile_100x100.txt 
     42time ./shalw_100x100 > resultNotParallelFile_100x100.txt 
    4343 
    4444YaoI -p +O3 shalw_100x100 
    4545# 1 thread execution 
    4646echo num threads: 1 
    47 OMP_NUM_THREADS=1 ./shalw_100x100 > resultParallelFile_1thread_100x100.txt 
     47OMP_NUM_THREADS=1 time ./shalw_100x100 > resultParallelFile_1thread_100x100.txt 
    4848 
    4949# 2 thread execution 
    5050echo num threads: 2 
    51 OMP_NUM_THREADS=2 ./shalw_100x100 > resultParallelFile_2thread_100x100.txt 
     51OMP_NUM_THREADS=2 time ./shalw_100x100 > resultParallelFile_2thread_100x100.txt 
    5252 
    5353# 4 thread execution 
    5454echo num threads: 4 
    55 OMP_NUM_THREADS=4 ./shalw_100x100 > resultParallelFile_4thread_100x100.txt 
     55OMP_NUM_THREADS=4 time ./shalw_100x100 > resultParallelFile_4thread_100x100.txt 
    5656 
    5757# 8 thread execution 
    5858echo num threads: 8 
    59 OMP_NUM_THREADS=8 ./shalw_100x100 > resultParallelFile_8thread_100x100.txt 
     59OMP_NUM_THREADS=8 time ./shalw_100x100 > resultParallelFile_8thread_100x100.txt 
    6060 
    6161 
     
    6767# Serial execution 
    6868echo num threads: serial... 
    69 ./shalw_200x200 > resultNotParallelFile_200x200.txt 
     69time ./shalw_200x200 > resultNotParallelFile_200x200.txt 
    7070 
    7171YaoI -p +O3 shalw_200x200 
    7272# 1 thread execution 
    7373echo num threads: 1 
    74 OMP_NUM_THREADS=1 ./shalw_200x200 > resultParallelFile_1thread_200x200.txt 
     74OMP_NUM_THREADS=1 time ./shalw_200x200 > resultParallelFile_1thread_200x200.txt 
    7575 
    7676# 2 thread execution 
    7777echo num threads: 2 
    78 OMP_NUM_THREADS=2 ./shalw_200x200 > resultParallelFile_2thread_200x200.txt 
     78OMP_NUM_THREADS=2 time ./shalw_200x200 > resultParallelFile_2thread_200x200.txt 
    7979 
    8080# 4 thread execution 
    8181echo num threads: 4 
    82 OMP_NUM_THREADS=4 ./shalw_200x200 > resultParallelFile_4thread_200x200.txt 
     82OMP_NUM_THREADS=4 time ./shalw_200x200 > resultParallelFile_4thread_200x200.txt 
    8383 
    8484# 8 thread execution 
    8585echo num threads: 8 
    86 OMP_NUM_THREADS=8 ./shalw_200x200 > resultParallelFile_8thread_200x200.txt 
     86OMP_NUM_THREADS=8 time ./shalw_200x200 > resultParallelFile_8thread_200x200.txt 
    8787 
    8888 
  • trunk/examples/nardi/shallow_performanceMeasurement/shalw.d

    r33 r415  
    8  8  
    9  9  //option o_gradtest 
    10    //option o_parallel 
       10 option o_parallel 
    11 11 option o_m1qn3 
    12 12 
Note: See TracChangeset for help on using the changeset viewer.