``` 1D Data Decomposition: Partitioning #include <stdio.h> #include <math h> #include <omp.h> #define NUM_TIME_STEPS 100 #ifndef NUMN #define NUMN 1024 // total number of nodes #endif #ifndef NUMT #define NUMT // number of threads to use #endif #define NUM_NODES_PER_THREAD ( NUMN / NUMT ) float Temps[2][NUMN]; // which array is the "current values"= 0 or 1 int int Next; // which array is being filled = 1 or 0 DoAllWork( int ); void Oregon State University Computer Graphics ``` ``` 8 DoAllWork(), I hiov DoAllWork( int me ) // what range of the global Temps array this thread is responsible for: int first = me * NUM_NODES_PER_THREAD; int last = first + ( NUM_NODES_PER_THREAD - 1 ); for(int step = 0; step < NUM TIME STEPS; step++) // first element on the left: float left = 0: if( me != 0 ) left = Temps[Now][first-1]; float dtemp = ( ( K / (RHO*C) ) * ( left - 2.*Temps[Now][first] + Temps[Now][first+1] ) / ( DELTA*DELTA ) ) * DT; Temps[Next][first] = Temps[Now][first] + dtemp; What happens if two cores are writing to the same cache line? False Sharing! // all the nodes in between: for( int i = first+1; i <= last-1; i++ ) float dtemp = ( ( K / (RHO*C) ) * (Temps[Now][i-1] - 2.*Temps[Now][i] + Temps[Now][i+1])/(DELTA*DELTA))* DT; Temps[Next][i] = Temps[Now][i] + dtemp; Oregon State University Computer Graphics ``` ``` 9 DoAllWork(), II // last element on the right: float right = 0.; if( me != NUMT-1 ) right = Temps[Now][last+1]; float dtemp = ((K/(RHO*C))* ( Temps[Now][last-1] - 2.*Temps[Now][last] + right ) / ( DELTA*DELTA ) ) * DT; Temps[Next][last] = Temps[Now][last] + dtemp; What happens What happens if two cores are writing to the same cache line? // all threads need to wait here so that all Temps[Next][*] values are filled: False Sharing! #pragma omp barrier // want just one thread swapping the definitions of Now and Next: #pragma omp single Now = Next: Next = 1 - Next: } // implied barrier exists here: } // for( int step = ... Because each core is working from left to right across the data, I am Oregon State University Computer Graphics guessing that there is little cache line conflict. ```