@@ -94,8 +94,8 @@ typedef FLOAT v4sf_t __attribute__ ((vector_size (16)));
9494#endif
9595#define KERNEL (i ) \
9696 rowA = (vec_t *)&AO[(i)<< 3];\
97- rowB = __builtin_vsx_lxvp(0 , (__vector_pair *)((void *) &BO[(i) << 3])); \
98- rowB1 = __builtin_vsx_lxvp(0 , (__vector_pair *)((void *) &BO[((i) << 3) + 4])); \
97+ rowB = __builtin_vsx_lxvp(0L , (const __vector_pair *)(&BO[(i) << 3])); \
98+ rowB1 = __builtin_vsx_lxvp(0L , (const __vector_pair *)(&BO[((i) << 3) + 4])); \
9999 __builtin_mma_xvf64gerpp(&acc0, rowB, rowA[0]);\
100100 __builtin_mma_xvf64gerpp(&acc1, rowB1, rowA[0]);\
101101 __builtin_mma_xvf64gerpp(&acc2, rowB, rowA[1]);\
@@ -200,8 +200,8 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
200200 BLASLONG l = 1 ;
201201 vec_t * rowA = (vec_t * ) & AO [0 ];
202202 __vector_pair rowB , rowB1 ;
203- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
204- rowB1 = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [4 ]));
203+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
204+ rowB1 = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [4 ]));
205205 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
206206 __builtin_mma_xvf64ger (& acc1 , rowB1 , rowA [0 ]);
207207 __builtin_mma_xvf64ger (& acc2 , rowB , rowA [1 ]);
@@ -283,16 +283,16 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
283283 BLASLONG l = 0 ;
284284 vec_t * rowA = (vec_t * ) & AO [0 ];
285285 __vector_pair rowB , rowB1 ;
286- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
287- rowB1 = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [4 ]));
286+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
287+ rowB1 = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [4 ]));
288288 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
289289 __builtin_mma_xvf64ger (& acc1 , rowB1 , rowA [0 ]);
290290 __builtin_mma_xvf64ger (& acc2 , rowB , rowA [1 ]);
291291 __builtin_mma_xvf64ger (& acc3 , rowB1 , rowA [1 ]);
292292 for (l = 1 ; l < temp ; l ++ ) {
293293 rowA = (vec_t * ) & AO [l << 2 ];
294- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [l << 3 ]));
295- rowB1 = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [(l << 3 ) + 4 ]));
294+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [l << 3 ]));
295+ rowB1 = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [(l << 3 ) + 4 ]));
296296 __builtin_mma_xvf64gerpp (& acc0 , rowB , rowA [0 ]);
297297 __builtin_mma_xvf64gerpp (& acc1 , rowB1 , rowA [0 ]);
298298 __builtin_mma_xvf64gerpp (& acc2 , rowB , rowA [1 ]);
@@ -323,14 +323,14 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
323323 BLASLONG l = 0 ;
324324 vec_t * rowA = (vec_t * ) & AO [0 ];
325325 __vector_pair rowB , rowB1 ;
326- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
327- rowB1 = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [4 ]));
326+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
327+ rowB1 = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [4 ]));
328328 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
329329 __builtin_mma_xvf64ger (& acc1 , rowB1 , rowA [0 ]);
330330 for (l = 1 ; l < temp ; l ++ ) {
331331 rowA = (vec_t * ) & AO [l << 1 ];
332- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [l << 3 ]));
333- rowB1 = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [(l << 3 ) + 4 ]));
332+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [l << 3 ]));
333+ rowB1 = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [(l << 3 ) + 4 ]));
334334 __builtin_mma_xvf64gerpp (& acc0 , rowB , rowA [0 ]);
335335 __builtin_mma_xvf64gerpp (& acc1 , rowB1 , rowA [0 ]);
336336 }
@@ -428,14 +428,14 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
428428 BLASLONG l = 0 ;
429429 vec_t * rowA = (vec_t * ) & AO [0 ];
430430 __vector_pair rowB ;
431- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
431+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
432432 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
433433 __builtin_mma_xvf64ger (& acc1 , rowB , rowA [1 ]);
434434 __builtin_mma_xvf64ger (& acc2 , rowB , rowA [2 ]);
435435 __builtin_mma_xvf64ger (& acc3 , rowB , rowA [3 ]);
436436 for (l = 1 ; l < temp ; l ++ ) {
437437 rowA = (vec_t * ) & AO [l << 3 ];
438- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [l << 2 ]));
438+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [l << 2 ]));
439439 __builtin_mma_xvf64gerpp (& acc0 , rowB , rowA [0 ]);
440440 __builtin_mma_xvf64gerpp (& acc1 , rowB , rowA [1 ]);
441441 __builtin_mma_xvf64gerpp (& acc2 , rowB , rowA [2 ]);
@@ -466,12 +466,12 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
466466 BLASLONG l = 0 ;
467467 vec_t * rowA = (vec_t * ) & AO [0 ];
468468 __vector_pair rowB ;
469- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
469+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
470470 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
471471 __builtin_mma_xvf64ger (& acc1 , rowB , rowA [1 ]);
472472 for (l = 1 ; l < temp ; l ++ ) {
473473 rowA = (vec_t * ) & AO [l << 2 ];
474- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [l << 2 ]));
474+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [l << 2 ]));
475475 __builtin_mma_xvf64gerpp (& acc0 , rowB , rowA [0 ]);
476476 __builtin_mma_xvf64gerpp (& acc1 , rowB , rowA [1 ]);
477477 }
@@ -498,11 +498,11 @@ CNAME (BLASLONG m, BLASLONG n, BLASLONG k, FLOAT alpha, FLOAT * A, FLOAT * B,
498498 BLASLONG l = 0 ;
499499 vec_t * rowA = (vec_t * ) & AO [0 ];
500500 __vector_pair rowB ;
501- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [0 ]));
501+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [0 ]));
502502 __builtin_mma_xvf64ger (& acc0 , rowB , rowA [0 ]);
503503 for (l = 1 ; l < temp ; l ++ ) {
504504 rowA = (vec_t * ) & AO [l << 1 ];
505- rowB = __builtin_vsx_lxvp (0 , (__vector_pair * )(( void * ) & BO [l << 2 ]));
505+ rowB = __builtin_vsx_lxvp (0L , (const __vector_pair * )(& BO [l << 2 ]));
506506 __builtin_mma_xvf64gerpp (& acc0 , rowB , rowA [0 ]);
507507 }
508508 SAVE_ACC (& acc0 , 0 );
0 commit comments