* removed code which splits "unaligned" 8 byte stores/loads into two 4 bytes stores/loads on ppc64. The processor manuals and extensive testing showed that PPC970+ class processors have hardware assisted handling of unaligned memory accesses, which results in 8 byte memory accesses to be always faster than 4 byte ones

git-svn-id: trunk@9721 -
2025-08-03 17:26:05 +02:00 · 2008-01-12 13:47:55 +00:00 · 2008-01-12 13:47:55 +00:00 · 4e60ceb237
commit 4e60ceb237
parent cf295c8e88
1 changed files with 0 additions and 24 deletions
--- a/compiler/powerpc64/cgcpu.pas
+++ b/compiler/powerpc64/cgcpu.pas
@ -726,30 +726,6 @@ begin
  ref2 := ref;
  fixref(list, ref2);

-  { unaligned 64 bit accesses are much slower than unaligned }
-  { 32 bit accesses because they cause a hardware exception  }
-  { (which isn't handled by linux, so there you even get a   }
-  {  crash)                                                  }
-  if (ref.alignment<>0) and
-     (fromsize in [OS_64,OS_S64]) and
-     (ref.alignment<4) then
-    begin
-      if (ref2.base<>NR_NO) and
-         (ref2.index<>NR_NO) then
-        begin
-          tmpreg:=getintregister(list,OS_64);
-          a_op_reg_reg_reg(list,OP_SHR,OS_64,ref2.base,ref2.index,tmpreg);
-          ref2.base:=tmpreg;
-          ref2.index:=NR_NO;
-        end;
-      tmpreg:=getintregister(list,OS_32);
-      a_load_ref_reg(list,OS_32,OS_32,ref2,tmpreg);
-      inc(ref2.offset,4);
-      a_load_ref_reg(list,OS_32,OS_32,ref2,reg); 
-      list.concat(taicpu.op_reg_reg_const_const(A_RLDIMI, reg, tmpreg, 32, 0));
-      exit;
-    end;
-
  op := loadinstr[fromsize, ref2.index <> NR_NO, false];
  { there is no LWAU instruction, simulate using ADDI and LWA }
  if (op = A_NOP) then begin