1
=== modified file 'ChangeLog.linaro'
2
--- ChangeLog.linaro	2011-06-07 11:18:20 +0000
3
+++ ChangeLog.linaro	2011-06-09 09:02:19 +0000
4
@@ -1,3 +1,24 @@
5
1
2011-06-09  Michael Hope  <michael.hope@linaro.org>
6
2
7
3
	gcc/
8
4
	Backport from mainline:
9
5
10
6
	Chung-Lin Tang  <cltang@codesourcery.com>
11
7
	Richard Earnshaw  <rearnsha@arm.com>
12
8
13
9
	PR target/48250
14
10
	* config/arm/arm.c (arm_legitimize_reload_address): Update cases
15
11
	to use sign-magnitude offsets. Reject unsupported unaligned
16
12
	cases. Add detailed description in comments.
17
13
	* config/arm/arm.md (reload_outdf): Disable for ARM mode; change
18
14
	condition from TARGET_32BIT to TARGET_ARM.
19
15
20
16
	Chung-Lin Tang  <cltang@codesourcery.com>
21
17
22
18
	* config/arm/arm.c (arm_legitimize_reload_address): For NEON
23
19
	quad-word modes, reduce to 9-bit index range when above 1016
24
20
	limit.
25
21
26
1
2011-06-07  Andrew Stubbs  <ams@codesourcery.com>
22
2011-06-07  Andrew Stubbs  <ams@codesourcery.com>
27
2
23
28
3
	Backport from FSF:
24
	Backport from FSF:
29
4
25
30
=== modified file 'gcc/config/arm/arm.c'
31
--- gcc/config/arm/arm.c	2011-05-11 14:49:48 +0000
32
+++ gcc/config/arm/arm.c	2011-06-09 09:02:19 +0000
33
@@ -6419,23 +6419,134 @@
34
6419
      HOST_WIDE_INT val = INTVAL (XEXP (*p, 1));
6419
      HOST_WIDE_INT val = INTVAL (XEXP (*p, 1));
35
6420
      HOST_WIDE_INT low, high;
6420
      HOST_WIDE_INT low, high;
36
6421
6421
54
6422
      if (mode == DImode || (mode == DFmode && TARGET_SOFT_FLOAT))
6422
      /* Detect coprocessor load/stores.  */
55
6423
	low = ((val & 0xf) ^ 0x8) - 0x8;
6423
      bool coproc_p = ((TARGET_HARD_FLOAT
56
6424
      else if (TARGET_MAVERICK && TARGET_HARD_FLOAT)
6424
			&& (TARGET_VFP || TARGET_FPA || TARGET_MAVERICK)
57
6425
	/* Need to be careful, -256 is not a valid offset.  */
6425
			&& (mode == SFmode || mode == DFmode
58
6426
	low = val >= 0 ? (val & 0xff) : -((-val) & 0xff);
6426
			    || (mode == DImode && TARGET_MAVERICK)))
59
6427
      else if (mode == SImode
6427
		       || (TARGET_REALLY_IWMMXT
60
6428
	       || (mode == SFmode && TARGET_SOFT_FLOAT)
6428
			   && VALID_IWMMXT_REG_MODE (mode))
61
6429
	       || ((mode == HImode || mode == QImode) && ! arm_arch4))
6429
		       || (TARGET_NEON
62
6430
	/* Need to be careful, -4096 is not a valid offset.  */
6430
			   && (VALID_NEON_DREG_MODE (mode)
63
6431
	low = val >= 0 ? (val & 0xfff) : -((-val) & 0xfff);
6431
			       || VALID_NEON_QREG_MODE (mode))));
64
6432
      else if ((mode == HImode || mode == QImode) && arm_arch4)
6432
65
6433
	/* Need to be careful, -256 is not a valid offset.  */
6433
      /* For some conditions, bail out when lower two bits are unaligned.  */
66
6434
	low = val >= 0 ? (val & 0xff) : -((-val) & 0xff);
6434
      if ((val & 0x3) != 0
67
6435
      else if (GET_MODE_CLASS (mode) == MODE_FLOAT
6435
	  /* Coprocessor load/store indexes are 8-bits + '00' appended.  */
68
6436
	       && TARGET_HARD_FLOAT && TARGET_FPA)
6436
	  && (coproc_p
69
6437
	/* Need to be careful, -1024 is not a valid offset.  */
6437
	      /* For DI, and DF under soft-float: */
70
6438
	low = val >= 0 ? (val & 0x3ff) : -((-val) & 0x3ff);
6438
	      || ((mode == DImode || mode == DFmode)
71
6439
		  /* Without ldrd, we use stm/ldm, which does not
72
6440
		     fair well with unaligned bits.  */
73
6441
		  && (! TARGET_LDRD
74
6442
		      /* Thumb-2 ldrd/strd is [-1020,+1020] in steps of 4.  */
75
6443
		      || TARGET_THUMB2))))
76
6444
	return false;
77
6445
78
6446
      /* When breaking down a [reg+index] reload address into [(reg+high)+low],
79
6447
	 of which the (reg+high) gets turned into a reload add insn,
80
6448
	 we try to decompose the index into high/low values that can often
81
6449
	 also lead to better reload CSE.
82
6450
	 For example:
83
6451
	         ldr r0, [r2, #4100]  // Offset too large
84
6452
		 ldr r1, [r2, #4104]  // Offset too large
85
6453
86
6454
	 is best reloaded as:
87
6455
	         add t1, r2, #4096
88
6456
		 ldr r0, [t1, #4]
89
6457
		 add t2, r2, #4096
90
6458
		 ldr r1, [t2, #8]
91
6459
92
6460
	 which post-reload CSE can simplify in most cases to eliminate the
93
6461
	 second add instruction:
94
6462
	         add t1, r2, #4096
95
6463
		 ldr r0, [t1, #4]
96
6464
		 ldr r1, [t1, #8]
97
6465
98
6466
	 The idea here is that we want to split out the bits of the constant
99
6467
	 as a mask, rather than as subtracting the maximum offset that the
100
6468
	 respective type of load/store used can handle.
101
6469
102
6470
	 When encountering negative offsets, we can still utilize it even if
103
6471
	 the overall offset is positive; sometimes this may lead to an immediate
104
6472
	 that can be constructed with fewer instructions.
105
6473
	 For example:
106
6474
	         ldr r0, [r2, #0x3FFFFC]
107
6475
108
6476
	 This is best reloaded as:
109
6477
	         add t1, r2, #0x400000
110
6478
		 ldr r0, [t1, #-4]
111
6479
112
6480
	 The trick for spotting this for a load insn with N bits of offset
113
6481
	 (i.e. bits N-1:0) is to look at bit N; if it is set, then chose a
114
6482
	 negative offset that is going to make bit N and all the bits below
115
6483
	 it become zero in the remainder part.
116
6484
117
6485
	 The SIGN_MAG_LOW_ADDR_BITS macro below implements this, with respect
118
6486
	 to sign-magnitude addressing (i.e. separate +- bit, or 1's complement),
119
6487
	 used in most cases of ARM load/store instructions.  */
120
6488
121
6489
#define SIGN_MAG_LOW_ADDR_BITS(VAL, N)					\
122
6490
      (((VAL) & ((1 << (N)) - 1))					\
123
6491
       ? (((VAL) & ((1 << ((N) + 1)) - 1)) ^ (1 << (N))) - (1 << (N))	\
124
6492
       : 0)
125
6493
126
6494
      if (coproc_p)
127
6495
	{
128
6496
	  low = SIGN_MAG_LOW_ADDR_BITS (val, 10);
129
6497
130
6498
	  /* NEON quad-word load/stores are made of two double-word accesses,
131
6499
	     so the valid index range is reduced by 8. Treat as 9-bit range if
132
6500
	     we go over it.  */
133
6501
	  if (TARGET_NEON && VALID_NEON_QREG_MODE (mode) && low >= 1016)
134
6502
	    low = SIGN_MAG_LOW_ADDR_BITS (val, 9);
135
6503
	}
136
6504
      else if (GET_MODE_SIZE (mode) == 8)
137
6505
	{
138
6506
	  if (TARGET_LDRD)
139
6507
	    low = (TARGET_THUMB2
140
6508
		   ? SIGN_MAG_LOW_ADDR_BITS (val, 10)
141
6509
		   : SIGN_MAG_LOW_ADDR_BITS (val, 8));
142
6510
	  else
143
6511
	    /* For pre-ARMv5TE (without ldrd), we use ldm/stm(db/da/ib)
144
6512
	       to access doublewords. The supported load/store offsets are
145
6513
	       -8, -4, and 4, which we try to produce here.  */
146
6514
	    low = ((val & 0xf) ^ 0x8) - 0x8;
147
6515
	}
148
6516
      else if (GET_MODE_SIZE (mode) < 8)
149
6517
	{
150
6518
	  /* NEON element load/stores do not have an offset.  */
151
6519
	  if (TARGET_NEON_FP16 && mode == HFmode)
152
6520
	    return false;
153
6521
154
6522
	  if (TARGET_THUMB2)
155
6523
	    {
156
6524
	      /* Thumb-2 has an asymmetrical index range of (-256,4096).
157
6525
		 Try the wider 12-bit range first, and re-try if the result
158
6526
		 is out of range.  */
159
6527
	      low = SIGN_MAG_LOW_ADDR_BITS (val, 12);
160
6528
	      if (low < -255)
161
6529
		low = SIGN_MAG_LOW_ADDR_BITS (val, 8);
162
6530
	    }
163
6531
	  else
164
6532
	    {
165
6533
	      if (mode == HImode || mode == HFmode)
166
6534
		{
167
6535
		  if (arm_arch4)
168
6536
		    low = SIGN_MAG_LOW_ADDR_BITS (val, 8);
169
6537
		  else
170
6538
		    {
171
6539
		      /* The storehi/movhi_bytes fallbacks can use only
172
6540
			 [-4094,+4094] of the full ldrb/strb index range.  */
173
6541
		      low = SIGN_MAG_LOW_ADDR_BITS (val, 12);
174
6542
		      if (low == 4095 || low == -4095)
175
6543
			return false;
176
6544
		    }
177
6545
		}
178
6546
	      else
179
6547
		low = SIGN_MAG_LOW_ADDR_BITS (val, 12);
180
6548
	    }
181
6549
	}
182
6439
      else
6550
      else
183
6440
	return false;
6551
	return false;
184
6441
6552
185
6442
6553
186
=== modified file 'gcc/config/arm/arm.md'
187
--- gcc/config/arm/arm.md	2011-06-02 15:58:33 +0000
188
+++ gcc/config/arm/arm.md	2011-06-09 09:02:19 +0000
189
@@ -6245,7 +6245,7 @@
190
6245
  [(match_operand:DF 0 "arm_reload_memory_operand" "=o")
6245
  [(match_operand:DF 0 "arm_reload_memory_operand" "=o")
191
6246
   (match_operand:DF 1 "s_register_operand" "r")
6246
   (match_operand:DF 1 "s_register_operand" "r")
192
6247
   (match_operand:SI 2 "s_register_operand" "=&r")]
6247
   (match_operand:SI 2 "s_register_operand" "=&r")]
194
6248
  "TARGET_32BIT"
6248
  "TARGET_THUMB2"
195
6249
  "
6249
  "
196
6250
  {
6250
  {
197
6251
    enum rtx_code code = GET_CODE (XEXP (operands[0], 0));
6251
    enum rtx_code code = GET_CODE (XEXP (operands[0], 0));
Reviewer	Review Type	Date Requested	Status
Richard Sandiford		2011-06-09	Approve on 2011-06-27
Review via email: mp+63965@code.launchpad.net