Mercurial > hg > CbC > CbC_gcc
comparison gcc/config/sh/sh4a.md @ 0:a06113de4d67
first commit
author | kent <kent@cr.ie.u-ryukyu.ac.jp> |
---|---|
date | Fri, 17 Jul 2009 14:47:48 +0900 |
parents | |
children | 04ced10e8804 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:a06113de4d67 |
---|---|
1 ;; Scheduling description for Renesas SH4a | |
2 ;; Copyright (C) 2003, 2004, 2006, 2007 Free Software Foundation, Inc. | |
3 ;; | |
4 ;; This file is part of GCC. | |
5 ;; | |
6 ;; GNU CC is free software; you can redistribute it and/or modify | |
7 ;; it under the terms of the GNU General Public License as published by | |
8 ;; the Free Software Foundation; either version 3, or (at your option) | |
9 ;; any later version. | |
10 ;; | |
11 ;; GNU CC is distributed in the hope that it will be useful, | |
12 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 ;; GNU General Public License for more details. | |
15 ;; | |
16 ;; You should have received a copy of the GNU General Public License | |
17 ;; along with GCC; see the file COPYING3. If not see | |
18 ;; <http://www.gnu.org/licenses/>. | |
19 | |
20 ;; The following description models the SH4A pipeline | |
21 ;; using the DFA based scheduler. | |
22 | |
23 (define_automaton "sh4a") | |
24 | |
25 (define_cpu_unit "sh4a_ex" "sh4a") | |
26 (define_cpu_unit "sh4a_ls" "sh4a") | |
27 (define_cpu_unit "sh4a_fex" "sh4a") | |
28 (define_cpu_unit "sh4a_fls" "sh4a") | |
29 (define_cpu_unit "sh4a_mult" "sh4a") | |
30 (define_cpu_unit "sh4a_fdiv" "sh4a") | |
31 | |
32 ;; Decoding is done on the integer pipeline like the | |
33 ;; sh4. Define issue to be the | of the two pipelines | |
34 ;; to control how often instructions are issued. | |
35 (define_reservation "ID_or" "sh4a_ex|sh4a_ls") | |
36 (define_reservation "ID_and" "sh4a_ex+sh4a_ls") | |
37 | |
38 | |
39 ;; ======================================================= | |
40 ;; Locking Descriptions | |
41 | |
42 ;; Sh4a_Memory access on the LS pipeline. | |
43 (define_cpu_unit "sh4a_memory" "sh4a") | |
44 | |
45 ;; Other access on the LS pipeline. | |
46 (define_cpu_unit "sh4a_load_store" "sh4a") | |
47 | |
48 ;; The address calculator used for branch instructions. | |
49 ;; This will be reserved after "issue" of branch instructions | |
50 ;; and this is to make sure that no two branch instructions | |
51 ;; can be issued in parallel. | |
52 (define_reservation "sh4a_addrcalc" "sh4a_ex") | |
53 | |
54 ;; ======================================================= | |
55 ;; Reservations | |
56 | |
57 ;; Branch (BF,BF/S,BT,BT/S,BRA,BSR) | |
58 ;; Group: BR | |
59 ;; Latency when taken: 2 | |
60 (define_insn_reservation "sh4a_branch" 2 | |
61 (and (eq_attr "cpu" "sh4a") | |
62 (eq_attr "type" "cbranch,jump")) | |
63 "ID_or+sh4a_addrcalc") | |
64 | |
65 ;; Jump (JSR,JMP,RTS) | |
66 ;; Group: BR | |
67 ;; Latency: 3 | |
68 (define_insn_reservation "sh4a_jump" 3 | |
69 (and (eq_attr "cpu" "sh4a") | |
70 (eq_attr "type" "return,jump_ind")) | |
71 "ID_or+sh4a_addrcalc") | |
72 | |
73 ;; RTE | |
74 ;; Group: CO | |
75 ;; Latency: 3 | |
76 (define_insn_reservation "sh4a_rte" 3 | |
77 (and (eq_attr "cpu" "sh4a") | |
78 (eq_attr "type" "rte")) | |
79 "ID_and*4") | |
80 | |
81 ;; EX Group Single | |
82 ;; Group: EX | |
83 ;; Latency: 0 | |
84 (define_insn_reservation "sh4a_ex" 0 | |
85 (and (eq_attr "cpu" "sh4a") | |
86 (eq_attr "insn_class" "ex_group")) | |
87 "sh4a_ex") | |
88 | |
89 ;; MOVA | |
90 ;; Group: LS | |
91 ;; Latency: 1 | |
92 (define_insn_reservation "sh4a_mova" 1 | |
93 (and (eq_attr "cpu" "sh4a") | |
94 (eq_attr "type" "mova")) | |
95 "sh4a_ls+sh4a_load_store") | |
96 | |
97 ;; MOV | |
98 ;; Group: MT | |
99 ;; Latency: 0 | |
100 ;; ??? not sure if movi8 belongs here, but that's where it was | |
101 ;; effectively before. | |
102 (define_insn_reservation "sh4a_mov" 0 | |
103 (and (eq_attr "cpu" "sh4a") | |
104 (eq_attr "type" "move,movi8,gp_mac")) | |
105 "ID_or") | |
106 | |
107 ;; Load | |
108 ;; Group: LS | |
109 ;; Latency: 3 | |
110 (define_insn_reservation "sh4a_load" 3 | |
111 (and (eq_attr "cpu" "sh4a") | |
112 (eq_attr "type" "load,pcload,mem_mac")) | |
113 "sh4a_ls+sh4a_memory") | |
114 | |
115 (define_insn_reservation "sh4a_load_si" 3 | |
116 (and (eq_attr "cpu" "sh4a") | |
117 (eq_attr "type" "load_si,pcload_si")) | |
118 "sh4a_ls+sh4a_memory") | |
119 | |
120 ;; Store | |
121 ;; Group: LS | |
122 ;; Latency: 0 | |
123 (define_insn_reservation "sh4a_store" 0 | |
124 (and (eq_attr "cpu" "sh4a") | |
125 (eq_attr "type" "store,fstore,mac_mem")) | |
126 "sh4a_ls+sh4a_memory") | |
127 | |
128 ;; CWB TYPE | |
129 | |
130 ;; MOVUA | |
131 ;; Group: LS | |
132 ;; Latency: 3 | |
133 (define_insn_reservation "sh4a_movua" 3 | |
134 (and (eq_attr "cpu" "sh4a") | |
135 (eq_attr "type" "movua")) | |
136 "sh4a_ls+sh4a_memory*2") | |
137 | |
138 ;; Fixed point multiplication (single) | |
139 ;; Group: CO | |
140 ;; Latency: 2 | |
141 (define_insn_reservation "sh4a_smult" 2 | |
142 (and (eq_attr "cpu" "sh4a") | |
143 (eq_attr "type" "smpy")) | |
144 "ID_or+sh4a_mult") | |
145 | |
146 ;; Fixed point multiplication (double) | |
147 ;; Group: CO | |
148 ;; Latency: 3 | |
149 (define_insn_reservation "sh4a_dmult" 3 | |
150 (and (eq_attr "cpu" "sh4a") | |
151 (eq_attr "type" "dmpy")) | |
152 "ID_or+sh4a_mult") | |
153 | |
154 (define_insn_reservation "sh4a_mac_gp" 3 | |
155 (and (eq_attr "cpu" "sh4a") | |
156 (eq_attr "type" "mac_gp")) | |
157 "ID_and") | |
158 | |
159 ;; Other MT group instructions(1 step operations) | |
160 ;; Group: MT | |
161 ;; Latency: 1 | |
162 (define_insn_reservation "sh4a_mt" 1 | |
163 (and (eq_attr "cpu" "sh4a") | |
164 (eq_attr "type" "mt_group")) | |
165 "ID_or") | |
166 | |
167 ;; Floating point reg move | |
168 ;; Group: LS | |
169 ;; Latency: 2 | |
170 (define_insn_reservation "sh4a_freg_mov" 2 | |
171 (and (eq_attr "cpu" "sh4a") | |
172 (eq_attr "type" "fmove")) | |
173 "sh4a_ls,sh4a_fls") | |
174 | |
175 ;; Single precision floating point computation FCMP/EQ, | |
176 ;; FCMP/GT, FADD, FLOAT, FMAC, FMUL, FSUB, FTRC, FRVHG, FSCHG | |
177 ;; Group: FE | |
178 ;; Latency: 3 | |
179 (define_insn_reservation "sh4a_fp_arith" 3 | |
180 (and (eq_attr "cpu" "sh4a") | |
181 (eq_attr "type" "fp,fp_cmp,fpscr_toggle")) | |
182 "ID_or,sh4a_fex") | |
183 | |
184 (define_insn_reservation "sh4a_fp_arith_ftrc" 3 | |
185 (and (eq_attr "cpu" "sh4a") | |
186 (eq_attr "type" "ftrc_s")) | |
187 "ID_or,sh4a_fex") | |
188 | |
189 ;; Single-precision FDIV/FSQRT | |
190 ;; Group: FE | |
191 ;; Latency: 20 | |
192 (define_insn_reservation "sh4a_fdiv" 20 | |
193 (and (eq_attr "cpu" "sh4a") | |
194 (eq_attr "type" "fdiv")) | |
195 "ID_or,sh4a_fex+sh4a_fdiv,sh4a_fex") | |
196 | |
197 ;; Double Precision floating point computation | |
198 ;; (FCNVDS, FCNVSD, FLOAT, FTRC) | |
199 ;; Group: FE | |
200 ;; Latency: 3 | |
201 (define_insn_reservation "sh4a_dp_float" 3 | |
202 (and (eq_attr "cpu" "sh4a") | |
203 (eq_attr "type" "dfp_conv")) | |
204 "ID_or,sh4a_fex") | |
205 | |
206 ;; Double-precision floating-point (FADD,FMUL,FSUB) | |
207 ;; Group: FE | |
208 ;; Latency: 5 | |
209 (define_insn_reservation "sh4a_fp_double_arith" 5 | |
210 (and (eq_attr "cpu" "sh4a") | |
211 (eq_attr "type" "dfp_arith,dfp_mul")) | |
212 "ID_or,sh4a_fex*3") | |
213 | |
214 ;; Double precision FDIV/SQRT | |
215 ;; Group: FE | |
216 ;; Latency: 36 | |
217 (define_insn_reservation "sh4a_dp_div" 36 | |
218 (and (eq_attr "cpu" "sh4a") | |
219 (eq_attr "type" "dfdiv")) | |
220 "ID_or,sh4a_fex+sh4a_fdiv,sh4a_fex*2") | |
221 | |
222 ;; FSRRA | |
223 ;; Group: FE | |
224 ;; Latency: 5 | |
225 (define_insn_reservation "sh4a_fsrra" 5 | |
226 (and (eq_attr "cpu" "sh4a") | |
227 (eq_attr "type" "fsrra")) | |
228 "ID_or,sh4a_fex") | |
229 | |
230 ;; FSCA | |
231 ;; Group: FE | |
232 ;; Latency: 7 | |
233 (define_insn_reservation "sh4a_fsca" 7 | |
234 (and (eq_attr "cpu" "sh4a") | |
235 (eq_attr "type" "fsca")) | |
236 "ID_or,sh4a_fex*3") |