1;; Scheduling description for IBM POWER5 processor. 2;; Copyright (C) 2003-2018 Free Software Foundation, Inc. 3;; 4;; This file is part of GCC. 5;; 6;; GCC is free software; you can redistribute it and/or modify it 7;; under the terms of the GNU General Public License as published 8;; by the Free Software Foundation; either version 3, or (at your 9;; option) any later version. 10;; 11;; GCC is distributed in the hope that it will be useful, but WITHOUT 12;; ANY WARRANTY; without even the implied warranty of MERCHANTABILITY 13;; or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public 14;; License for more details. 15;; 16;; You should have received a copy of the GNU General Public License 17;; along with GCC; see the file COPYING3. If not see 18;; <http://www.gnu.org/licenses/>. 19 20;; Sources: IBM Red Book and White Paper on POWER5 21 22;; The POWER5 has 2 iu, 2 fpu, 2 lsu per engine (2 engines per chip). 23;; Instructions that update more than one register get broken into two 24;; (split) or more internal ops. The chip can issue up to 5 25;; internal ops per cycle. 26 27(define_automaton "power5iu,power5fpu,power5misc") 28 29(define_cpu_unit "iu1_power5,iu2_power5" "power5iu") 30(define_cpu_unit "lsu1_power5,lsu2_power5" "power5misc") 31(define_cpu_unit "fpu1_power5,fpu2_power5" "power5fpu") 32(define_cpu_unit "bpu_power5,cru_power5" "power5misc") 33(define_cpu_unit "du1_power5,du2_power5,du3_power5,du4_power5,du5_power5" 34 "power5misc") 35 36(define_reservation "lsq_power5" 37 "(du1_power5,lsu1_power5)\ 38 |(du2_power5,lsu2_power5)\ 39 |(du3_power5,lsu2_power5)\ 40 |(du4_power5,lsu1_power5)") 41 42(define_reservation "iq_power5" 43 "(du1_power5|du2_power5|du3_power5|du4_power5),\ 44 (iu1_power5|iu2_power5)") 45 46(define_reservation "fpq_power5" 47 "(du1_power5|du2_power5|du3_power5|du4_power5),\ 48 (fpu1_power5|fpu2_power5)") 49 50; Dispatch slots are allocated in order conforming to program order. 51(absence_set "du1_power5" "du2_power5,du3_power5,du4_power5,du5_power5") 52(absence_set "du2_power5" "du3_power5,du4_power5,du5_power5") 53(absence_set "du3_power5" "du4_power5,du5_power5") 54(absence_set "du4_power5" "du5_power5") 55 56 57; Load/store 58(define_insn_reservation "power5-load" 4 ; 3 59 (and (eq_attr "type" "load") 60 (eq_attr "sign_extend" "no") 61 (eq_attr "update" "no") 62 (eq_attr "cpu" "power5")) 63 "lsq_power5") 64 65(define_insn_reservation "power5-load-ext" 5 66 (and (eq_attr "type" "load") 67 (eq_attr "sign_extend" "yes") 68 (eq_attr "update" "no") 69 (eq_attr "cpu" "power5")) 70 "du1_power5+du2_power5,lsu1_power5,nothing,nothing,iu2_power5") 71 72(define_insn_reservation "power5-load-ext-update" 5 73 (and (eq_attr "type" "load") 74 (eq_attr "sign_extend" "yes") 75 (eq_attr "update" "yes") 76 (eq_attr "indexed" "no") 77 (eq_attr "cpu" "power5")) 78 "du1_power5+du2_power5+du3_power5+du4_power5,\ 79 lsu1_power5+iu2_power5,nothing,nothing,iu2_power5") 80 81(define_insn_reservation "power5-load-ext-update-indexed" 5 82 (and (eq_attr "type" "load") 83 (eq_attr "sign_extend" "yes") 84 (eq_attr "update" "yes") 85 (eq_attr "indexed" "yes") 86 (eq_attr "cpu" "power5")) 87 "du1_power5+du2_power5+du3_power5+du4_power5,\ 88 iu1_power5,lsu2_power5+iu1_power5,nothing,nothing,iu2_power5") 89 90(define_insn_reservation "power5-load-update-indexed" 3 91 (and (eq_attr "type" "load") 92 (eq_attr "sign_extend" "no") 93 (eq_attr "update" "yes") 94 (eq_attr "indexed" "yes") 95 (eq_attr "cpu" "power5")) 96 "du1_power5+du2_power5+du3_power5+du4_power5,\ 97 iu1_power5,lsu2_power5+iu2_power5") 98 99(define_insn_reservation "power5-load-update" 4 ; 3 100 (and (eq_attr "type" "load") 101 (eq_attr "sign_extend" "no") 102 (eq_attr "update" "yes") 103 (eq_attr "indexed" "no") 104 (eq_attr "cpu" "power5")) 105 "du1_power5+du2_power5,lsu1_power5+iu2_power5") 106 107(define_insn_reservation "power5-fpload" 6 ; 5 108 (and (eq_attr "type" "fpload") 109 (eq_attr "update" "no") 110 (eq_attr "cpu" "power5")) 111 "lsq_power5") 112 113(define_insn_reservation "power5-fpload-update" 6 ; 5 114 (and (eq_attr "type" "fpload") 115 (eq_attr "update" "yes") 116 (eq_attr "cpu" "power5")) 117 "du1_power5+du2_power5,lsu1_power5+iu2_power5") 118 119(define_insn_reservation "power5-store" 12 120 (and (eq_attr "type" "store") 121 (eq_attr "update" "no") 122 (eq_attr "cpu" "power5")) 123 "((du1_power5,lsu1_power5)\ 124 |(du2_power5,lsu2_power5)\ 125 |(du3_power5,lsu2_power5)\ 126 |(du4_power5,lsu1_power5)),\ 127 (iu1_power5|iu2_power5)") 128 129(define_insn_reservation "power5-store-update" 12 130 (and (eq_attr "type" "store") 131 (eq_attr "update" "yes") 132 (eq_attr "indexed" "no") 133 (eq_attr "cpu" "power5")) 134 "du1_power5+du2_power5,lsu1_power5+iu2_power5,iu1_power5") 135 136(define_insn_reservation "power5-store-update-indexed" 12 137 (and (eq_attr "type" "store") 138 (eq_attr "update" "yes") 139 (eq_attr "indexed" "yes") 140 (eq_attr "cpu" "power5")) 141 "du1_power5+du2_power5+du3_power5+du4_power5,\ 142 iu1_power5,lsu2_power5+iu2_power5,iu2_power5") 143 144(define_insn_reservation "power5-fpstore" 12 145 (and (eq_attr "type" "fpstore") 146 (eq_attr "update" "no") 147 (eq_attr "cpu" "power5")) 148 "((du1_power5,lsu1_power5)\ 149 |(du2_power5,lsu2_power5)\ 150 |(du3_power5,lsu2_power5)\ 151 |(du4_power5,lsu1_power5)),\ 152 (fpu1_power5|fpu2_power5)") 153 154(define_insn_reservation "power5-fpstore-update" 12 155 (and (eq_attr "type" "fpstore") 156 (eq_attr "update" "yes") 157 (eq_attr "cpu" "power5")) 158 "du1_power5+du2_power5,lsu1_power5+iu2_power5,fpu1_power5") 159 160(define_insn_reservation "power5-llsc" 11 161 (and (eq_attr "type" "load_l,store_c,sync") 162 (eq_attr "cpu" "power5")) 163 "du1_power5+du2_power5+du3_power5+du4_power5,\ 164 lsu1_power5") 165 166 167; Integer latency is 2 cycles 168(define_insn_reservation "power5-integer" 2 169 (and (ior (eq_attr "type" "integer,trap,cntlz,isel,popcnt") 170 (and (eq_attr "type" "add,logical,shift,exts") 171 (eq_attr "dot" "no")) 172 (and (eq_attr "type" "insert") 173 (eq_attr "size" "64"))) 174 (eq_attr "cpu" "power5")) 175 "iq_power5") 176 177(define_insn_reservation "power5-two" 2 178 (and (eq_attr "type" "two") 179 (eq_attr "cpu" "power5")) 180 "((du1_power5+du2_power5)\ 181 |(du2_power5+du3_power5)\ 182 |(du3_power5+du4_power5)\ 183 |(du4_power5+du1_power5)),\ 184 ((iu1_power5,nothing,iu2_power5)\ 185 |(iu2_power5,nothing,iu2_power5)\ 186 |(iu2_power5,nothing,iu1_power5)\ 187 |(iu1_power5,nothing,iu1_power5))") 188 189(define_insn_reservation "power5-three" 2 190 (and (eq_attr "type" "three") 191 (eq_attr "cpu" "power5")) 192 "(du1_power5+du2_power5+du3_power5|du2_power5+du3_power5+du4_power5\ 193 |du3_power5+du4_power5+du1_power5|du4_power5+du1_power5+du2_power5),\ 194 ((iu1_power5,nothing,iu2_power5,nothing,iu2_power5)\ 195 |(iu2_power5,nothing,iu2_power5,nothing,iu1_power5)\ 196 |(iu2_power5,nothing,iu1_power5,nothing,iu1_power5)\ 197 |(iu1_power5,nothing,iu2_power5,nothing,iu2_power5))") 198 199(define_insn_reservation "power5-insert" 4 200 (and (eq_attr "type" "insert") 201 (eq_attr "size" "32") 202 (eq_attr "cpu" "power5")) 203 "du1_power5+du2_power5,iu1_power5,nothing,iu2_power5") 204 205(define_insn_reservation "power5-cmp" 3 206 (and (ior (eq_attr "type" "cmp") 207 (and (eq_attr "type" "add,logical") 208 (eq_attr "dot" "yes"))) 209 (eq_attr "cpu" "power5")) 210 "iq_power5") 211 212(define_insn_reservation "power5-compare" 2 213 (and (eq_attr "type" "shift,exts") 214 (eq_attr "dot" "yes") 215 (eq_attr "cpu" "power5")) 216 "du1_power5+du2_power5,iu1_power5,iu2_power5") 217 218(define_bypass 4 "power5-compare" "power5-branch,power5-crlogical,power5-delayedcr,power5-mfcr,power5-mfcrf") 219 220(define_insn_reservation "power5-lmul-cmp" 7 221 (and (eq_attr "type" "mul") 222 (eq_attr "dot" "yes") 223 (eq_attr "size" "64") 224 (eq_attr "cpu" "power5")) 225 "du1_power5+du2_power5,iu1_power5*6,iu2_power5") 226 227(define_bypass 10 "power5-lmul-cmp" "power5-branch,power5-crlogical,power5-delayedcr,power5-mfcr,power5-mfcrf") 228 229(define_insn_reservation "power5-imul-cmp" 5 230 (and (eq_attr "type" "mul") 231 (eq_attr "dot" "yes") 232 (eq_attr "size" "32") 233 (eq_attr "cpu" "power5")) 234 "du1_power5+du2_power5,iu1_power5*4,iu2_power5") 235 236(define_bypass 8 "power5-imul-cmp" "power5-branch,power5-crlogical,power5-delayedcr,power5-mfcr,power5-mfcrf") 237 238(define_insn_reservation "power5-lmul" 7 239 (and (eq_attr "type" "mul") 240 (eq_attr "dot" "no") 241 (eq_attr "size" "64") 242 (eq_attr "cpu" "power5")) 243 "(du1_power5|du2_power5|du3_power5|du4_power5),(iu1_power5*6|iu2_power5*6)") 244 245(define_insn_reservation "power5-imul" 5 246 (and (eq_attr "type" "mul") 247 (eq_attr "dot" "no") 248 (eq_attr "size" "32") 249 (eq_attr "cpu" "power5")) 250 "(du1_power5|du2_power5|du3_power5|du4_power5),(iu1_power5*4|iu2_power5*4)") 251 252(define_insn_reservation "power5-imul3" 4 253 (and (eq_attr "type" "mul") 254 (eq_attr "size" "8,16") 255 (eq_attr "cpu" "power5")) 256 "(du1_power5|du2_power5|du3_power5|du4_power5),(iu1_power5*3|iu2_power5*3)") 257 258 259; SPR move only executes in first IU. 260; Integer division only executes in second IU. 261(define_insn_reservation "power5-idiv" 36 262 (and (eq_attr "type" "div") 263 (eq_attr "size" "32") 264 (eq_attr "cpu" "power5")) 265 "du1_power5+du2_power5,iu2_power5*35") 266 267(define_insn_reservation "power5-ldiv" 68 268 (and (eq_attr "type" "div") 269 (eq_attr "size" "64") 270 (eq_attr "cpu" "power5")) 271 "du1_power5+du2_power5,iu2_power5*67") 272 273 274(define_insn_reservation "power5-mtjmpr" 3 275 (and (eq_attr "type" "mtjmpr,mfjmpr") 276 (eq_attr "cpu" "power5")) 277 "du1_power5,bpu_power5") 278 279 280; Branches take dispatch Slot 4. The presence_sets prevent other insn from 281; grabbing previous dispatch slots once this is assigned. 282(define_insn_reservation "power5-branch" 2 283 (and (eq_attr "type" "jmpreg,branch") 284 (eq_attr "cpu" "power5")) 285 "(du5_power5\ 286 |du4_power5+du5_power5\ 287 |du3_power5+du4_power5+du5_power5\ 288 |du2_power5+du3_power5+du4_power5+du5_power5\ 289 |du1_power5+du2_power5+du3_power5+du4_power5+du5_power5),bpu_power5") 290 291 292; Condition Register logical ops are split if non-destructive (RT != RB) 293(define_insn_reservation "power5-crlogical" 2 294 (and (eq_attr "type" "cr_logical") 295 (eq_attr "cpu" "power5")) 296 "du1_power5,cru_power5") 297 298(define_insn_reservation "power5-delayedcr" 4 299 (and (eq_attr "type" "delayed_cr") 300 (eq_attr "cpu" "power5")) 301 "du1_power5+du2_power5,cru_power5,cru_power5") 302 303; 4 mfcrf (each 3 cyc, 1/cyc) + 3 fxu 304(define_insn_reservation "power5-mfcr" 6 305 (and (eq_attr "type" "mfcr") 306 (eq_attr "cpu" "power5")) 307 "du1_power5+du2_power5+du3_power5+du4_power5,\ 308 du1_power5+du2_power5+du3_power5+du4_power5+cru_power5,\ 309 cru_power5,cru_power5,cru_power5") 310 311; mfcrf (1 field) 312(define_insn_reservation "power5-mfcrf" 3 313 (and (eq_attr "type" "mfcrf") 314 (eq_attr "cpu" "power5")) 315 "du1_power5,cru_power5") 316 317; mtcrf (1 field) 318(define_insn_reservation "power5-mtcr" 4 319 (and (eq_attr "type" "mtcr") 320 (eq_attr "cpu" "power5")) 321 "du1_power5,iu1_power5") 322 323; Basic FP latency is 6 cycles 324(define_insn_reservation "power5-fp" 6 325 (and (eq_attr "type" "fp,fpsimple,dmul") 326 (eq_attr "cpu" "power5")) 327 "fpq_power5") 328 329(define_insn_reservation "power5-fpcompare" 5 330 (and (eq_attr "type" "fpcompare") 331 (eq_attr "cpu" "power5")) 332 "fpq_power5") 333 334(define_insn_reservation "power5-sdiv" 33 335 (and (eq_attr "type" "sdiv,ddiv") 336 (eq_attr "cpu" "power5")) 337 "(du1_power5|du2_power5|du3_power5|du4_power5),\ 338 (fpu1_power5*28|fpu2_power5*28)") 339 340(define_insn_reservation "power5-sqrt" 40 341 (and (eq_attr "type" "ssqrt,dsqrt") 342 (eq_attr "cpu" "power5")) 343 "(du1_power5|du2_power5|du3_power5|du4_power5),\ 344 (fpu1_power5*35|fpu2_power5*35)") 345 346(define_insn_reservation "power5-isync" 2 347 (and (eq_attr "type" "isync") 348 (eq_attr "cpu" "power5")) 349 "du1_power5+du2_power5+du3_power5+du4_power5,\ 350 lsu1_power5") 351 352