187 lines
6.5 KiB
Markdown
187 lines
6.5 KiB
Markdown
|
;; Scheduling description for GR6.
|
||
|
;; Copyright (C) 2013-2021 Free Software Foundation, Inc.
|
||
|
;;
|
||
|
;; This file is part of GCC.
|
||
|
;;
|
||
|
;; GCC is free software; you can redistribute it and/or modify
|
||
|
;; it under the terms of the GNU General Public License as published by
|
||
|
;; the Free Software Foundation; either version 3, or (at your option)
|
||
|
;; any later version.
|
||
|
;;
|
||
|
;; GCC is distributed in the hope that it will be useful,
|
||
|
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
;; GNU General Public License for more details.
|
||
|
;;
|
||
|
;; You should have received a copy of the GNU General Public License
|
||
|
;; along with GCC; see the file COPYING3. If not see
|
||
|
;; <http://www.gnu.org/licenses/>.
|
||
|
|
||
|
;; GR6 is a dual-issue, superscalar, out-of-order processor.
|
||
|
;;
|
||
|
;; The GR6 pipeline has 3 major components:
|
||
|
;; 1. The FETCH/DECODE/DISPATCH stages, an in-order front-end,
|
||
|
;; 2. The PROCESS stage, which is the out-of-order core,
|
||
|
;; 3. The STORE stage, an in-order register storage stage.
|
||
|
;;
|
||
|
;; The front-end and the back-end (PROCESS + STORE) are connected through a set
|
||
|
;; of reservation stations which, among other things, serve as buffers for the
|
||
|
;; decoded instructions. The reservation stations are attached to a specific
|
||
|
;; execution unit of the PROCESS stage and the DISPATCH stage is responsible
|
||
|
;; for dispatching the decoded instructions to the appropriate stations. Most
|
||
|
;; execution units have multiple reservation stations, thus making it possible
|
||
|
;; to dispatch two instructions per unit on a given cycle, but only one of them
|
||
|
;; can be executed on the next cycle.
|
||
|
;;
|
||
|
;; Since the core executes the instructions out of order, the most important
|
||
|
;; consideration for performance tuning is to make sure that enough decoded
|
||
|
;; instructions are ready for execution in the PROCESS stage while not stalling
|
||
|
;; the front-end, i.e while not trying to dispatch a decoded instruction to an
|
||
|
;; execution unit whose reservation stations are full. Therefore, we do not
|
||
|
;; model the reservation stations (which is equivalent to pretending that there
|
||
|
;; is only one of them for each execution unit) but only the execution unit,
|
||
|
;; thus preserving some margin in case the unit itself stalls unexpectedly.
|
||
|
|
||
|
;; CPU execution units:
|
||
|
;;
|
||
|
;; inst[1|2] The front-end: 2 instructions can be issued on a given
|
||
|
;; cycle by the FETCH/DECODE/DISPATCH stages, except for
|
||
|
;; the Block Move instructions.
|
||
|
;;
|
||
|
;; mov Move Execution Unit: immediate moves into registers.
|
||
|
;;
|
||
|
;; alu[1|2] The 2 Arithmetic and Logic Units: other instructions
|
||
|
;; operating on the registers.
|
||
|
;;
|
||
|
;; bru Branch Resolution Unit: all branches.
|
||
|
;;
|
||
|
;; mem_wr Memory Write Unit: all writes to memory.
|
||
|
;;
|
||
|
;; mem_rd Memory Read Unit: all reads from memory.
|
||
|
;;
|
||
|
;; mem_eam EAM interface: reads and writes from and to the EAM
|
||
|
;; and reads from the FP registers.
|
||
|
;;
|
||
|
;; eam Extended Arithmetic Module: multiply, divide and
|
||
|
;; 64-bit shifts.
|
||
|
;;
|
||
|
;; fpcu Floating-Point Compare Unit: FP comparisons.
|
||
|
;;
|
||
|
;; fpu[1|2|3|4] The 4 Floating-Point Units: all other instructions
|
||
|
;; operating on the FP registers.
|
||
|
|
||
|
(define_automaton "gr6,gr6_fpu")
|
||
|
|
||
|
(define_cpu_unit "gr6_inst1, gr6_inst2" "gr6")
|
||
|
(define_cpu_unit "gr6_mov" "gr6")
|
||
|
(define_cpu_unit "gr6_alu1,gr6_alu2" "gr6")
|
||
|
(define_cpu_unit "gr6_bru" "gr6")
|
||
|
(define_cpu_unit "gr6_mem_wr,gr6_mem_rd,gr6_mem_eam" "gr6")
|
||
|
(define_cpu_unit "gr6_eam" "gr6")
|
||
|
(define_cpu_unit "gr6_fpcu" "gr6")
|
||
|
(define_cpu_unit "gr6_fpu1,gr6_fpu2,gr6_fpu3,gr6_fpu4" "gr6_fpu")
|
||
|
|
||
|
(define_reservation "gr6_issue" "(gr6_inst1 | gr6_inst2)")
|
||
|
(define_reservation "gr6_single_issue" "gr6_inst1 + gr6_inst2")
|
||
|
|
||
|
(define_insn_reservation "gr6_immediate" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "imm_reg"))
|
||
|
"gr6_issue + gr6_mov")
|
||
|
|
||
|
(define_insn_reservation "gr6_alu" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "arith,arith2,logic,cmp"))
|
||
|
"gr6_issue + (gr6_alu1 | gr6_alu2)")
|
||
|
|
||
|
(define_insn_reservation "gr6_branch" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "abs_branch,branch,call,ret,rfi"))
|
||
|
"gr6_issue + gr6_bru")
|
||
|
|
||
|
(define_insn_reservation "gr6_block_move" 16
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "bmi"))
|
||
|
"gr6_single_issue*16")
|
||
|
|
||
|
(define_insn_reservation "gr6_cpu_other" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "dsi,nop"))
|
||
|
"gr6_issue")
|
||
|
|
||
|
(define_insn_reservation "gr6_write_mem" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "reg_mem"))
|
||
|
"gr6_issue + gr6_mem_wr")
|
||
|
|
||
|
(define_insn_reservation "gr6_read_mem" 6
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "mem_reg"))
|
||
|
"gr6_issue + gr6_mem_rd, nothing*5")
|
||
|
|
||
|
;; EAM instructions.
|
||
|
|
||
|
(define_insn_reservation "gr6_write_eam" 2
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "reg_eam"))
|
||
|
"gr6_issue + gr6_mem_eam, nothing")
|
||
|
|
||
|
(define_reservation "gr6_issue_eam" "gr6_issue + gr6_mem_eam + gr6_eam")
|
||
|
|
||
|
(define_insn_reservation "gr6_read_eam" 2
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "eam_reg"))
|
||
|
"gr6_issue_eam, nothing")
|
||
|
|
||
|
(define_insn_reservation "gr6_shiftdi" 2
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "shiftdi"))
|
||
|
"gr6_issue_eam, gr6_eam")
|
||
|
|
||
|
(define_insn_reservation "gr6_mul" 3
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "mul"))
|
||
|
"gr6_issue_eam, gr6_eam*2")
|
||
|
|
||
|
(define_insn_reservation "gr6_div" 34
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "div"))
|
||
|
"gr6_issue_eam, gr6_eam*33")
|
||
|
|
||
|
(define_insn_reservation "gr6_divd" 66
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "divd"))
|
||
|
"gr6_issue_eam, gr6_eam*65")
|
||
|
|
||
|
;; FPU instructions.
|
||
|
|
||
|
(define_insn_reservation "gr6_read_fp" 2
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "fp_reg"))
|
||
|
"gr6_issue + gr6_mem_eam, nothing")
|
||
|
|
||
|
(define_insn_reservation "gr6_cmp_fp" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "fcmp"))
|
||
|
"gr6_issue + gr6_fpcu")
|
||
|
|
||
|
(define_insn_reservation "gr6_fp_1cycle" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "fmove,ftoi,itof"))
|
||
|
"gr6_issue + gr6_fpu1")
|
||
|
|
||
|
(define_insn_reservation "gr6_fp_3cycle" 3
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "fp"))
|
||
|
"gr6_issue + gr6_fpu2, nothing*2")
|
||
|
|
||
|
(define_insn_reservation "gr6_fp_17cycle" 17
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "fdiv,fsqrt"))
|
||
|
"gr6_issue + gr6_fpu3, gr6_fpu3*14, nothing*2")
|
||
|
|
||
|
(define_insn_reservation "gr6_write_fp" 1
|
||
|
(and (eq_attr "cpu" "gr6")
|
||
|
(eq_attr "type" "reg_fp"))
|
||
|
"gr6_issue + gr6_fpu4")
|