Training courses

Kernel and Embedded Linux

Bootlin training courses

Embedded Linux, kernel,
Yocto Project, Buildroot, real-time,
graphics, boot time, debugging...

Bootlin logo

Elixir Cross Referencer

;; Scheduling description for GR6.
;; Copyright (C) 2013-2020 Free Software Foundation, Inc.
;;
;; This file is part of GCC.
;;
;; GCC is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3, or (at your option)
;; any later version.
;;
;; GCC is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;; GNU General Public License for more details.
;;
;; You should have received a copy of the GNU General Public License
;; along with GCC; see the file COPYING3.  If not see
;; <http://www.gnu.org/licenses/>.

;; GR6 is a dual-issue, superscalar, out-of-order processor.
;;
;; The GR6 pipeline has 3 major components:
;;  1. The FETCH/DECODE/DISPATCH stages, an in-order front-end,
;;  2. The PROCESS stage, which is the out-of-order core,
;;  3. The STORE stage, an in-order register storage stage.
;;
;; The front-end and the back-end (PROCESS + STORE) are connected through a set
;; of reservation stations which, among other things, serve as buffers for the
;; decoded instructions.  The reservation stations are attached to a specific
;; execution unit of the PROCESS stage and the DISPATCH stage is responsible
;; for dispatching the decoded instructions to the appropriate stations.  Most
;; execution units have multiple reservation stations, thus making it possible
;; to dispatch two instructions per unit on a given cycle, but only one of them
;; can be executed on the next cycle.
;;
;; Since the core executes the instructions out of order, the most important
;; consideration for performance tuning is to make sure that enough decoded
;; instructions are ready for execution in the PROCESS stage while not stalling
;; the front-end, i.e while not trying to dispatch a decoded instruction to an
;; execution unit whose reservation stations are full.  Therefore, we do not
;; model the reservation stations (which is equivalent to pretending that there
;; is only one of them for each execution unit) but only the execution unit,
;; thus preserving some margin in case the unit itself stalls unexpectedly.

;; CPU execution units:
;;
;; inst[1|2]             The front-end: 2 instructions can be issued on a given
;;                       cycle by the FETCH/DECODE/DISPATCH stages, except for
;;                       the Block Move instructions.
;;
;; mov                   Move Execution Unit: immediate moves into registers.
;;
;; alu[1|2]              The 2 Arithmetic and Logic Units: other instructions
;;                       operating on the registers.
;;
;; bru                   Branch Resolution Unit: all branches.
;;
;; mem_wr                Memory Write Unit: all writes to memory.
;;
;; mem_rd                Memory Read Unit: all reads from memory.
;;
;; mem_eam               EAM interface: reads and writes from and to the EAM
;;                       and reads from the FP registers.
;;
;; eam                   Extended Arithmetic Module: multiply, divide and
;;                       64-bit shifts.
;;
;; fpcu                  Floating-Point Compare Unit: FP comparisons.
;;
;; fpu[1|2|3|4]          The 4 Floating-Point Units: all other instructions
;;                       operating on the FP registers.

(define_automaton "gr6,gr6_fpu")

(define_cpu_unit "gr6_inst1, gr6_inst2" "gr6")
(define_cpu_unit "gr6_mov" "gr6")
(define_cpu_unit "gr6_alu1,gr6_alu2" "gr6")
(define_cpu_unit "gr6_bru" "gr6")
(define_cpu_unit "gr6_mem_wr,gr6_mem_rd,gr6_mem_eam" "gr6")
(define_cpu_unit "gr6_eam" "gr6")
(define_cpu_unit "gr6_fpcu" "gr6")
(define_cpu_unit "gr6_fpu1,gr6_fpu2,gr6_fpu3,gr6_fpu4" "gr6_fpu")

(define_reservation "gr6_issue" "(gr6_inst1 | gr6_inst2)")
(define_reservation "gr6_single_issue" "gr6_inst1 + gr6_inst2")

(define_insn_reservation "gr6_immediate" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "imm_reg"))
  "gr6_issue + gr6_mov")

(define_insn_reservation "gr6_alu" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "arith,arith2,logic,cmp"))
  "gr6_issue + (gr6_alu1 | gr6_alu2)")

(define_insn_reservation "gr6_branch" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "abs_branch,branch,call,ret,rfi"))
  "gr6_issue + gr6_bru")

(define_insn_reservation "gr6_block_move" 16
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "bmi"))
  "gr6_single_issue*16")

(define_insn_reservation "gr6_cpu_other" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "dsi,nop"))
  "gr6_issue")

(define_insn_reservation "gr6_write_mem" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "reg_mem"))
  "gr6_issue + gr6_mem_wr")

(define_insn_reservation "gr6_read_mem" 6
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "mem_reg"))
  "gr6_issue + gr6_mem_rd, nothing*5")

;; EAM instructions.

(define_insn_reservation "gr6_write_eam" 2
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "reg_eam"))
  "gr6_issue + gr6_mem_eam, nothing")

(define_reservation "gr6_issue_eam" "gr6_issue + gr6_mem_eam + gr6_eam")

(define_insn_reservation "gr6_read_eam" 2
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "eam_reg"))
  "gr6_issue_eam, nothing")

(define_insn_reservation "gr6_shiftdi" 2
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "shiftdi"))
  "gr6_issue_eam, gr6_eam")

(define_insn_reservation "gr6_mul" 3
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "mul"))
  "gr6_issue_eam, gr6_eam*2")

(define_insn_reservation "gr6_div" 34
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "div"))
  "gr6_issue_eam, gr6_eam*33")

(define_insn_reservation "gr6_divd" 66
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "divd"))
  "gr6_issue_eam, gr6_eam*65")

;; FPU instructions.

(define_insn_reservation "gr6_read_fp" 2
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "fp_reg"))
  "gr6_issue + gr6_mem_eam, nothing")

(define_insn_reservation "gr6_cmp_fp" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "fcmp"))
  "gr6_issue + gr6_fpcu")

(define_insn_reservation "gr6_fp_1cycle" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "fmove,ftoi,itof"))
  "gr6_issue + gr6_fpu1")

(define_insn_reservation "gr6_fp_3cycle" 3
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "fp"))
  "gr6_issue + gr6_fpu2, nothing*2")

(define_insn_reservation "gr6_fp_17cycle" 17
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "fdiv,fsqrt"))
  "gr6_issue + gr6_fpu3, gr6_fpu3*14, nothing*2")

(define_insn_reservation "gr6_write_fp" 1
  (and (eq_attr "cpu" "gr6")
       (eq_attr "type" "reg_fp"))
  "gr6_issue + gr6_fpu4")