123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413 |
- //===-- PPCScheduleP8.td - PPC P8 Scheduling Definitions ---*- tablegen -*-===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // This file defines the itinerary class data for the POWER8 processor.
- //
- //===----------------------------------------------------------------------===//
- // Scheduling for the P8 involves tracking two types of resources:
- // 1. The dispatch bundle slots
- // 2. The functional unit resources
- // Dispatch units:
- def P8_DU1 : FuncUnit;
- def P8_DU2 : FuncUnit;
- def P8_DU3 : FuncUnit;
- def P8_DU4 : FuncUnit;
- def P8_DU5 : FuncUnit;
- def P8_DU6 : FuncUnit;
- def P8_DU7 : FuncUnit; // Only branch instructions will use DU7,DU8
- def P8_DU8 : FuncUnit;
- // 10 insns per cycle (2-LU, 2-LSU, 2-FXU, 2-FPU, 1-CRU, 1-BRU).
- def P8_LU1 : FuncUnit; // Loads or fixed-point operations 1
- def P8_LU2 : FuncUnit; // Loads or fixed-point operations 2
- // Load/Store pipelines can handle Stores, fixed-point loads, and simple
- // fixed-point operations.
- def P8_LSU1 : FuncUnit; // Load/Store pipeline 1
- def P8_LSU2 : FuncUnit; // Load/Store pipeline 2
- // Fixed Point unit
- def P8_FXU1 : FuncUnit; // FX pipeline 1
- def P8_FXU2 : FuncUnit; // FX pipeline 2
- // The Floating-Point Unit (FPU) and Vector Media Extension (VMX) units
- // are combined on P7 and newer into a Vector Scalar Unit (VSU).
- // The P8 Instruction latency documents still refers to the unit as the
- // FPU, so keep in mind that FPU==VSU.
- // In contrast to the P7, the VMX units on P8 are symmetric, so no need to
- // split vector integer ops or 128-bit load/store/perms to the specific units.
- def P8_FPU1 : FuncUnit; // VS pipeline 1
- def P8_FPU2 : FuncUnit; // VS pipeline 2
- def P8_CRU : FuncUnit; // CR unit (CR logicals and move-from-SPRs)
- def P8_BRU : FuncUnit; // BR unit
- def P8Itineraries : ProcessorItineraries<
- [P8_DU1, P8_DU2, P8_DU3, P8_DU4, P8_DU5, P8_DU6, P8_DU7, P8_DU8,
- P8_LU1, P8_LU2, P8_LSU1, P8_LSU2, P8_FXU1, P8_FXU2,
- P8_FPU1, P8_FPU2, P8_CRU, P8_BRU], [], [
- InstrItinData<IIC_IntSimple , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2,
- P8_LU1, P8_LU2,
- P8_LSU1, P8_LSU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntGeneral , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2, P8_LU1,
- P8_LU2, P8_LSU1, P8_LSU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntISEL, [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2], 0>,
- InstrStage<1, [P8_BRU]>],
- [1, 1, 1, 1]>,
- InstrItinData<IIC_IntCompare , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntDivW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<15, [P8_FXU1, P8_FXU2]>],
- [15, 1, 1]>,
- InstrItinData<IIC_IntDivD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<23, [P8_FXU1, P8_FXU2]>],
- [23, 1, 1]>,
- InstrItinData<IIC_IntMulHW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 1, 1]>,
- InstrItinData<IIC_IntMulHWU , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 1, 1]>,
- InstrItinData<IIC_IntMulHD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 1, 1]>,
- InstrItinData<IIC_IntMulLI , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 1, 1]>,
- InstrItinData<IIC_IntRotate , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntRotateD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntRotateDI , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntShift , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_IntTrapW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1]>,
- InstrItinData<IIC_IntTrapD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [1, 1]>,
- InstrItinData<IIC_BrB , [InstrStage<1, [P8_DU7, P8_DU8], 0>,
- InstrStage<1, [P8_BRU]>],
- [3, 1, 1]>,
- // FIXME - the Br* groups below are not branch related, so should probably
- // be renamed.
- // IIC_BrCR consists of the cr* instructions. (crand,crnor,creqv, etc).
- // and should be 'First' in dispatch.
- InstrItinData<IIC_BrCR , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_CRU]>],
- [3, 1, 1]>,
- // IIC_BrMCR consists of the mcrf instruction.
- InstrItinData<IIC_BrMCR , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_CRU]>],
- [3, 1, 1]>,
- // IIC_BrMCRX consists of mcrxr (obsolete instruction) and mtcrf, which
- // should be first in the dispatch group.
- InstrItinData<IIC_BrMCRX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_BrMCRX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 1]>,
- InstrItinData<IIC_LdStLoad , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>],
- [2, 1, 1]>,
- InstrItinData<IIC_LdStLoadUpd , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2 ], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [2, 2, 1, 1]>,
- // Update-Indexed form loads/stores are no longer first and last in the
- // dispatch group. They are simply cracked, so require DU1,DU2.
- InstrItinData<IIC_LdStLoadUpdX, [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 3, 1, 1]>,
- InstrItinData<IIC_LdStLD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>],
- [2, 1, 1]>,
- InstrItinData<IIC_LdStLDU , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [2, 2, 1, 1]>,
- InstrItinData<IIC_LdStLDUX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 3, 1, 1]>,
- InstrItinData<IIC_LdStLFD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LU1, P8_LU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_LdStLVecX , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LU1, P8_LU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_LdStLFDU , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 3, 1, 1]>,
- InstrItinData<IIC_LdStLFDUX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 3, 1, 1]>,
- InstrItinData<IIC_LdStLHA , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2,
- P8_LU1, P8_LU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_LdStLHAU , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 4, 1, 1]>,
- // first+last in dispatch group.
- InstrItinData<IIC_LdStLHAUX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_DU5], 0>,
- InstrStage<1, [P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 4, 1, 1]>,
- InstrItinData<IIC_LdStLWA , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_LdStLWARX, [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>],
- [3, 1, 1]>,
- // first+last
- InstrItinData<IIC_LdStLDARX, [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_DU5], 0>,
- InstrStage<1, [P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>],
- [3, 1, 1]>,
- InstrItinData<IIC_LdStLMW , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2,
- P8_LU1, P8_LU2]>],
- [2, 1, 1]>,
- // Stores are dual-issued from the issue queue, so may only take up one
- // dispatch slot. The instruction will be broken into two IOPS. The agen
- // op is issued to the LSU, and the data op (register fetch) is issued
- // to either the LU (GPR store) or the VSU (FPR store).
- InstrItinData<IIC_LdStStore , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2]>,
- InstrStage<1, [P8_LU1, P8_LU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_LdStSTD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LU1, P8_LU2,
- P8_LSU1, P8_LSU2]>]
- [1, 1, 1]>,
- InstrItinData<IIC_LdStSTU , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LU1, P8_LU2,
- P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [2, 1, 1, 1]>,
- // First+last
- InstrItinData<IIC_LdStSTUX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_DU5], 0>,
- InstrStage<1, [P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [2, 1, 1, 1]>,
- InstrItinData<IIC_LdStSTFD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_LdStSTFDU , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [2, 1, 1, 1]>,
- InstrItinData<IIC_LdStSTVEBX , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_LdStSTDCX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_DU5], 0>,
- InstrStage<1, [P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_LU1, P8_LU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_LdStSTWCX , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_DU2], 0>,
- InstrStage<1, [P8_DU3], 0>,
- InstrStage<1, [P8_DU4], 0>,
- InstrStage<1, [P8_DU5], 0>,
- InstrStage<1, [P8_DU6], 0>,
- InstrStage<1, [P8_LSU1, P8_LSU2], 0>,
- InstrStage<1, [P8_LU1, P8_LU2]>],
- [1, 1, 1]>,
- InstrItinData<IIC_SprMFCR , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_CRU]>],
- [6, 1]>,
- InstrItinData<IIC_SprMFCRF , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_CRU]>],
- [3, 1]>,
- InstrItinData<IIC_SprMTSPR , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FXU1, P8_FXU2]>],
- [4, 1]>, // mtctr
- InstrItinData<IIC_FPGeneral , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [5, 1, 1]>,
- InstrItinData<IIC_FPAddSub , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [5, 1, 1]>,
- InstrItinData<IIC_FPCompare , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [8, 1, 1]>,
- InstrItinData<IIC_FPDivD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [33, 1, 1]>,
- InstrItinData<IIC_FPDivS , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [27, 1, 1]>,
- InstrItinData<IIC_FPSqrtD , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [44, 1, 1]>,
- InstrItinData<IIC_FPSqrtS , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [32, 1, 1]>,
- InstrItinData<IIC_FPFused , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [5, 1, 1, 1]>,
- InstrItinData<IIC_FPRes , [InstrStage<1, [P8_DU1, P8_DU2, P8_DU3,
- P8_DU4, P8_DU5, P8_DU6], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [5, 1, 1]>,
- InstrItinData<IIC_VecGeneral , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [2, 1, 1]>,
- InstrItinData<IIC_VecVSL , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [2, 1, 1]>,
- InstrItinData<IIC_VecVSR , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [2, 1, 1]>,
- InstrItinData<IIC_VecFP , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [6, 1, 1]>,
- InstrItinData<IIC_VecFPCompare, [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [6, 1, 1]>,
- InstrItinData<IIC_VecFPRound , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [6, 1, 1]>,
- InstrItinData<IIC_VecComplex , [InstrStage<1, [P8_DU1], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [7, 1, 1]>,
- InstrItinData<IIC_VecPerm , [InstrStage<1, [P8_DU1, P8_DU2], 0>,
- InstrStage<1, [P8_FPU1, P8_FPU2]>],
- [3, 1, 1]>
- ]>;
- // ===---------------------------------------------------------------------===//
- // P8 machine model for scheduling and other instruction cost heuristics.
- // P8 has an 8 insn dispatch group (6 non-branch, 2 branch) and can issue up
- // to 10 insns per cycle (2-LU, 2-LSU, 2-FXU, 2-FPU, 1-CRU, 1-BRU).
- def P8Model : SchedMachineModel {
- let IssueWidth = 8; // up to 8 instructions dispatched per cycle.
- // up to six non-branch instructions.
- // up to two branches in a dispatch group.
- let LoadLatency = 3; // Optimistic load latency assuming bypass.
- // This is overriden by OperandCycles if the
- // Itineraries are queried instead.
- let MispredictPenalty = 16;
- // Try to make sure we have at least 10 dispatch groups in a loop.
- let LoopMicroOpBufferSize = 60;
- let CompleteModel = 0;
- let Itineraries = P8Itineraries;
- }
|