Change-Id: I2f056571dbf35081d58afda09726c600141d5a05 Signed-off-by: Hoa Nguyen <hn@hnpl.org>
827 lines
25 KiB
C++
827 lines
25 KiB
C++
/*
|
|
* Copyright (c) 2011-2013, 2017, 2020 ARM Limited
|
|
* All rights reserved
|
|
*
|
|
* The license below extends only to copyright in the software and shall
|
|
* not be construed as granting a license to any other intellectual
|
|
* property including but not limited to intellectual property relating
|
|
* to a hardware implementation of the functionality of the software
|
|
* licensed hereunder. You may use the software subject to the license
|
|
* terms below provided that you ensure that this notice is replicated
|
|
* unmodified and in its entirety in all distributions of the software,
|
|
* modified or unmodified, in source code or in binary form.
|
|
*
|
|
* Copyright (c) 2002-2005 The Regents of The University of Michigan
|
|
* Copyright (c) 2011 Regents of the University of California
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are
|
|
* met: redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer;
|
|
* redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution;
|
|
* neither the name of the copyright holders nor the names of its
|
|
* contributors may be used to endorse or promote products derived from
|
|
* this software without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#ifndef __CPU_BASE_HH__
|
|
#define __CPU_BASE_HH__
|
|
|
|
#include <memory>
|
|
#include <vector>
|
|
|
|
#include "arch/generic/interrupts.hh"
|
|
#include "base/statistics.hh"
|
|
#include "debug/Mwait.hh"
|
|
#include "mem/htm.hh"
|
|
#include "mem/port_proxy.hh"
|
|
#include "sim/clocked_object.hh"
|
|
#include "sim/eventq.hh"
|
|
#include "sim/full_system.hh"
|
|
#include "sim/insttracer.hh"
|
|
#include "sim/probe/pmu.hh"
|
|
#include "sim/probe/probe.hh"
|
|
#include "sim/signal.hh"
|
|
#include "sim/system.hh"
|
|
|
|
namespace gem5
|
|
{
|
|
|
|
class BaseCPU;
|
|
struct BaseCPUParams;
|
|
class CheckerCPU;
|
|
class ThreadContext;
|
|
|
|
struct AddressMonitor
|
|
{
|
|
AddressMonitor();
|
|
bool doMonitor(PacketPtr pkt);
|
|
|
|
bool armed;
|
|
Addr vAddr;
|
|
Addr pAddr;
|
|
uint64_t val;
|
|
bool waiting; // 0=normal, 1=mwaiting
|
|
bool gotWakeup;
|
|
};
|
|
|
|
class CPUProgressEvent : public Event
|
|
{
|
|
protected:
|
|
Tick _interval;
|
|
Counter lastNumInst;
|
|
BaseCPU *cpu;
|
|
bool _repeatEvent;
|
|
|
|
public:
|
|
CPUProgressEvent(BaseCPU *_cpu, Tick ival = 0);
|
|
|
|
void process();
|
|
|
|
void interval(Tick ival) { _interval = ival; }
|
|
Tick interval() { return _interval; }
|
|
|
|
void repeatEvent(bool repeat) { _repeatEvent = repeat; }
|
|
|
|
virtual const char *description() const;
|
|
};
|
|
|
|
class BaseCPU : public ClockedObject
|
|
{
|
|
protected:
|
|
|
|
/// Instruction count used for SPARC misc register
|
|
/// @todo unify this with the counters that cpus individually keep
|
|
Tick instCnt;
|
|
|
|
// every cpu has an id, put it in the base cpu
|
|
// Set at initialization, only time a cpuId might change is during a
|
|
// takeover (which should be done from within the BaseCPU anyway,
|
|
// therefore no setCpuId() method is provided
|
|
int _cpuId;
|
|
|
|
/** Each cpu will have a socket ID that corresponds to its physical location
|
|
* in the system. This is usually used to bucket cpu cores under single DVFS
|
|
* domain. This information may also be required by the OS to identify the
|
|
* cpu core grouping (as in the case of ARM via MPIDR register)
|
|
*/
|
|
const uint32_t _socketId;
|
|
|
|
/** instruction side request id that must be placed in all requests */
|
|
RequestorID _instRequestorId;
|
|
|
|
/** data side request id that must be placed in all requests */
|
|
RequestorID _dataRequestorId;
|
|
|
|
/** An intrenal representation of a task identifier within gem5. This is
|
|
* used so the CPU can add which taskId (which is an internal representation
|
|
* of the OS process ID) to each request so components in the memory system
|
|
* can track which process IDs are ultimately interacting with them
|
|
*/
|
|
uint32_t _taskId;
|
|
|
|
/** The current OS process ID that is executing on this processor. This is
|
|
* used to generate a taskId */
|
|
uint32_t _pid;
|
|
|
|
/** Is the CPU switched out or active? */
|
|
bool _switchedOut;
|
|
|
|
/** Cache the cache line size that we get from the system */
|
|
const Addr _cacheLineSize;
|
|
|
|
/** Global CPU statistics that are merged into the Root object. */
|
|
struct GlobalStats : public statistics::Group
|
|
{
|
|
GlobalStats(statistics::Group *parent);
|
|
|
|
statistics::Value simInsts;
|
|
statistics::Value simOps;
|
|
|
|
statistics::Formula hostInstRate;
|
|
statistics::Formula hostOpRate;
|
|
};
|
|
|
|
/**
|
|
* Pointer to the global stat structure. This needs to be
|
|
* constructed from regStats since we merge it into the root
|
|
* group. */
|
|
static std::unique_ptr<GlobalStats> globalStats;
|
|
|
|
SignalSinkPort<bool> modelResetPort;
|
|
|
|
public:
|
|
|
|
/**
|
|
* Purely virtual method that returns a reference to the data
|
|
* port. All subclasses must implement this method.
|
|
*
|
|
* @return a reference to the data port
|
|
*/
|
|
virtual Port &getDataPort() = 0;
|
|
|
|
/**
|
|
* Purely virtual method that returns a reference to the instruction
|
|
* port. All subclasses must implement this method.
|
|
*
|
|
* @return a reference to the instruction port
|
|
*/
|
|
virtual Port &getInstPort() = 0;
|
|
|
|
/** Reads this CPU's ID. */
|
|
int cpuId() const { return _cpuId; }
|
|
|
|
/** Reads this CPU's Socket ID. */
|
|
uint32_t socketId() const { return _socketId; }
|
|
|
|
/** Reads this CPU's unique data requestor ID */
|
|
RequestorID dataRequestorId() const { return _dataRequestorId; }
|
|
/** Reads this CPU's unique instruction requestor ID */
|
|
RequestorID instRequestorId() const { return _instRequestorId; }
|
|
|
|
/**
|
|
* Get a port on this CPU. All CPUs have a data and
|
|
* instruction port, and this method uses getDataPort and
|
|
* getInstPort of the subclasses to resolve the two ports.
|
|
*
|
|
* @param if_name the port name
|
|
* @param idx ignored index
|
|
*
|
|
* @return a reference to the port with the given name
|
|
*/
|
|
Port &getPort(const std::string &if_name,
|
|
PortID idx=InvalidPortID) override;
|
|
|
|
/** Get cpu task id */
|
|
uint32_t taskId() const { return _taskId; }
|
|
/** Set cpu task id */
|
|
void taskId(uint32_t id) { _taskId = id; }
|
|
|
|
uint32_t getPid() const { return _pid; }
|
|
void setPid(uint32_t pid) { _pid = pid; }
|
|
|
|
inline void workItemBegin() { baseStats.numWorkItemsStarted++; }
|
|
inline void workItemEnd() { baseStats.numWorkItemsCompleted++; }
|
|
// @todo remove me after debugging with legion done
|
|
Tick instCount() { return instCnt; }
|
|
|
|
protected:
|
|
std::vector<BaseInterrupts*> interrupts;
|
|
|
|
public:
|
|
BaseInterrupts *
|
|
getInterruptController(ThreadID tid)
|
|
{
|
|
if (interrupts.empty())
|
|
return NULL;
|
|
|
|
assert(interrupts.size() > tid);
|
|
return interrupts[tid];
|
|
}
|
|
|
|
virtual void wakeup(ThreadID tid) = 0;
|
|
|
|
void postInterrupt(ThreadID tid, int int_num, int index);
|
|
|
|
void
|
|
clearInterrupt(ThreadID tid, int int_num, int index)
|
|
{
|
|
interrupts[tid]->clear(int_num, index);
|
|
}
|
|
|
|
void
|
|
clearInterrupts(ThreadID tid)
|
|
{
|
|
interrupts[tid]->clearAll();
|
|
}
|
|
|
|
bool
|
|
checkInterrupts(ThreadID tid) const
|
|
{
|
|
return FullSystem && interrupts[tid]->checkInterrupts();
|
|
}
|
|
|
|
protected:
|
|
std::vector<ThreadContext *> threadContexts;
|
|
|
|
trace::InstTracer * tracer;
|
|
|
|
public:
|
|
|
|
|
|
/** Invalid or unknown Pid. Possible when operating system is not present
|
|
* or has not assigned a pid yet */
|
|
static const uint32_t invldPid = std::numeric_limits<uint32_t>::max();
|
|
|
|
/// Provide access to the tracer pointer
|
|
trace::InstTracer * getTracer() { return tracer; }
|
|
|
|
/// Notify the CPU that the indicated context is now active.
|
|
virtual void activateContext(ThreadID thread_num);
|
|
|
|
/// Notify the CPU that the indicated context is now suspended.
|
|
/// Check if possible to enter a lower power state
|
|
virtual void suspendContext(ThreadID thread_num);
|
|
|
|
/// Notify the CPU that the indicated context is now halted.
|
|
virtual void haltContext(ThreadID thread_num);
|
|
|
|
/// Given a Thread Context pointer return the thread num
|
|
int findContext(ThreadContext *tc);
|
|
|
|
/// Given a thread num get tho thread context for it
|
|
virtual ThreadContext *getContext(int tn) { return threadContexts[tn]; }
|
|
|
|
/// Get the number of thread contexts available
|
|
unsigned
|
|
numContexts()
|
|
{
|
|
return static_cast<unsigned>(threadContexts.size());
|
|
}
|
|
|
|
/// Convert ContextID to threadID
|
|
ThreadID
|
|
contextToThread(ContextID cid)
|
|
{
|
|
return static_cast<ThreadID>(cid - threadContexts[0]->contextId());
|
|
}
|
|
|
|
public:
|
|
PARAMS(BaseCPU);
|
|
BaseCPU(const Params ¶ms, bool is_checker = false);
|
|
virtual ~BaseCPU();
|
|
|
|
void init() override;
|
|
void startup() override;
|
|
void regStats() override;
|
|
|
|
void regProbePoints() override;
|
|
|
|
void registerThreadContexts();
|
|
|
|
// Functions to deschedule and reschedule the events to enter the
|
|
// power gating sleep before and after checkpoiting respectively.
|
|
void deschedulePowerGatingEvent();
|
|
void schedulePowerGatingEvent();
|
|
|
|
/**
|
|
* Prepare for another CPU to take over execution.
|
|
*
|
|
* When this method exits, all internal state should have been
|
|
* flushed. After the method returns, the simulator calls
|
|
* takeOverFrom() on the new CPU with this CPU as its parameter.
|
|
*/
|
|
virtual void switchOut();
|
|
|
|
/**
|
|
* Load the state of a CPU from the previous CPU object, invoked
|
|
* on all new CPUs that are about to be switched in.
|
|
*
|
|
* A CPU model implementing this method is expected to initialize
|
|
* its state from the old CPU and connect its memory (unless they
|
|
* are already connected) to the memories connected to the old
|
|
* CPU.
|
|
*
|
|
* @param cpu CPU to initialize read state from.
|
|
*/
|
|
virtual void takeOverFrom(BaseCPU *cpu);
|
|
|
|
/**
|
|
* Set the reset of the CPU to be either asserted or deasserted.
|
|
*
|
|
* When asserted, the CPU should be stopped and waiting. When deasserted,
|
|
* the CPU should start running again, unless some other condition would
|
|
* also prevent it. At the point the reset is deasserted, it should be
|
|
* reinitialized as defined by the ISA it's running and any other relevant
|
|
* part of its configuration (reset address, etc).
|
|
*
|
|
* @param state The new state of the reset signal to this CPU.
|
|
*/
|
|
virtual void setReset(bool state);
|
|
|
|
/**
|
|
* Flush all TLBs in the CPU.
|
|
*
|
|
* This method is mainly used to flush stale translations when
|
|
* switching CPUs. It is also exported to the Python world to
|
|
* allow it to request a TLB flush after draining the CPU to make
|
|
* it easier to compare traces when debugging
|
|
* handover/checkpointing.
|
|
*/
|
|
void flushTLBs();
|
|
|
|
/**
|
|
* Determine if the CPU is switched out.
|
|
*
|
|
* @return True if the CPU is switched out, false otherwise.
|
|
*/
|
|
bool switchedOut() const { return _switchedOut; }
|
|
|
|
/**
|
|
* Verify that the system is in a memory mode supported by the
|
|
* CPU.
|
|
*
|
|
* Implementations are expected to query the system for the
|
|
* current memory mode and ensure that it is what the CPU model
|
|
* expects. If the check fails, the implementation should
|
|
* terminate the simulation using fatal().
|
|
*/
|
|
virtual void verifyMemoryMode() const { };
|
|
|
|
/**
|
|
* Number of threads we're actually simulating (<= SMT_MAX_THREADS).
|
|
* This is a constant for the duration of the simulation.
|
|
*/
|
|
ThreadID numThreads;
|
|
|
|
System *system;
|
|
|
|
/**
|
|
* Get the cache line size of the system.
|
|
*/
|
|
inline Addr cacheLineSize() const { return _cacheLineSize; }
|
|
|
|
/**
|
|
* Serialize this object to the given output stream.
|
|
*
|
|
* @note CPU models should normally overload the serializeThread()
|
|
* method instead of the serialize() method as this provides a
|
|
* uniform data format for all CPU models and promotes better code
|
|
* reuse.
|
|
*
|
|
* @param cp The stream to serialize to.
|
|
*/
|
|
void serialize(CheckpointOut &cp) const override;
|
|
|
|
/**
|
|
* Reconstruct the state of this object from a checkpoint.
|
|
*
|
|
* @note CPU models should normally overload the
|
|
* unserializeThread() method instead of the unserialize() method
|
|
* as this provides a uniform data format for all CPU models and
|
|
* promotes better code reuse.
|
|
|
|
* @param cp The checkpoint use.
|
|
*/
|
|
void unserialize(CheckpointIn &cp) override;
|
|
|
|
/**
|
|
* Serialize a single thread.
|
|
*
|
|
* @param cp The stream to serialize to.
|
|
* @param tid ID of the current thread.
|
|
*/
|
|
virtual void serializeThread(CheckpointOut &cp, ThreadID tid) const {};
|
|
|
|
/**
|
|
* Unserialize one thread.
|
|
*
|
|
* @param cp The checkpoint use.
|
|
* @param tid ID of the current thread.
|
|
*/
|
|
virtual void unserializeThread(CheckpointIn &cp, ThreadID tid) {};
|
|
|
|
virtual Counter totalInsts() const = 0;
|
|
|
|
virtual Counter totalOps() const = 0;
|
|
|
|
/**
|
|
* Schedule an event that exits the simulation loops after a
|
|
* predefined number of instructions.
|
|
*
|
|
* This method is usually called from the configuration script to
|
|
* get an exit event some time in the future. It is typically used
|
|
* when the script wants to simulate for a specific number of
|
|
* instructions rather than ticks.
|
|
*
|
|
* @param tid Thread monitor.
|
|
* @param insts Number of instructions into the future.
|
|
* @param cause Cause to signal in the exit event.
|
|
*/
|
|
void scheduleInstStop(ThreadID tid, Counter insts, std::string cause);
|
|
|
|
/**
|
|
* Schedule simpoint events using the scheduleInstStop function.
|
|
*
|
|
* This is used to raise a SIMPOINT_BEGIN exit event in the gem5 standard
|
|
* library.
|
|
*
|
|
* @param inst_starts A vector of number of instructions to start simpoints
|
|
*/
|
|
|
|
void scheduleSimpointsInstStop(std::vector<Counter> inst_starts);
|
|
|
|
/**
|
|
* Schedule an exit event when any threads in the core reach the max_insts
|
|
* instructions using the scheduleInstStop function.
|
|
*
|
|
* This is used to raise a MAX_INSTS exit event in thegem5 standard library
|
|
*
|
|
* @param max_insts Number of instructions into the future.
|
|
*/
|
|
void scheduleInstStopAnyThread(Counter max_insts);
|
|
|
|
/**
|
|
* Get the number of instructions executed by the specified thread
|
|
* on this CPU. Used by Python to control simulation.
|
|
*
|
|
* @param tid Thread monitor
|
|
* @return Number of instructions executed
|
|
*/
|
|
uint64_t getCurrentInstCount(ThreadID tid);
|
|
|
|
public:
|
|
/**
|
|
* @{
|
|
* @name PMU Probe points.
|
|
*/
|
|
|
|
/**
|
|
* Helper method to trigger PMU probes for a committed
|
|
* instruction.
|
|
*
|
|
* @param inst Instruction that just committed
|
|
* @param pc PC of the instruction that just committed
|
|
*/
|
|
virtual void probeInstCommit(const StaticInstPtr &inst, Addr pc);
|
|
|
|
protected:
|
|
/**
|
|
* Helper method to instantiate probe points belonging to this
|
|
* object.
|
|
*
|
|
* @param name Name of the probe point.
|
|
* @return A unique_ptr to the new probe point.
|
|
*/
|
|
probing::PMUUPtr pmuProbePoint(const char *name);
|
|
|
|
/**
|
|
* Instruction commit probe point.
|
|
*
|
|
* This probe point is triggered whenever one or more instructions
|
|
* are committed. It is normally triggered once for every
|
|
* instruction. However, CPU models committing bundles of
|
|
* instructions may call notify once for the entire bundle.
|
|
*/
|
|
probing::PMUUPtr ppRetiredInsts;
|
|
probing::PMUUPtr ppRetiredInstsPC;
|
|
|
|
/** Retired load instructions */
|
|
probing::PMUUPtr ppRetiredLoads;
|
|
/** Retired store instructions */
|
|
probing::PMUUPtr ppRetiredStores;
|
|
|
|
/** Retired branches (any type) */
|
|
probing::PMUUPtr ppRetiredBranches;
|
|
|
|
/** CPU cycle counter even if any thread Context is suspended*/
|
|
probing::PMUUPtr ppAllCycles;
|
|
|
|
/** CPU cycle counter, only counts if any thread contexts is active **/
|
|
probing::PMUUPtr ppActiveCycles;
|
|
|
|
/**
|
|
* ProbePoint that signals transitions of threadContexts sets.
|
|
* The ProbePoint reports information through it bool parameter.
|
|
* - If the parameter is true then the last enabled threadContext of the
|
|
* CPU object was disabled.
|
|
* - If the parameter is false then a threadContext was enabled, all the
|
|
* remaining threadContexts are disabled.
|
|
*/
|
|
ProbePointArg<bool> *ppSleeping;
|
|
/** @} */
|
|
|
|
enum CPUState
|
|
{
|
|
CPU_STATE_ON,
|
|
CPU_STATE_SLEEP,
|
|
CPU_STATE_WAKEUP
|
|
};
|
|
|
|
Cycles previousCycle;
|
|
CPUState previousState;
|
|
|
|
/** base method keeping track of cycle progression **/
|
|
inline void
|
|
updateCycleCounters(CPUState state)
|
|
{
|
|
uint32_t delta = curCycle() - previousCycle;
|
|
|
|
if (previousState == CPU_STATE_ON) {
|
|
ppActiveCycles->notify(delta);
|
|
}
|
|
|
|
switch (state) {
|
|
case CPU_STATE_WAKEUP:
|
|
ppSleeping->notify(false);
|
|
break;
|
|
case CPU_STATE_SLEEP:
|
|
ppSleeping->notify(true);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
|
|
ppAllCycles->notify(delta);
|
|
|
|
previousCycle = curCycle();
|
|
previousState = state;
|
|
}
|
|
|
|
// Function tracing
|
|
private:
|
|
bool functionTracingEnabled;
|
|
std::ostream *functionTraceStream;
|
|
Addr currentFunctionStart;
|
|
Addr currentFunctionEnd;
|
|
Tick functionEntryTick;
|
|
void enableFunctionTrace();
|
|
void traceFunctionsInternal(Addr pc);
|
|
|
|
private:
|
|
static std::vector<BaseCPU *> cpuList; //!< Static global cpu list
|
|
|
|
public:
|
|
void
|
|
traceFunctions(Addr pc)
|
|
{
|
|
if (functionTracingEnabled)
|
|
traceFunctionsInternal(pc);
|
|
}
|
|
|
|
static int numSimulatedCPUs() { return cpuList.size(); }
|
|
static Counter
|
|
numSimulatedInsts()
|
|
{
|
|
Counter total = 0;
|
|
|
|
int size = cpuList.size();
|
|
for (int i = 0; i < size; ++i)
|
|
total += cpuList[i]->totalInsts();
|
|
|
|
return total;
|
|
}
|
|
|
|
static Counter
|
|
numSimulatedOps()
|
|
{
|
|
Counter total = 0;
|
|
|
|
int size = cpuList.size();
|
|
for (int i = 0; i < size; ++i)
|
|
total += cpuList[i]->totalOps();
|
|
|
|
return total;
|
|
}
|
|
|
|
public:
|
|
struct BaseCPUStats : public statistics::Group
|
|
{
|
|
BaseCPUStats(statistics::Group *parent);
|
|
// Number of CPU insts and ops committed at CPU core level
|
|
statistics::Scalar numInsts;
|
|
statistics::Scalar numOps;
|
|
// Number of CPU cycles simulated
|
|
statistics::Scalar numCycles;
|
|
/* CPI/IPC for total cycle counts and macro insts */
|
|
statistics::Formula cpi;
|
|
statistics::Formula ipc;
|
|
statistics::Scalar numWorkItemsStarted;
|
|
statistics::Scalar numWorkItemsCompleted;
|
|
} baseStats;
|
|
|
|
private:
|
|
std::vector<AddressMonitor> addressMonitor;
|
|
|
|
public:
|
|
void armMonitor(ThreadID tid, Addr address);
|
|
bool mwait(ThreadID tid, PacketPtr pkt);
|
|
void mwaitAtomic(ThreadID tid, ThreadContext *tc, BaseMMU *mmu);
|
|
AddressMonitor *
|
|
getCpuAddrMonitor(ThreadID tid)
|
|
{
|
|
assert(tid < numThreads);
|
|
return &addressMonitor[tid];
|
|
}
|
|
|
|
Cycles syscallRetryLatency;
|
|
|
|
/** This function is used to instruct the memory subsystem that a
|
|
* transaction should be aborted and the speculative state should be
|
|
* thrown away. This is called in the transaction's very last breath in
|
|
* the core. Afterwards, the core throws away its speculative state and
|
|
* resumes execution at the point the transaction started, i.e. reverses
|
|
* time. When instruction execution resumes, the core expects the
|
|
* memory subsystem to be in a stable, i.e. pre-speculative, state as
|
|
* well. */
|
|
virtual void
|
|
htmSendAbortSignal(ThreadID tid, uint64_t htm_uid,
|
|
HtmFailureFaultCause cause)
|
|
{
|
|
panic("htmSendAbortSignal not implemented");
|
|
}
|
|
|
|
// Enables CPU to enter power gating on a configurable cycle count
|
|
protected:
|
|
void enterPwrGating();
|
|
|
|
const Cycles pwrGatingLatency;
|
|
const bool powerGatingOnIdle;
|
|
EventFunctionWrapper enterPwrGatingEvent;
|
|
|
|
|
|
public:
|
|
struct FetchCPUStats : public statistics::Group
|
|
{
|
|
FetchCPUStats(statistics::Group *parent, int thread_id);
|
|
|
|
/* Total number of instructions fetched */
|
|
statistics::Scalar numInsts;
|
|
|
|
/* Total number of operations fetched */
|
|
statistics::Scalar numOps;
|
|
|
|
/* Number of instruction fetched per cycle. */
|
|
statistics::Formula fetchRate;
|
|
|
|
/* Total number of branches fetched */
|
|
statistics::Scalar numBranches;
|
|
|
|
/* Number of branch fetches per cycle. */
|
|
statistics::Formula branchRate;
|
|
|
|
/* Number of cycles stalled due to an icache miss */
|
|
statistics::Scalar icacheStallCycles;
|
|
|
|
/* Number of times fetch was asked to suspend by Execute */
|
|
statistics::Scalar numFetchSuspends;
|
|
|
|
};
|
|
|
|
struct ExecuteCPUStats: public statistics::Group
|
|
{
|
|
ExecuteCPUStats(statistics::Group *parent, int thread_id);
|
|
|
|
/* Stat for total number of executed instructions */
|
|
statistics::Scalar numInsts;
|
|
/* Number of executed nops */
|
|
statistics::Scalar numNop;
|
|
/* Number of executed branches */
|
|
statistics::Scalar numBranches;
|
|
/* Stat for total number of executed load instructions */
|
|
statistics::Scalar numLoadInsts;
|
|
/* Number of executed store instructions */
|
|
statistics::Formula numStoreInsts;
|
|
/* Number of instructions executed per cycle */
|
|
statistics::Formula instRate;
|
|
|
|
/* Number of cycles stalled for D-cache responses */
|
|
statistics::Scalar dcacheStallCycles;
|
|
|
|
/* Number of condition code register file accesses */
|
|
statistics::Scalar numCCRegReads;
|
|
statistics::Scalar numCCRegWrites;
|
|
|
|
/* number of float alu accesses */
|
|
statistics::Scalar numFpAluAccesses;
|
|
|
|
/* Number of float register file accesses */
|
|
statistics::Scalar numFpRegReads;
|
|
statistics::Scalar numFpRegWrites;
|
|
|
|
/* Number of integer alu accesses */
|
|
statistics::Scalar numIntAluAccesses;
|
|
|
|
/* Number of integer register file accesses */
|
|
statistics::Scalar numIntRegReads;
|
|
statistics::Scalar numIntRegWrites;
|
|
|
|
/* number of simulated memory references */
|
|
statistics::Scalar numMemRefs;
|
|
|
|
/* Number of misc register file accesses */
|
|
statistics::Scalar numMiscRegReads;
|
|
statistics::Scalar numMiscRegWrites;
|
|
|
|
/* Number of vector alu accesses */
|
|
statistics::Scalar numVecAluAccesses;
|
|
|
|
/* Number of predicate register file accesses */
|
|
mutable statistics::Scalar numVecPredRegReads;
|
|
statistics::Scalar numVecPredRegWrites;
|
|
|
|
/* Number of vector register file accesses */
|
|
mutable statistics::Scalar numVecRegReads;
|
|
statistics::Scalar numVecRegWrites;
|
|
|
|
/* Number of ops discarded before committing */
|
|
statistics::Scalar numDiscardedOps;
|
|
};
|
|
|
|
struct CommitCPUStats: public statistics::Group
|
|
{
|
|
CommitCPUStats(statistics::Group *parent, int thread_id);
|
|
|
|
/* Number of simulated instructions committed */
|
|
statistics::Scalar numInsts;
|
|
statistics::Scalar numOps;
|
|
|
|
/* Number of instructions committed that are not NOP or prefetches */
|
|
statistics::Scalar numInstsNotNOP;
|
|
statistics::Scalar numOpsNotNOP;
|
|
|
|
/* CPI/IPC for total cycle counts and macro insts */
|
|
statistics::Formula cpi;
|
|
statistics::Formula ipc;
|
|
|
|
/* Number of committed memory references. */
|
|
statistics::Scalar numMemRefs;
|
|
|
|
/* Number of float instructions */
|
|
statistics::Scalar numFpInsts;
|
|
|
|
/* Number of int instructions */
|
|
statistics::Scalar numIntInsts;
|
|
|
|
/* number of load instructions */
|
|
statistics::Scalar numLoadInsts;
|
|
|
|
/* Number of store instructions */
|
|
statistics::Scalar numStoreInsts;
|
|
|
|
/* Number of vector instructions */
|
|
statistics::Scalar numVecInsts;
|
|
|
|
/* Number of instructions committed by type (OpClass) */
|
|
statistics::Vector committedInstType;
|
|
|
|
/* number of control instructions committed by control inst type */
|
|
statistics::Vector committedControl;
|
|
void updateComCtrlStats(const StaticInstPtr staticInst);
|
|
|
|
};
|
|
|
|
std::vector<std::unique_ptr<FetchCPUStats>> fetchStats;
|
|
std::vector<std::unique_ptr<ExecuteCPUStats>> executeStats;
|
|
std::vector<std::unique_ptr<CommitCPUStats>> commitStats;
|
|
};
|
|
|
|
} // namespace gem5
|
|
|
|
#endif // __CPU_BASE_HH__
|