blob: 3976b66fe48ff8d17eca01c973b34ddde0eccc01 [file] [log] [blame]
/*
* Copyright (c) 2011-2013, 2017, 2020 ARM Limited
* All rights reserved
*
* The license below extends only to copyright in the software and shall
* not be construed as granting a license to any other intellectual
* property including but not limited to intellectual property relating
* to a hardware implementation of the functionality of the software
* licensed hereunder. You may use the software subject to the license
* terms below provided that you ensure that this notice is replicated
* unmodified and in its entirety in all distributions of the software,
* modified or unmodified, in source code or in binary form.
*
* Copyright (c) 2002-2005 The Regents of The University of Michigan
* Copyright (c) 2011 Regents of the University of California
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met: redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer;
* redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution;
* neither the name of the copyright holders nor the names of its
* contributors may be used to endorse or promote products derived from
* this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef __CPU_BASE_HH__
#define __CPU_BASE_HH__
#include <memory>
#include <vector>
#include "arch/generic/interrupts.hh"
#include "base/statistics.hh"
#include "debug/Mwait.hh"
#include "mem/htm.hh"
#include "mem/port_proxy.hh"
#include "sim/clocked_object.hh"
#include "sim/eventq.hh"
#include "sim/full_system.hh"
#include "sim/insttracer.hh"
#include "sim/probe/pmu.hh"
#include "sim/probe/probe.hh"
#include "sim/signal.hh"
#include "sim/system.hh"
namespace gem5
{
class BaseCPU;
struct BaseCPUParams;
class CheckerCPU;
class ThreadContext;
struct AddressMonitor
{
AddressMonitor();
bool doMonitor(PacketPtr pkt);
bool armed;
Addr vAddr;
Addr pAddr;
uint64_t val;
bool waiting; // 0=normal, 1=mwaiting
bool gotWakeup;
};
class CPUProgressEvent : public Event
{
protected:
Tick _interval;
Counter lastNumInst;
BaseCPU *cpu;
bool _repeatEvent;
public:
CPUProgressEvent(BaseCPU *_cpu, Tick ival = 0);
void process();
void interval(Tick ival) { _interval = ival; }
Tick interval() { return _interval; }
void repeatEvent(bool repeat) { _repeatEvent = repeat; }
virtual const char *description() const;
};
class BaseCPU : public ClockedObject
{
protected:
/// Instruction count used for SPARC misc register
/// @todo unify this with the counters that cpus individually keep
Tick instCnt;
// every cpu has an id, put it in the base cpu
// Set at initialization, only time a cpuId might change is during a
// takeover (which should be done from within the BaseCPU anyway,
// therefore no setCpuId() method is provided
int _cpuId;
/** Each cpu will have a socket ID that corresponds to its physical location
* in the system. This is usually used to bucket cpu cores under single DVFS
* domain. This information may also be required by the OS to identify the
* cpu core grouping (as in the case of ARM via MPIDR register)
*/
const uint32_t _socketId;
/** instruction side request id that must be placed in all requests */
RequestorID _instRequestorId;
/** data side request id that must be placed in all requests */
RequestorID _dataRequestorId;
/** An intrenal representation of a task identifier within gem5. This is
* used so the CPU can add which taskId (which is an internal representation
* of the OS process ID) to each request so components in the memory system
* can track which process IDs are ultimately interacting with them
*/
uint32_t _taskId;
/** The current OS process ID that is executing on this processor. This is
* used to generate a taskId */
uint32_t _pid;
/** Is the CPU switched out or active? */
bool _switchedOut;
/** Cache the cache line size that we get from the system */
const unsigned int _cacheLineSize;
/** Global CPU statistics that are merged into the Root object. */
struct GlobalStats : public statistics::Group
{
GlobalStats(statistics::Group *parent);
statistics::Value simInsts;
statistics::Value simOps;
statistics::Formula hostInstRate;
statistics::Formula hostOpRate;
};
/**
* Pointer to the global stat structure. This needs to be
* constructed from regStats since we merge it into the root
* group. */
static std::unique_ptr<GlobalStats> globalStats;
SignalSinkPort<bool> modelResetPort;
public:
/**
* Purely virtual method that returns a reference to the data
* port. All subclasses must implement this method.
*
* @return a reference to the data port
*/
virtual Port &getDataPort() = 0;
/**
* Purely virtual method that returns a reference to the instruction
* port. All subclasses must implement this method.
*
* @return a reference to the instruction port
*/
virtual Port &getInstPort() = 0;
/** Reads this CPU's ID. */
int cpuId() const { return _cpuId; }
/** Reads this CPU's Socket ID. */
uint32_t socketId() const { return _socketId; }
/** Reads this CPU's unique data requestor ID */
RequestorID dataRequestorId() const { return _dataRequestorId; }
/** Reads this CPU's unique instruction requestor ID */
RequestorID instRequestorId() const { return _instRequestorId; }
/**
* Get a port on this CPU. All CPUs have a data and
* instruction port, and this method uses getDataPort and
* getInstPort of the subclasses to resolve the two ports.
*
* @param if_name the port name
* @param idx ignored index
*
* @return a reference to the port with the given name
*/
Port &getPort(const std::string &if_name,
PortID idx=InvalidPortID) override;
/** Get cpu task id */
uint32_t taskId() const { return _taskId; }
/** Set cpu task id */
void taskId(uint32_t id) { _taskId = id; }
uint32_t getPid() const { return _pid; }
void setPid(uint32_t pid) { _pid = pid; }
inline void workItemBegin() { baseStats.numWorkItemsStarted++; }
inline void workItemEnd() { baseStats.numWorkItemsCompleted++; }
// @todo remove me after debugging with legion done
Tick instCount() { return instCnt; }
protected:
std::vector<BaseInterrupts*> interrupts;
public:
BaseInterrupts *
getInterruptController(ThreadID tid)
{
if (interrupts.empty())
return NULL;
assert(interrupts.size() > tid);
return interrupts[tid];
}
virtual void wakeup(ThreadID tid) = 0;
void postInterrupt(ThreadID tid, int int_num, int index);
void
clearInterrupt(ThreadID tid, int int_num, int index)
{
interrupts[tid]->clear(int_num, index);
}
void
clearInterrupts(ThreadID tid)
{
interrupts[tid]->clearAll();
}
bool
checkInterrupts(ThreadID tid) const
{
return FullSystem && interrupts[tid]->checkInterrupts();
}
protected:
std::vector<ThreadContext *> threadContexts;
trace::InstTracer * tracer;
public:
/** Invalid or unknown Pid. Possible when operating system is not present
* or has not assigned a pid yet */
static const uint32_t invldPid = std::numeric_limits<uint32_t>::max();
/// Provide access to the tracer pointer
trace::InstTracer * getTracer() { return tracer; }
/// Notify the CPU that the indicated context is now active.
virtual void activateContext(ThreadID thread_num);
/// Notify the CPU that the indicated context is now suspended.
/// Check if possible to enter a lower power state
virtual void suspendContext(ThreadID thread_num);
/// Notify the CPU that the indicated context is now halted.
virtual void haltContext(ThreadID thread_num);
/// Given a Thread Context pointer return the thread num
int findContext(ThreadContext *tc);
/// Given a thread num get tho thread context for it
virtual ThreadContext *getContext(int tn) { return threadContexts[tn]; }
/// Get the number of thread contexts available
unsigned
numContexts()
{
return static_cast<unsigned>(threadContexts.size());
}
/// Convert ContextID to threadID
ThreadID
contextToThread(ContextID cid)
{
return static_cast<ThreadID>(cid - threadContexts[0]->contextId());
}
public:
PARAMS(BaseCPU);
BaseCPU(const Params &params, bool is_checker = false);
virtual ~BaseCPU();
void init() override;
void startup() override;
void regStats() override;
void regProbePoints() override;
void registerThreadContexts();
// Functions to deschedule and reschedule the events to enter the
// power gating sleep before and after checkpoiting respectively.
void deschedulePowerGatingEvent();
void schedulePowerGatingEvent();
/**
* Prepare for another CPU to take over execution.
*
* When this method exits, all internal state should have been
* flushed. After the method returns, the simulator calls
* takeOverFrom() on the new CPU with this CPU as its parameter.
*/
virtual void switchOut();
/**
* Load the state of a CPU from the previous CPU object, invoked
* on all new CPUs that are about to be switched in.
*
* A CPU model implementing this method is expected to initialize
* its state from the old CPU and connect its memory (unless they
* are already connected) to the memories connected to the old
* CPU.
*
* @param cpu CPU to initialize read state from.
*/
virtual void takeOverFrom(BaseCPU *cpu);
/**
* Set the reset of the CPU to be either asserted or deasserted.
*
* When asserted, the CPU should be stopped and waiting. When deasserted,
* the CPU should start running again, unless some other condition would
* also prevent it. At the point the reset is deasserted, it should be
* reinitialized as defined by the ISA it's running and any other relevant
* part of its configuration (reset address, etc).
*
* @param state The new state of the reset signal to this CPU.
*/
virtual void setReset(bool state);
/**
* Flush all TLBs in the CPU.
*
* This method is mainly used to flush stale translations when
* switching CPUs. It is also exported to the Python world to
* allow it to request a TLB flush after draining the CPU to make
* it easier to compare traces when debugging
* handover/checkpointing.
*/
void flushTLBs();
/**
* Determine if the CPU is switched out.
*
* @return True if the CPU is switched out, false otherwise.
*/
bool switchedOut() const { return _switchedOut; }
/**
* Verify that the system is in a memory mode supported by the
* CPU.
*
* Implementations are expected to query the system for the
* current memory mode and ensure that it is what the CPU model
* expects. If the check fails, the implementation should
* terminate the simulation using fatal().
*/
virtual void verifyMemoryMode() const { };
/**
* Number of threads we're actually simulating (<= SMT_MAX_THREADS).
* This is a constant for the duration of the simulation.
*/
ThreadID numThreads;
System *system;
/**
* Get the cache line size of the system.
*/
inline unsigned int cacheLineSize() const { return _cacheLineSize; }
/**
* Serialize this object to the given output stream.
*
* @note CPU models should normally overload the serializeThread()
* method instead of the serialize() method as this provides a
* uniform data format for all CPU models and promotes better code
* reuse.
*
* @param cp The stream to serialize to.
*/
void serialize(CheckpointOut &cp) const override;
/**
* Reconstruct the state of this object from a checkpoint.
*
* @note CPU models should normally overload the
* unserializeThread() method instead of the unserialize() method
* as this provides a uniform data format for all CPU models and
* promotes better code reuse.
* @param cp The checkpoint use.
*/
void unserialize(CheckpointIn &cp) override;
/**
* Serialize a single thread.
*
* @param cp The stream to serialize to.
* @param tid ID of the current thread.
*/
virtual void serializeThread(CheckpointOut &cp, ThreadID tid) const {};
/**
* Unserialize one thread.
*
* @param cp The checkpoint use.
* @param tid ID of the current thread.
*/
virtual void unserializeThread(CheckpointIn &cp, ThreadID tid) {};
virtual Counter totalInsts() const = 0;
virtual Counter totalOps() const = 0;
/**
* Schedule an event that exits the simulation loops after a
* predefined number of instructions.
*
* This method is usually called from the configuration script to
* get an exit event some time in the future. It is typically used
* when the script wants to simulate for a specific number of
* instructions rather than ticks.
*
* @param tid Thread monitor.
* @param insts Number of instructions into the future.
* @param cause Cause to signal in the exit event.
*/
void scheduleInstStop(ThreadID tid, Counter insts, std::string cause);
/**
* Schedule simpoint events using the scheduleInstStop function.
*
* This is used to raise a SIMPOINT_BEGIN exit event in the gem5 standard
* library.
*
* @param inst_starts A vector of number of instructions to start simpoints
*/
void scheduleSimpointsInstStop(std::vector<Counter> inst_starts);
/**
* Schedule an exit event when any threads in the core reach the max_insts
* instructions using the scheduleInstStop function.
*
* This is used to raise a MAX_INSTS exit event in thegem5 standard library
*
* @param max_insts Number of instructions into the future.
*/
void scheduleInstStopAnyThread(Counter max_insts);
/**
* Get the number of instructions executed by the specified thread
* on this CPU. Used by Python to control simulation.
*
* @param tid Thread monitor
* @return Number of instructions executed
*/
uint64_t getCurrentInstCount(ThreadID tid);
public:
/**
* @{
* @name PMU Probe points.
*/
/**
* Helper method to trigger PMU probes for a committed
* instruction.
*
* @param inst Instruction that just committed
* @param pc PC of the instruction that just committed
*/
virtual void probeInstCommit(const StaticInstPtr &inst, Addr pc);
protected:
/**
* Helper method to instantiate probe points belonging to this
* object.
*
* @param name Name of the probe point.
* @return A unique_ptr to the new probe point.
*/
probing::PMUUPtr pmuProbePoint(const char *name);
/**
* Instruction commit probe point.
*
* This probe point is triggered whenever one or more instructions
* are committed. It is normally triggered once for every
* instruction. However, CPU models committing bundles of
* instructions may call notify once for the entire bundle.
*/
probing::PMUUPtr ppRetiredInsts;
probing::PMUUPtr ppRetiredInstsPC;
/** Retired load instructions */
probing::PMUUPtr ppRetiredLoads;
/** Retired store instructions */
probing::PMUUPtr ppRetiredStores;
/** Retired branches (any type) */
probing::PMUUPtr ppRetiredBranches;
/** CPU cycle counter even if any thread Context is suspended*/
probing::PMUUPtr ppAllCycles;
/** CPU cycle counter, only counts if any thread contexts is active **/
probing::PMUUPtr ppActiveCycles;
/**
* ProbePoint that signals transitions of threadContexts sets.
* The ProbePoint reports information through it bool parameter.
* - If the parameter is true then the last enabled threadContext of the
* CPU object was disabled.
* - If the parameter is false then a threadContext was enabled, all the
* remaining threadContexts are disabled.
*/
ProbePointArg<bool> *ppSleeping;
/** @} */
enum CPUState
{
CPU_STATE_ON,
CPU_STATE_SLEEP,
CPU_STATE_WAKEUP
};
Cycles previousCycle;
CPUState previousState;
/** base method keeping track of cycle progression **/
inline void
updateCycleCounters(CPUState state)
{
uint32_t delta = curCycle() - previousCycle;
if (previousState == CPU_STATE_ON) {
ppActiveCycles->notify(delta);
}
switch (state) {
case CPU_STATE_WAKEUP:
ppSleeping->notify(false);
break;
case CPU_STATE_SLEEP:
ppSleeping->notify(true);
break;
default:
break;
}
ppAllCycles->notify(delta);
previousCycle = curCycle();
previousState = state;
}
// Function tracing
private:
bool functionTracingEnabled;
std::ostream *functionTraceStream;
Addr currentFunctionStart;
Addr currentFunctionEnd;
Tick functionEntryTick;
void enableFunctionTrace();
void traceFunctionsInternal(Addr pc);
private:
static std::vector<BaseCPU *> cpuList; //!< Static global cpu list
public:
void
traceFunctions(Addr pc)
{
if (functionTracingEnabled)
traceFunctionsInternal(pc);
}
static int numSimulatedCPUs() { return cpuList.size(); }
static Counter
numSimulatedInsts()
{
Counter total = 0;
int size = cpuList.size();
for (int i = 0; i < size; ++i)
total += cpuList[i]->totalInsts();
return total;
}
static Counter
numSimulatedOps()
{
Counter total = 0;
int size = cpuList.size();
for (int i = 0; i < size; ++i)
total += cpuList[i]->totalOps();
return total;
}
public:
struct BaseCPUStats : public statistics::Group
{
BaseCPUStats(statistics::Group *parent);
// Number of CPU insts and ops committed at CPU core level
statistics::Scalar numInsts;
statistics::Scalar numOps;
// Number of CPU cycles simulated
statistics::Scalar numCycles;
/* CPI/IPC for total cycle counts and macro insts */
statistics::Formula cpi;
statistics::Formula ipc;
statistics::Scalar numWorkItemsStarted;
statistics::Scalar numWorkItemsCompleted;
} baseStats;
private:
std::vector<AddressMonitor> addressMonitor;
public:
void armMonitor(ThreadID tid, Addr address);
bool mwait(ThreadID tid, PacketPtr pkt);
void mwaitAtomic(ThreadID tid, ThreadContext *tc, BaseMMU *mmu);
AddressMonitor *
getCpuAddrMonitor(ThreadID tid)
{
assert(tid < numThreads);
return &addressMonitor[tid];
}
Cycles syscallRetryLatency;
/** This function is used to instruct the memory subsystem that a
* transaction should be aborted and the speculative state should be
* thrown away. This is called in the transaction's very last breath in
* the core. Afterwards, the core throws away its speculative state and
* resumes execution at the point the transaction started, i.e. reverses
* time. When instruction execution resumes, the core expects the
* memory subsystem to be in a stable, i.e. pre-speculative, state as
* well. */
virtual void
htmSendAbortSignal(ThreadID tid, uint64_t htm_uid,
HtmFailureFaultCause cause)
{
panic("htmSendAbortSignal not implemented");
}
// Enables CPU to enter power gating on a configurable cycle count
protected:
void enterPwrGating();
const Cycles pwrGatingLatency;
const bool powerGatingOnIdle;
EventFunctionWrapper enterPwrGatingEvent;
public:
struct FetchCPUStats : public statistics::Group
{
FetchCPUStats(statistics::Group *parent, int thread_id);
/* Total number of instructions fetched */
statistics::Scalar numInsts;
/* Total number of operations fetched */
statistics::Scalar numOps;
/* Number of instruction fetched per cycle. */
statistics::Formula fetchRate;
/* Total number of branches fetched */
statistics::Scalar numBranches;
/* Number of branch fetches per cycle. */
statistics::Formula branchRate;
/* Number of cycles stalled due to an icache miss */
statistics::Scalar icacheStallCycles;
/* Number of times fetch was asked to suspend by Execute */
statistics::Scalar numFetchSuspends;
};
struct ExecuteCPUStats: public statistics::Group
{
ExecuteCPUStats(statistics::Group *parent, int thread_id);
/* Stat for total number of executed instructions */
statistics::Scalar numInsts;
/* Number of executed nops */
statistics::Scalar numNop;
/* Number of executed branches */
statistics::Scalar numBranches;
/* Stat for total number of executed load instructions */
statistics::Scalar numLoadInsts;
/* Number of executed store instructions */
statistics::Formula numStoreInsts;
/* Number of instructions executed per cycle */
statistics::Formula instRate;
/* Number of cycles stalled for D-cache responses */
statistics::Scalar dcacheStallCycles;
/* Number of condition code register file accesses */
statistics::Scalar numCCRegReads;
statistics::Scalar numCCRegWrites;
/* number of float alu accesses */
statistics::Scalar numFpAluAccesses;
/* Number of float register file accesses */
statistics::Scalar numFpRegReads;
statistics::Scalar numFpRegWrites;
/* Number of integer alu accesses */
statistics::Scalar numIntAluAccesses;
/* Number of integer register file accesses */
statistics::Scalar numIntRegReads;
statistics::Scalar numIntRegWrites;
/* number of simulated memory references */
statistics::Scalar numMemRefs;
/* Number of misc register file accesses */
statistics::Scalar numMiscRegReads;
statistics::Scalar numMiscRegWrites;
/* Number of vector alu accesses */
statistics::Scalar numVecAluAccesses;
/* Number of predicate register file accesses */
mutable statistics::Scalar numVecPredRegReads;
statistics::Scalar numVecPredRegWrites;
/* Number of vector register file accesses */
mutable statistics::Scalar numVecRegReads;
statistics::Scalar numVecRegWrites;
/* Number of ops discarded before committing */
statistics::Scalar numDiscardedOps;
};
struct CommitCPUStats: public statistics::Group
{
CommitCPUStats(statistics::Group *parent, int thread_id);
/* Number of simulated instructions committed */
statistics::Scalar numInsts;
statistics::Scalar numOps;
/* Number of instructions committed that are not NOP or prefetches */
statistics::Scalar numInstsNotNOP;
statistics::Scalar numOpsNotNOP;
/* CPI/IPC for total cycle counts and macro insts */
statistics::Formula cpi;
statistics::Formula ipc;
/* Number of committed memory references. */
statistics::Scalar numMemRefs;
/* Number of float instructions */
statistics::Scalar numFpInsts;
/* Number of int instructions */
statistics::Scalar numIntInsts;
/* number of load instructions */
statistics::Scalar numLoadInsts;
/* Number of store instructions */
statistics::Scalar numStoreInsts;
/* Number of vector instructions */
statistics::Scalar numVecInsts;
/* Number of instructions committed by type (OpClass) */
statistics::Vector committedInstType;
/* number of control instructions committed by control inst type */
statistics::Vector committedControl;
void updateComCtrlStats(const StaticInstPtr staticInst);
};
std::vector<std::unique_ptr<FetchCPUStats>> fetchStats;
std::vector<std::unique_ptr<ExecuteCPUStats>> executeStats;
std::vector<std::unique_ptr<CommitCPUStats>> commitStats;
};
} // namespace gem5
#endif // __CPU_BASE_HH__