diff options
Diffstat (limited to 'cpu/o3')
-rw-r--r-- | cpu/o3/alpha_cpu_impl.hh | 24 | ||||
-rw-r--r-- | cpu/o3/commit_impl.hh | 14 | ||||
-rw-r--r-- | cpu/o3/thread_state.hh | 29 |
3 files changed, 54 insertions, 13 deletions
diff --git a/cpu/o3/alpha_cpu_impl.hh b/cpu/o3/alpha_cpu_impl.hh index 1bf0652cd..071a870ef 100644 --- a/cpu/o3/alpha_cpu_impl.hh +++ b/cpu/o3/alpha_cpu_impl.hh @@ -153,15 +153,6 @@ AlphaFullCPU<Impl>::regStats() this->commit.regStats(); } -#if FULL_SYSTEM -template <class Impl> -void -AlphaFullCPU<Impl>::AlphaXC::dumpFuncProfile() -{ - // Currently not supported -} -#endif - template <class Impl> void AlphaFullCPU<Impl>::AlphaXC::takeOverFrom(ExecContext *old_context) @@ -336,13 +327,24 @@ AlphaFullCPU<Impl>::AlphaXC::readLastSuspend() template <class Impl> void +AlphaFullCPU<Impl>::AlphaXC::dumpFuncProfile() +{ + thread->dumpFuncProfile(); +} + +template <class Impl> +void AlphaFullCPU<Impl>::AlphaXC::profileClear() -{} +{ + thread->profileClear(); +} template <class Impl> void AlphaFullCPU<Impl>::AlphaXC::profileSample() -{} +{ + thread->profileSample(); +} #endif template <class Impl> diff --git a/cpu/o3/commit_impl.hh b/cpu/o3/commit_impl.hh index 364e685c2..cd10ec6b2 100644 --- a/cpu/o3/commit_impl.hh +++ b/cpu/o3/commit_impl.hh @@ -1035,6 +1035,20 @@ DefaultCommit<Impl>::commitHead(DynInstPtr &head_inst, unsigned inst_num) updateComInstStats(head_inst); +#if FULL_SYSTEM + if (thread[tid]->profile) { +// bool usermode = +// (cpu->readMiscReg(AlphaISA::IPR_DTB_CM, tid) & 0x18) != 0; +// thread[tid]->profilePC = usermode ? 1 : head_inst->readPC(); + thread[tid]->profilePC = head_inst->readPC(); + ProfileNode *node = thread[tid]->profile->consume(thread[tid]->getXCProxy(), + head_inst->staticInst); + + if (node) + thread[tid]->profileNode = node; + } +#endif + if (head_inst->traceData) { head_inst->traceData->setFetchSeq(head_inst->seqNum); head_inst->traceData->setCPSeq(thread[tid]->numInst); diff --git a/cpu/o3/thread_state.hh b/cpu/o3/thread_state.hh index 3f1208ea0..28f488143 100644 --- a/cpu/o3/thread_state.hh +++ b/cpu/o3/thread_state.hh @@ -31,8 +31,11 @@ #include "arch/faults.hh" #include "arch/isa_traits.hh" +#include "base/callback.hh" +#include "base/output.hh" #include "cpu/exec_context.hh" #include "cpu/thread_state.hh" +#include "sim/sim_exit.hh" class Event; class Process; @@ -83,8 +86,22 @@ struct O3ThreadState : public ThreadState { #if FULL_SYSTEM O3ThreadState(FullCPU *_cpu, int _thread_num, FunctionalMemory *_mem) : ThreadState(-1, _thread_num, _mem), - inSyscall(0), trapPending(0) - { } + cpu(_cpu), inSyscall(0), trapPending(0) + { + if (cpu->params->profile) { + profile = new FunctionProfile(cpu->params->system->kernelSymtab); + Callback *cb = + new MakeCallback<O3ThreadState, + &O3ThreadState::dumpFuncProfile>(this); + registerExitCallback(cb); + } + + // let's fill with a dummy node for now so we don't get a segfault + // on the first cycle when there's no node available. + static ProfileNode dummyNode; + profileNode = &dummyNode; + profilePC = 3; + } #else O3ThreadState(FullCPU *_cpu, int _thread_num, Process *_process, int _asid) : ThreadState(-1, _thread_num, _process->getMemory(), _process, _asid), @@ -138,6 +155,14 @@ struct O3ThreadState : public ThreadState { /** Handles the syscall. */ void syscall() { process->syscall(xcProxy); } #endif + +#if FULL_SYSTEM + void dumpFuncProfile() + { + std::ostream *os = simout.create(csprintf("profile.%s.dat", cpu->name())); + profile->dump(xcProxy, *os); + } +#endif }; #endif // __CPU_O3_THREAD_STATE_HH__ |