~swilson/gem5-docs/GPUCoalescer_8hh_source.html

 /*

  * Copyright (c) 2013-2015 Advanced Micro Devices, Inc.

  * All rights reserved.

  *

  * For use for simulation and test purposes only

  *

  * Redistribution and use in source and binary forms, with or without

  * modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice,

  * this list of conditions and the following disclaimer.

  *

  * 2. Redistributions in binary form must reproduce the above copyright notice,

  * this list of conditions and the following disclaimer in the documentation

  * and/or other materials provided with the distribution.

  *

  * 3. Neither the name of the copyright holder nor the names of its contributors

  * may be used to endorse or promote products derived from this software

  * without specific prior written permission.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

  * POSSIBILITY OF SUCH DAMAGE.

  *

  * Author: Sooraj Puthoor

  */


 #ifndef __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__

 #define __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__


 #include <iostream>

 #include <unordered_map>


 #include "base/statistics.hh"

 #include "mem/protocol/HSAScope.hh"

 #include "mem/protocol/HSASegment.hh"

 #include "mem/protocol/PrefetchBit.hh"

 #include "mem/protocol/RubyAccessMode.hh"

 #include "mem/protocol/RubyRequestType.hh"

 #include "mem/protocol/SequencerRequestType.hh"

 #include "mem/request.hh"

 #include "mem/ruby/common/Address.hh"

 #include "mem/ruby/common/Consumer.hh"

 #include "mem/ruby/system/Sequencer.hh"


 // Forward declarations of types that this header refers to without needing
 // their full definitions.
 // NOTE(review): CacheMsg is not referenced anywhere in the visible part of
 // this header - confirm whether the declaration is still needed.
 class DataBlock;

 class CacheMsg;

 class MachineID;

 class CacheMemory;


 // Parameter type accepted by the GPUCoalescer constructor (aliased inside the
 // class as GPUCoalescer::Params).
 class RubyGPUCoalescerParams;


 // Free helpers that take a Request and return an HSAScope / HSASegment value.
 // Only declared here; NOTE(review): the mapping itself is implemented out of
 // line and is not visible in this header.
 HSAScope reqScopeToHSAScope(Request* req);

 HSASegment reqSegmentToHSASegment(Request* req);


 /**
  * Plain record describing one request: the packet, the Ruby request type
  * it was given, and the cycle value supplied as its issue time.
  * All three fields are set once by the constructor and are publicly
  * accessible.
  */
 struct GPUCoalescerRequest
 {
     /**
      * @param _pkt         packet associated with the request
      * @param _m_type      Ruby request type of the request
      * @param _issue_time  cycle value stored as the issue time
      */
     GPUCoalescerRequest(PacketPtr _pkt, RubyRequestType _m_type,
                         Cycles _issue_time)
         : pkt(_pkt),
           m_type(_m_type),
           issue_time(_issue_time)
     {
     }

     PacketPtr pkt;            // packet handed to the constructor
     RubyRequestType m_type;   // request type handed to the constructor
     Cycles issue_time;        // issue time handed to the constructor
 };


 /**
  * Descriptor pairing a packet with a primary and a secondary
  * RubyRequestType. All members are public.
  */
 class RequestDesc
 {
   public:
     PacketPtr pkt;                  // described packet (nullptr by default)
     RubyRequestType primaryType;    // primary request type
     RubyRequestType secondaryType;  // secondary request type

     /** Empty descriptor: no packet, both types RubyRequestType_NULL. */
     RequestDesc()
         : pkt(nullptr),
           primaryType(RubyRequestType_NULL),
           secondaryType(RubyRequestType_NULL)
     {}

     /**
      * @param pkt     packet to describe
      * @param p_type  stored as primaryType
      * @param s_type  stored as secondaryType
      */
     RequestDesc(PacketPtr pkt, RubyRequestType p_type, RubyRequestType s_type)
         : pkt(pkt),
           primaryType(p_type),
           secondaryType(s_type)
     {}
 };


 // Stream-insertion operator for GPUCoalescerRequest. Declaration only;
 // NOTE(review): no definition is visible in this header - confirm one exists
 // before streaming a GPUCoalescerRequest.
 std::ostream& operator<<(std::ostream& out, const GPUCoalescerRequest& obj);


 /**
  * RubyPort subclass that keeps per-address tables of outstanding read and
  * write requests plus a coalescing table of request descriptors, and that
  * owns a set of hit/miss counters and latency histograms.
  *
  * makeRequest() and issueRequest() are virtual, and most state is
  * protected, so that the VIPER coalescer can derive from this class and
  * supply alternate implementations.
  *
  * Instances are not copyable.
  */
 class GPUCoalescer : public RubyPort
 {
   public:
     typedef RubyGPUCoalescerParams Params;
     GPUCoalescer(const Params *);
     ~GPUCoalescer();

     // Public Methods
     void wakeup(); // Used only for deadlock detection

     void printProgress(std::ostream& out) const;
     // Reset statistics associated with this object.
     void resetStats();
     // NOTE(review): no definition is visible in this header - confirm one
     // exists before calling.
     void collateStats();
     // Register statistics for this object.
     void regStats();

     // Write-completion callbacks. The overloads differ only in how much
     // information the caller supplies: the responding machine type, the
     // three request/response timestamps, and the isRegion flag.
     void writeCallback(Addr address, DataBlock& data);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data,
                        Cycles initialRequestTime,
                        Cycles forwardRequestTime,
                        Cycles firstResponseTime,
                        bool isRegion);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data,
                        Cycles initialRequestTime,
                        Cycles forwardRequestTime,
                        Cycles firstResponseTime);

     // Read-completion callbacks; same overload scheme as writeCallback().
     void readCallback(Addr address, DataBlock& data);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data,
                       Cycles initialRequestTime,
                       Cycles forwardRequestTime,
                       Cycles firstResponseTime);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data,
                       Cycles initialRequestTime,
                       Cycles forwardRequestTime,
                       Cycles firstResponseTime,
                       bool isRegion);

     /* atomics need their own callback because the data
        might be const coming from SLICC */
     void atomicCallback(Addr address,
                         MachineType mach,
                         const DataBlock& data);

     void recordCPReadCallBack(MachineID myMachID, MachineID senderMachID);
     void recordCPWriteCallBack(MachineID myMachID, MachineID senderMachID);

     // Alternate implementations in VIPER Coalescer
     virtual RequestStatus makeRequest(PacketPtr pkt);

     // Current value of the global outstanding request counter.
     int outstandingCount() const { return m_outstanding_count; }

     // True while the deadlock-check event is scheduled.
     bool
     isDeadlockEventScheduled() const
     {
         return deadlockCheckEvent.scheduled();
     }

     // Remove the deadlock-check event from the event queue.
     void
     descheduleDeadlockEvent()
     {
         deschedule(deadlockCheckEvent);
     }

     bool empty() const;

     // Writes a textual representation to 'out'; used by operator<<.
     void print(std::ostream& out) const;
     void checkCoherence(Addr address);

     void markRemoved();
     void removeRequest(GPUCoalescerRequest* request);
     void evictionCallback(Addr address);
     void completeIssue();

     void insertKernel(int wavefront_id, PacketPtr pkt);

     void recordRequestType(SequencerRequestType requestType);

     // Statistics accessors. The indexed variants dereference the stored
     // histogram pointer at the given index without any bounds or null
     // check, so the caller must pass a valid index.
     Stats::Histogram& getOutstandReqHist() { return m_outstandReqHist; }

     Stats::Histogram& getLatencyHist() { return m_latencyHist; }
     Stats::Histogram& getTypeLatencyHist(uint32_t t)
     { return *m_typeLatencyHist[t]; }

     Stats::Histogram& getMissLatencyHist()
     { return m_missLatencyHist; }
     Stats::Histogram& getMissTypeLatencyHist(uint32_t t)
     { return *m_missTypeLatencyHist[t]; }

     Stats::Histogram& getMissMachLatencyHist(uint32_t t) const
     { return *m_missMachLatencyHist[t]; }

     Stats::Histogram&
     getMissTypeMachLatencyHist(uint32_t r, uint32_t t) const
     { return *m_missTypeMachLatencyHist[r][t]; }

     Stats::Histogram& getIssueToInitialDelayHist(uint32_t t) const
     { return *m_IssueToInitialDelayHist[t]; }

     Stats::Histogram&
     getInitialToForwardDelayHist(const MachineType t) const
     { return *m_InitialToForwardDelayHist[t]; }

     Stats::Histogram&
     getForwardRequestToFirstResponseHist(const MachineType t) const
     { return *m_ForwardToFirstResponseDelayHist[t]; }

     Stats::Histogram&
     getFirstResponseToCompletionDelayHist(const MachineType t) const
     { return *m_FirstResponseToCompletionDelayHist[t]; }

   // Changed to protected to enable inheritance by VIPER Coalescer
   protected:
     // NOTE(review): no definition is visible in this header - confirm one
     // exists before calling.
     bool tryCacheAccess(Addr addr, RubyRequestType type,
                         Addr pc, RubyAccessMode access_mode,
                         int size, DataBlock*& data_ptr);
     // Alternate implementations in VIPER Coalescer
     virtual void issueRequest(PacketPtr pkt, RubyRequestType type);

     void kernelCallback(int wavfront_id);

     void hitCallback(GPUCoalescerRequest* request,
                      MachineType mach,
                      DataBlock& data,
                      bool success,
                      Cycles initialRequestTime,
                      Cycles forwardRequestTime,
                      Cycles firstResponseTime,
                      bool isRegion);
     void recordMissLatency(GPUCoalescerRequest* request,
                            MachineType mach,
                            Cycles initialRequestTime,
                            Cycles forwardRequestTime,
                            Cycles firstResponseTime,
                            bool success, bool isRegion);
     void completeHitCallback(std::vector<PacketPtr> & mylist, int len);
     PacketPtr mapAddrToPkt(Addr address);

     RequestStatus getRequestStatus(PacketPtr pkt,
                                    RubyRequestType request_type);
     bool insertRequest(PacketPtr pkt, RubyRequestType request_type);

     bool handleLlsc(Addr address, GPUCoalescerRequest* request);

     // Event type that holds a back-pointer to its GPUCoalescer; its
     // member functions are defined out of line.
     class IssueEvent : public Event
     {
       private:
         GPUCoalescer *seq;
       public:
         IssueEvent(GPUCoalescer *_seq);
         void process();
         const char *description() const;
     };

     IssueEvent issueEvent;

   // Changed to protected to enable inheritance by VIPER Coalescer
   protected:
     int m_max_outstanding_requests;
     int m_deadlock_threshold;

     CacheMemory* m_dataCache_ptr;
     CacheMemory* m_instCache_ptr;

     // The cache access latency for this GPU data cache. This is assessed at the
     // beginning of each access. This should be very similar to the
     // implementation in Sequencer() as this is very much like a Sequencer
     Cycles m_data_cache_hit_latency;

     // We need to track both the primary and secondary request types.
     // The secondary request type comprises a subset of RubyRequestTypes that
     // are understood by the L1 Controller. A primary request type can be any
     // RubyRequestType.
     typedef std::unordered_map<Addr, std::vector<RequestDesc>> CoalescingTable;
     CoalescingTable reqCoalescer;
     std::vector<Addr> newRequests;

     // Address-keyed tables of request records; the mapped values are raw
     // pointers (NOTE(review): ownership is not visible in this header).
     typedef std::unordered_map<Addr, GPUCoalescerRequest*> RequestTable;
     RequestTable m_writeRequestTable;
     RequestTable m_readRequestTable;
     // Global outstanding request count, across all request tables
     int m_outstanding_count;
     bool m_deadlock_check_scheduled;
     std::unordered_map<int, PacketPtr> kernelEndList;
     std::vector<int> newKernelEnds;

     int m_store_waiting_on_load_cycles;
     int m_store_waiting_on_store_cycles;
     int m_load_waiting_on_store_cycles;
     int m_load_waiting_on_load_cycles;

     bool m_runningGarnetStandalone;

     // Event whose process() simply calls wakeup() on the owning
     // GPUCoalescer; used for the deadlock check.
     class GPUCoalescerWakeupEvent : public Event
     {
       private:
         GPUCoalescer *m_GPUCoalescer_ptr;

       public:
         GPUCoalescerWakeupEvent(GPUCoalescer *_seq) :
             m_GPUCoalescer_ptr(_seq) {}
         void process() { m_GPUCoalescer_ptr->wakeup(); }
         const char *description() const
         {
             return "GPUCoalescer deadlock check";
         }
     };

     GPUCoalescerWakeupEvent deadlockCheckEvent;
     bool assumingRfOCoherence;

     // m5 style stats for TCP hit/miss counts
     Stats::Scalar GPU_TCPLdHits;
     Stats::Scalar GPU_TCPLdTransfers;
     Stats::Scalar GPU_TCCLdHits;
     Stats::Scalar GPU_LdMiss;

     Stats::Scalar GPU_TCPStHits;
     Stats::Scalar GPU_TCPStTransfers;
     Stats::Scalar GPU_TCCStHits;
     Stats::Scalar GPU_StMiss;

     Stats::Scalar CP_TCPLdHits;
     Stats::Scalar CP_TCPLdTransfers;
     Stats::Scalar CP_TCCLdHits;
     Stats::Scalar CP_LdMiss;

     Stats::Scalar CP_TCPStHits;
     Stats::Scalar CP_TCPStTransfers;
     Stats::Scalar CP_TCCStHits;
     Stats::Scalar CP_StMiss;

     // Histogram for number of outstanding requests per cycle.
     Stats::Histogram m_outstandReqHist;

     // Histogram for holding latency profile of all requests.
     Stats::Histogram m_latencyHist;
     std::vector<Stats::Histogram *> m_typeLatencyHist;

     // Histogram for holding latency profile of all requests that miss.
     Stats::Histogram m_missLatencyHist;
     std::vector<Stats::Histogram *> m_missTypeLatencyHist;

     // Histograms for profiling the latencies for requests that
     // required external messages.
     std::vector<Stats::Histogram *> m_missMachLatencyHist;
     std::vector< std::vector<Stats::Histogram *> > m_missTypeMachLatencyHist;

     // Histograms for recording the breakdown of miss latency.
     std::vector<Stats::Histogram *> m_IssueToInitialDelayHist;
     std::vector<Stats::Histogram *> m_InitialToForwardDelayHist;
     std::vector<Stats::Histogram *> m_ForwardToFirstResponseDelayHist;
     std::vector<Stats::Histogram *> m_FirstResponseToCompletionDelayHist;

   private:
     // Non-copyable: copy construction and copy assignment are explicitly
     // deleted so that any attempted copy (including from inside the class)
     // is rejected at compile time rather than at link time.
     GPUCoalescer(const GPUCoalescer& obj) = delete;
     GPUCoalescer& operator=(const GPUCoalescer& obj) = delete;
 };


 /**
  * Stream-insertion operator for GPUCoalescer: lets the object write itself
  * through GPUCoalescer::print() and then flushes the stream.
  *
  * @param out  destination stream
  * @param obj  coalescer to print
  * @return     the same stream, to allow chaining
  */
 inline std::ostream&
 operator<<(std::ostream& out, const GPUCoalescer& obj)
 {
     obj.print(out);
     // Inserting std::flush flushes 'out' and yields the stream itself.
     return out << std::flush;
 }


 #endif // __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__


GPUCoalescer::getLatencyHist
Stats::Histogram & getLatencyHist()
Definition: GPUCoalescer.hh:193

GPUCoalescer::recordMissLatency
void recordMissLatency(GPUCoalescerRequest *request, MachineType mach, Cycles initialRequestTime, Cycles forwardRequestTime, Cycles firstResponseTime, bool success, bool isRegion)
Definition: GPUCoalescer.cc:1203

GPUCoalescer::insertKernel
void insertKernel(int wavefront_id, PacketPtr pkt)
Definition: GPUCoalescer.cc:294

GPUCoalescer::atomicCallback
void atomicCallback(Addr address, MachineType mach, const DataBlock &data)
Definition: GPUCoalescer.cc:1073

GPUCoalescer::CP_TCCStHits
Stats::Scalar CP_TCCStHits
Definition: GPUCoalescer.hh:344

RequestDesc::RequestDesc
RequestDesc(PacketPtr pkt, RubyRequestType p_type, RubyRequestType s_type)
Definition: GPUCoalescer.hh:79

GPUCoalescer::GPU_TCPStHits
Stats::Scalar GPU_TCPStHits
Definition: GPUCoalescer.hh:332

Consumer.hh

GPUCoalescer::m_deadlock_threshold
int m_deadlock_threshold
Definition: GPUCoalescer.hh:274

Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition: types.hh:83

GPUCoalescer::m_missLatencyHist
Stats::Histogram m_missLatencyHist
Histogram for holding latency profile of all requests that miss in the controller connected to this s...
Definition: GPUCoalescer.hh:356

GPUCoalescer::GPUCoalescerWakeupEvent::GPUCoalescerWakeupEvent
GPUCoalescerWakeupEvent(GPUCoalescer *_seq)
Definition: GPUCoalescer.hh:314

GPUCoalescer::m_ForwardToFirstResponseDelayHist
std::vector< Stats::Histogram * > m_ForwardToFirstResponseDelayHist
Definition: GPUCoalescer.hh:367

GPUCoalescer::operator=
GPUCoalescer & operator=(const GPUCoalescer &obj)

GPUCoalescerRequest::m_type
RubyRequestType m_type
Definition: GPUCoalescer.hh:67

GPUCoalescer::reqCoalescer
CoalescingTable reqCoalescer
Definition: GPUCoalescer.hh:289

GPUCoalescer::issueRequest
virtual void issueRequest(PacketPtr pkt, RubyRequestType type)
Definition: GPUCoalescer.cc:873

GPUCoalescer::GPUCoalescer
GPUCoalescer(const Params *)
Definition: GPUCoalescer.cc:118

GPUCoalescer::m_readRequestTable
RequestTable m_readRequestTable
Definition: GPUCoalescer.hh:294

request.hh
Declaration of a request, the overall memory request consisting of the parts of the request that are ...

GPUCoalescer::GPU_TCPLdHits
Stats::Scalar GPU_TCPLdHits
Definition: GPUCoalescer.hh:327

GPUCoalescer::CP_StMiss
Stats::Scalar CP_StMiss
Definition: GPUCoalescer.hh:345

addr
ip6_addr_t addr
Definition: inet.hh:335

GPUCoalescer::GPU_TCCStHits
Stats::Scalar GPU_TCCStHits
Definition: GPUCoalescer.hh:334

Event::scheduled
bool scheduled() const
Determine if the current event is scheduled.
Definition: eventq.hh:381

GPUCoalescer::recordCPWriteCallBack
void recordCPWriteCallBack(MachineID myMachID, MachineID senderMachID)
Definition: GPUCoalescer.cc:1162

GPUCoalescer::kernelCallback
void kernelCallback(int wavfront_id)
Definition: GPUCoalescer.cc:1063

GPUCoalescer::getMissTypeLatencyHist
Stats::Histogram & getMissTypeLatencyHist(uint32_t t)
Definition: GPUCoalescer.hh:199

GPUCoalescer::CP_LdMiss
Stats::Scalar CP_LdMiss
Definition: GPUCoalescer.hh:340

GPUCoalescer::GPU_TCPLdTransfers
Stats::Scalar GPU_TCPLdTransfers
Definition: GPUCoalescer.hh:328

GPUCoalescer::getRequestStatus
RequestStatus getRequestStatus(PacketPtr pkt, RubyRequestType request_type)
Definition: GPUCoalescer.cc:234

GPUCoalescer::~GPUCoalescer
~GPUCoalescer()
Definition: GPUCoalescer.cc:149

GPUCoalescer::GPUCoalescerWakeupEvent::description
const char * description() const
Return a C string describing the event.
Definition: GPUCoalescer.hh:317

GPUCoalescer::CP_TCPLdTransfers
Stats::Scalar CP_TCPLdTransfers
Definition: GPUCoalescer.hh:338

GPUCoalescer::makeRequest
virtual RequestStatus makeRequest(PacketPtr pkt)
Definition: GPUCoalescer.cc:695

GPUCoalescer::m_missMachLatencyHist
std::vector< Stats::Histogram * > m_missMachLatencyHist
Histograms for profiling the latencies for requests that required external messages.
Definition: GPUCoalescer.hh:361

GPUCoalescer::m_max_outstanding_requests
int m_max_outstanding_requests
Definition: GPUCoalescer.hh:273

GPUCoalescer::wakeup
void wakeup()
Definition: GPUCoalescer.cc:154

GPUCoalescer::m_latencyHist
Stats::Histogram m_latencyHist
Histogram for holding latency profile of all requests.
Definition: GPUCoalescer.hh:351

GPUCoalescer::tryCacheAccess
bool tryCacheAccess(Addr addr, RubyRequestType type, Addr pc, RubyAccessMode access_mode, int size, DataBlock *&data_ptr)

operator<<
std::ostream & operator<<(std::ostream &out, const GPUCoalescerRequest &obj)

DataBlock
Definition: DataBlock.hh:40

GPUCoalescer::RequestTable
std::unordered_map< Addr, GPUCoalescerRequest * > RequestTable
Definition: GPUCoalescer.hh:292

GPUCoalescer::completeIssue
void completeIssue()
Definition: GPUCoalescer.cc:1006

statistics.hh
Declaration of Statistics objects.

GPUCoalescer::IssueEvent::IssueEvent
IssueEvent(GPUCoalescer *_seq)
Definition: GPUCoalescer.cc:999

Stats::Scalar
This is a simple scalar statistic, like a counter.
Definition: statistics.hh:2475

GPUCoalescer::getForwardRequestToFirstResponseHist
Stats::Histogram & getForwardRequestToFirstResponseHist(const MachineType t) const
Definition: GPUCoalescer.hh:217

GPUCoalescer::IssueEvent
Definition: GPUCoalescer.hh:258

GPUCoalescer::descheduleDeadlockEvent
void descheduleDeadlockEvent()
Definition: GPUCoalescer.hh:173

std::vector
STL vector class.
Definition: stl.hh:40

EventManager::deschedule
void deschedule(Event &event)
Definition: eventq.hh:734

Request
Definition: request.hh:87

GPUCoalescer::CP_TCPStTransfers
Stats::Scalar CP_TCPStTransfers
Definition: GPUCoalescer.hh:343

data
const char data[]
Definition: circlebuf.cc:43

GPUCoalescer::empty
bool empty() const
Definition: GPUCoalescer.cc:680

GPUCoalescer::Params
RubyGPUCoalescerParams Params
Definition: GPUCoalescer.hh:99

GPUCoalescer::GPUCoalescerWakeupEvent
Definition: GPUCoalescer.hh:308

GPUCoalescer::IssueEvent::description
const char * description() const
Return a C string describing the event.
Definition: GPUCoalescer.cc:1051

GPUCoalescer::CoalescingTable
std::unordered_map< Addr, std::vector< RequestDesc > > CoalescingTable
Definition: GPUCoalescer.hh:288

reqSegmentToHSASegment
HSASegment reqSegmentToHSASegment(Request *req)
Definition: GPUCoalescer.cc:93

GPUCoalescer::markRemoved
void markRemoved()
Definition: GPUCoalescer.cc:381

GPUCoalescer::isDeadlockEventScheduled
bool isDeadlockEventScheduled() const
Definition: GPUCoalescer.hh:167

GPUCoalescer
Definition: GPUCoalescer.hh:96

GPUCoalescer::GPU_LdMiss
Stats::Scalar GPU_LdMiss
Definition: GPUCoalescer.hh:330

GPUCoalescer::m_dataCache_ptr
CacheMemory * m_dataCache_ptr
Definition: GPUCoalescer.hh:276

GPUCoalescer::IssueEvent::seq
GPUCoalescer * seq
Definition: GPUCoalescer.hh:261

GPUCoalescer::readCallback
void readCallback(Addr address, DataBlock &data)
Definition: GPUCoalescer.cc:537

GPUCoalescer::insertRequest
bool insertRequest(PacketPtr pkt, RubyRequestType request_type)
Definition: GPUCoalescer.cc:311

RequestDesc::primaryType
RubyRequestType primaryType
Definition: GPUCoalescer.hh:90

GPUCoalescer::collateStats
void collateStats()

GPUCoalescer::writeCallback
void writeCallback(Addr address, DataBlock &data)
Definition: GPUCoalescer.cc:455

GPUCoalescer::assumingRfOCoherence
bool assumingRfOCoherence
Definition: GPUCoalescer.hh:324

GPUCoalescer::newRequests
std::vector< Addr > newRequests
Definition: GPUCoalescer.hh:290

GPUCoalescer::GPU_TCCLdHits
Stats::Scalar GPU_TCCLdHits
Definition: GPUCoalescer.hh:329

GPUCoalescer::getIssueToInitialDelayHist
Stats::Histogram & getIssueToInitialDelayHist(uint32_t t) const
Definition: GPUCoalescer.hh:209

GPUCoalescer::m_store_waiting_on_load_cycles
int m_store_waiting_on_load_cycles
Definition: GPUCoalescer.hh:301

GPUCoalescer::GPUCoalescerWakeupEvent::process
void process()
Definition: GPUCoalescer.hh:316

GPUCoalescerRequest::pkt
PacketPtr pkt
Definition: GPUCoalescer.hh:66

Stats::Histogram
A simple histogram stat.
Definition: statistics.hh:2551

GPUCoalescer::m_outstandReqHist
Stats::Histogram m_outstandReqHist
Histogram for number of outstanding requests per cycle.
Definition: GPUCoalescer.hh:348

GPUCoalescer::m_missTypeMachLatencyHist
std::vector< std::vector< Stats::Histogram * > > m_missTypeMachLatencyHist
Definition: GPUCoalescer.hh:362

GPUCoalescer::deadlockCheckEvent
GPUCoalescerWakeupEvent deadlockCheckEvent
Definition: GPUCoalescer.hh:323

MipsISA::r
r
Definition: pra_constants.hh:97

MemObject::Params
MemObjectParams Params
Definition: mem_object.hh:63

GPUCoalescer::completeHitCallback
void completeHitCallback(std::vector< PacketPtr > &mylist, int len)
Definition: GPUCoalescer.cc:1176

GPUCoalescer::recordRequestType
void recordRequestType(SequencerRequestType requestType)
Definition: GPUCoalescer.cc:994

Address.hh

GPUCoalescer::m_InitialToForwardDelayHist
std::vector< Stats::Histogram * > m_InitialToForwardDelayHist
Definition: GPUCoalescer.hh:366

GPUCoalescer::checkCoherence
void checkCoherence(Addr address)
Definition: GPUCoalescer.cc:986

Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition: types.hh:142

GPUCoalescer::getInitialToForwardDelayHist
Stats::Histogram & getInitialToForwardDelayHist(const MachineType t) const
Definition: GPUCoalescer.hh:213

reqScopeToHSAScope
HSAScope reqScopeToHSAScope(Request *req)
Definition: GPUCoalescer.cc:73

GPUCoalescer::m_load_waiting_on_load_cycles
int m_load_waiting_on_load_cycles
Definition: GPUCoalescer.hh:304

Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e...
Definition: packet.hh:245

GPUCoalescer::hitCallback
void hitCallback(GPUCoalescerRequest *request, MachineType mach, DataBlock &data, bool success, Cycles initialRequestTime, Cycles forwardRequestTime, Cycles firstResponseTime, bool isRegion)
Definition: GPUCoalescer.cc:593

GPUCoalescer::kernelEndList
std::unordered_map< int, PacketPtr > kernelEndList
Definition: GPUCoalescer.hh:298

GPUCoalescer::getMissTypeMachLatencyHist
Stats::Histogram & getMissTypeMachLatencyHist(uint32_t r, uint32_t t) const
Definition: GPUCoalescer.hh:206

Sequencer.hh

GPUCoalescer::GPU_StMiss
Stats::Scalar GPU_StMiss
Definition: GPUCoalescer.hh:335

GPUCoalescer::m_IssueToInitialDelayHist
std::vector< Stats::Histogram * > m_IssueToInitialDelayHist
Histograms for recording the breakdown of miss latency.
Definition: GPUCoalescer.hh:365

GPUCoalescer::getOutstandReqHist
Stats::Histogram & getOutstandReqHist()
Definition: GPUCoalescer.hh:191

GPUCoalescer::CP_TCPLdHits
Stats::Scalar CP_TCPLdHits
Definition: GPUCoalescer.hh:337

GPUCoalescer::outstandingCount
int outstandingCount() const
Definition: GPUCoalescer.hh:164

RequestDesc::RequestDesc
RequestDesc()
Definition: GPUCoalescer.hh:84

CacheMemory
Definition: CacheMemory.hh:50

GPUCoalescer::regStats
void regStats()
Register statistics for this object.
Definition: GPUCoalescer.cc:1281

GPUCoalescer::m_typeLatencyHist
std::vector< Stats::Histogram * > m_typeLatencyHist
Definition: GPUCoalescer.hh:352

GPUCoalescer::recordCPReadCallBack
void recordCPReadCallBack(MachineID myMachID, MachineID senderMachID)
Definition: GPUCoalescer.cc:1148

GPUCoalescer::getFirstResponseToCompletionDelayHist
Stats::Histogram & getFirstResponseToCompletionDelayHist(const MachineType t) const
Definition: GPUCoalescer.hh:221

GPUCoalescer::getMissLatencyHist
Stats::Histogram & getMissLatencyHist()
Definition: GPUCoalescer.hh:197

GPUCoalescer::getTypeLatencyHist
Stats::Histogram & getTypeLatencyHist(uint32_t t)
Definition: GPUCoalescer.hh:194

X86ISA::type
type
Definition: misc.hh:728

X86ISA::size
int size()
Definition: pagetable.hh:146

GPUCoalescer::mapAddrToPkt
PacketPtr mapAddrToPkt(Addr address)
Definition: GPUCoalescer.cc:1194

GPUCoalescer::newKernelEnds
std::vector< int > newKernelEnds
Definition: GPUCoalescer.hh:299

GPUCoalescer::removeRequest
void removeRequest(GPUCoalescerRequest *request)
Definition: GPUCoalescer.cc:389

GPUCoalescerRequest::GPUCoalescerRequest
GPUCoalescerRequest(PacketPtr _pkt, RubyRequestType _m_type, Cycles _issue_time)
Definition: GPUCoalescer.hh:70

RequestDesc::secondaryType
RubyRequestType secondaryType
Definition: GPUCoalescer.hh:91

GPUCoalescer::print
void print(std::ostream &out) const
Definition: GPUCoalescer.cc:973

Event
Definition: eventq.hh:185

GPUCoalescer::CP_TCPStHits
Stats::Scalar CP_TCPStHits
Definition: GPUCoalescer.hh:342

GPUCoalescer::m_load_waiting_on_store_cycles
int m_load_waiting_on_store_cycles
Definition: GPUCoalescer.hh:303

GPUCoalescer::m_writeRequestTable
RequestTable m_writeRequestTable
Definition: GPUCoalescer.hh:293

ArmISA::len
Bitfield< 18, 16 > len
Definition: miscregs.hh:1626

GPUCoalescer::issueEvent
IssueEvent issueEvent
Definition: GPUCoalescer.hh:268

GPUCoalescer::m_instCache_ptr
CacheMemory * m_instCache_ptr
Definition: GPUCoalescer.hh:277

GPUCoalescer::resetStats
void resetStats()
Reset statistics associated with this object.
Definition: GPUCoalescer.cc:206

RequestDesc::pkt
PacketPtr pkt
Definition: GPUCoalescer.hh:89

GPUCoalescer::m_outstanding_count
int m_outstanding_count
Definition: GPUCoalescer.hh:296

GPUCoalescer::IssueEvent::process
void process()
Definition: GPUCoalescer.cc:1045

GPUCoalescer::m_data_cache_hit_latency
Cycles m_data_cache_hit_latency
Definition: GPUCoalescer.hh:282

GPUCoalescer::handleLlsc
bool handleLlsc(Addr address, GPUCoalescerRequest *request)
Definition: GPUCoalescer.cc:411

pc
IntReg pc
Definition: remote_gdb.hh:91

GPUCoalescer::GPUCoalescerWakeupEvent::m_GPUCoalescer_ptr
GPUCoalescer * m_GPUCoalescer_ptr
Definition: GPUCoalescer.hh:311

GPUCoalescer::printProgress
void printProgress(std::ostream &out) const
Definition: GPUCoalescer.cc:229

MachineID
Definition: MachineID.hh:38

ArmISA::t
Bitfield< 5 > t
Definition: miscregs.hh:1382

GPUCoalescer::getMissMachLatencyHist
Stats::Histogram & getMissMachLatencyHist(uint32_t t) const
Definition: GPUCoalescer.hh:202

GPUCoalescer::m_runningGarnetStandalone
bool m_runningGarnetStandalone
Definition: GPUCoalescer.hh:306

GPUCoalescer::m_FirstResponseToCompletionDelayHist
std::vector< Stats::Histogram * > m_FirstResponseToCompletionDelayHist
Definition: GPUCoalescer.hh:368

GPUCoalescer::m_missTypeLatencyHist
std::vector< Stats::Histogram * > m_missTypeLatencyHist
Definition: GPUCoalescer.hh:357

GPUCoalescer::m_store_waiting_on_store_cycles
int m_store_waiting_on_store_cycles
Definition: GPUCoalescer.hh:302

RubyPort
Definition: RubyPort.hh:57

GPUCoalescer::evictionCallback
void evictionCallback(Addr address)
Definition: GPUCoalescer.cc:1057

GPUCoalescerRequest::issue_time
Cycles issue_time
Definition: GPUCoalescer.hh:68

GPUCoalescer::GPU_TCPStTransfers
Stats::Scalar GPU_TCPStTransfers
Definition: GPUCoalescer.hh:333

RequestDesc
Definition: GPUCoalescer.hh:76

GPUCoalescer::m_deadlock_check_scheduled
bool m_deadlock_check_scheduled
Definition: GPUCoalescer.hh:297

GPUCoalescer::CP_TCCLdHits
Stats::Scalar CP_TCCLdHits
Definition: GPUCoalescer.hh:339

GPUCoalescerRequest
Definition: GPUCoalescer.hh:64