| /* |
| * Copyright (c) 2016-2017 Advanced Micro Devices, Inc. |
| * All rights reserved. |
| * |
| * For use for simulation and test purposes only |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions are met: |
| * |
| * 1. Redistributions of source code must retain the above copyright notice, |
| * this list of conditions and the following disclaimer. |
| * |
| * 2. Redistributions in binary form must reproduce the above copyright notice, |
| * this list of conditions and the following disclaimer in the documentation |
| * and/or other materials provided with the distribution. |
| * |
| * 3. Neither the name of the copyright holder nor the names of its |
| * contributors may be used to endorse or promote products derived from this |
| * software without specific prior written permission. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
| * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE |
| * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
| * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
| * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
| * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
| * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| * POSSIBILITY OF SUCH DAMAGE. |
| * |
| * Authors: John Kalamatianos |
| */ |
| |
| #include "gpu-compute/scalar_memory_pipeline.hh" |
| |
| #include "debug/GPUMem.hh" |
| #include "debug/GPUReg.hh" |
| #include "gpu-compute/compute_unit.hh" |
| #include "gpu-compute/gpu_dyn_inst.hh" |
| #include "gpu-compute/scalar_register_file.hh" |
| #include "gpu-compute/shader.hh" |
| #include "gpu-compute/wavefront.hh" |
| |
| ScalarMemPipeline::ScalarMemPipeline(const ComputeUnitParams &p, |
| ComputeUnit &cu) |
| : computeUnit(cu), _name(cu.name() + ".ScalarMemPipeline"), |
| queueSize(p.scalar_mem_queue_size), |
| inflightStores(0), inflightLoads(0) |
| { |
| } |
| |
| void |
| ScalarMemPipeline::exec() |
| { |
| // afind oldest scalar request whose data has arrived |
| GPUDynInstPtr m = !returnedLoads.empty() ? returnedLoads.front() : |
| !returnedStores.empty() ? returnedStores.front() : nullptr; |
| |
| Wavefront *w = nullptr; |
| |
| bool accessSrf = true; |
| // check the SRF to see if the operands of a load (or load component |
| // of an atomic) are accessible |
| if ((m) && (m->isLoad() || m->isAtomicRet())) { |
| w = m->wavefront(); |
| |
| accessSrf = |
| w->computeUnit->srf[w->simdId]-> |
| canScheduleWriteOperandsFromLoad(w, m); |
| } |
| |
| if ((!returnedStores.empty() || !returnedLoads.empty()) && |
| m->latency.rdy() && computeUnit.scalarMemToSrfBus.rdy() && |
| accessSrf && |
| (computeUnit.shader->coissue_return || |
| computeUnit.scalarMemUnit.rdy())) { |
| |
| w = m->wavefront(); |
| |
| if (m->isLoad() || m->isAtomicRet()) { |
| w->computeUnit->srf[w->simdId]-> |
| scheduleWriteOperandsFromLoad(w, m); |
| } |
| |
| m->completeAcc(m); |
| w->decLGKMInstsIssued(); |
| |
| if (m->isLoad() || m->isAtomic()) { |
| returnedLoads.pop(); |
| assert(inflightLoads > 0); |
| --inflightLoads; |
| } else { |
| returnedStores.pop(); |
| assert(inflightStores > 0); |
| --inflightStores; |
| } |
| |
| // Decrement outstanding register count |
| computeUnit.shader->ScheduleAdd(&w->outstandingReqs, m->time, -1); |
| |
| if (m->isStore() || m->isAtomic()) { |
| computeUnit.shader->ScheduleAdd(&w->scalarOutstandingReqsWrGm, |
| m->time, -1); |
| } |
| |
| if (m->isLoad() || m->isAtomic()) { |
| computeUnit.shader->ScheduleAdd(&w->scalarOutstandingReqsRdGm, |
| m->time, -1); |
| } |
| |
| // Mark write bus busy for appropriate amount of time |
| computeUnit.scalarMemToSrfBus.set(m->time); |
| if (!computeUnit.shader->coissue_return) |
| w->computeUnit->scalarMemUnit.set(m->time); |
| } |
| |
| // If pipeline has executed a global memory instruction |
| // execute global memory packets and issue global |
| // memory packets to DTLB |
| if (!issuedRequests.empty()) { |
| GPUDynInstPtr mp = issuedRequests.front(); |
| if (mp->isLoad() || mp->isAtomic()) { |
| |
| if (inflightLoads >= queueSize) { |
| return; |
| } else { |
| ++inflightLoads; |
| } |
| } else { |
| if (inflightStores >= queueSize) { |
| return; |
| } else { |
| ++inflightStores; |
| } |
| } |
| mp->initiateAcc(mp); |
| issuedRequests.pop(); |
| |
| DPRINTF(GPUMem, "CU%d: WF[%d][%d] Popping scalar mem_op\n", |
| computeUnit.cu_id, mp->simdId, mp->wfSlotId); |
| } |
| } |
| |
| void |
| ScalarMemPipeline::regStats() |
| { |
| } |