| # Copyright (c) 2018-2020 Inria |
| # All rights reserved. |
| # |
| # Redistribution and use in source and binary forms, with or without |
| # modification, are permitted provided that the following conditions are |
| # met: redistributions of source code must retain the above copyright |
| # notice, this list of conditions and the following disclaimer; |
| # redistributions in binary form must reproduce the above copyright |
| # notice, this list of conditions and the following disclaimer in the |
| # documentation and/or other materials provided with the distribution; |
| # neither the name of the copyright holders nor the names of its |
| # contributors may be used to endorse or promote products derived from |
| # this software without specific prior written permission. |
| # |
| # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| from m5.params import * |
| from m5.proxy import * |
| from m5.SimObject import * |
| |
| from m5.objects.IndexingPolicies import * |
| from m5.objects.ReplacementPolicies import * |
| |
class BaseCacheCompressor(SimObject):
    # Abstract root of the cache compressor hierarchy. It declares the
    # block/chunk geometry, the compression threshold and the latency
    # parameters that the derived compressors inherit or override.
    type = "BaseCacheCompressor"
    abstract = True
    cxx_class = "gem5::compression::Base"
    cxx_header = "mem/cache/compressors/base.hh"

    # The block size defaults to the cache_line_size resolved via Parent
    block_size = Param.Int(
        Parent.cache_line_size,
        "Block size in bytes",
    )
    chunk_size_bits = Param.Unsigned(
        32,
        "Size of a parsing data chunk (in bits)",
    )
    size_threshold_percentage = Param.Percent(
        50,
        "Minimum percentage of the block size, a compressed block "
        "must achieve to be stored in compressed format",
    )

    # Compression timing: per-cycle parallelism plus a fixed extra latency
    comp_chunks_per_cycle = Param.Unsigned(
        1,
        "Number of chunks that can be compressed in parallel per cycle.",
    )
    comp_extra_latency = Param.Cycles(
        1,
        "Number of extra cycles required to finish compression "
        "(e.g., due to shifting and packaging).",
    )

    # Decompression timing, mirroring the compression parameters
    decomp_chunks_per_cycle = Param.Unsigned(
        1,
        "Number of chunks that can be decompressed in parallel per cycle.",
    )
    decomp_extra_latency = Param.Cycles(
        1,
        "Number of extra cycles required to finish decompression "
        "(e.g., due to shifting and packaging).",
    )
| |
class BaseDictionaryCompressor(BaseCacheCompressor):
    # Abstract base for the dictionary-based compressors; it adds the
    # dictionary size on top of the common compressor parameters.
    type = "BaseDictionaryCompressor"
    abstract = True
    cxx_class = "gem5::compression::BaseDictionaryCompressor"
    cxx_header = "mem/cache/compressors/dictionary_compressor.hh"

    # The default number of entries is taken from the parent's
    # cache_line_size
    dictionary_size = Param.Int(
        Parent.cache_line_size,
        "Number of dictionary entries",
    )
| |
class Base64Delta8(BaseDictionaryCompressor):
    type = "Base64Delta8"
    cxx_class = "gem5::compression::Base64Delta8"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class Base64Delta16(BaseDictionaryCompressor):
    type = "Base64Delta16"
    cxx_class = "gem5::compression::Base64Delta16"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class Base64Delta32(BaseDictionaryCompressor):
    type = "Base64Delta32"
    cxx_class = "gem5::compression::Base64Delta32"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class Base32Delta8(BaseDictionaryCompressor):
    type = "Base32Delta8"
    cxx_class = "gem5::compression::Base32Delta8"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 32-bit chunks
    chunk_size_bits = 32

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class Base32Delta16(BaseDictionaryCompressor):
    type = "Base32Delta16"
    cxx_class = "gem5::compression::Base32Delta16"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 32-bit chunks
    chunk_size_bits = 32

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class Base16Delta8(BaseDictionaryCompressor):
    type = "Base16Delta8"
    cxx_class = "gem5::compression::Base16Delta8"
    cxx_header = "mem/cache/compressors/base_delta.hh"

    # Data is parsed in 16-bit chunks
    chunk_size_bits = 16

    # Base-delta compressors achieve 1-cycle latencies: block_size is in
    # bytes, so (8 * block_size) / chunk_size_bits is the number of chunks
    # in a whole block; all of them are handled per cycle, with no extra
    # latency.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class CPack(BaseDictionaryCompressor):
    type = "CPack"
    cxx_class = "gem5::compression::CPack"
    cxx_header = "mem/cache/compressors/cpack.hh"

    # Two chunks are compressed per cycle
    comp_chunks_per_cycle = 2
    # The extra compression latency accounts for pattern matching, length
    # generation, packaging and shifting
    comp_extra_latency = 5

    # Two chunks are decompressed per cycle, plus one extra cycle
    decomp_chunks_per_cycle = 2
    decomp_extra_latency = 1
| |
class FPC(BaseDictionaryCompressor):
    type = "FPC"
    cxx_class = "gem5::compression::FPC"
    cxx_header = "mem/cache/compressors/fpc.hh"

    # Compression handles 8 chunks per cycle, decompression 4; each
    # direction pays one extra cycle
    comp_chunks_per_cycle = 8
    comp_extra_latency = 1
    decomp_chunks_per_cycle = 4
    decomp_extra_latency = 1

    # FPC has no dictionary, so a dummy dictionary size is used
    dictionary_size = 1

    zero_run_bits = Param.Int(
        3,
        "Number of bits of the zero run bit field",
    )
| |
class FPCD(BaseDictionaryCompressor):
    type = "FPCD"
    cxx_class = "gem5::compression::FPCD"
    cxx_header = "mem/cache/compressors/fpcd.hh"

    # The latencies account for checking all patterns, selecting patterns,
    # and shifting. The original claim of a decompression latency of
    # 2 cycles would likely generate an unrealistically complex circuit.
    comp_chunks_per_cycle = 4
    comp_extra_latency = 1
    decomp_chunks_per_cycle = 4
    decomp_extra_latency = 0

    # Two dictionary entries
    dictionary_size = 2
| |
class FrequentValuesCompressor(BaseCacheCompressor):
    type = "FrequentValuesCompressor"
    cxx_class = "gem5::compression::FrequentValues"
    cxx_header = "mem/cache/compressors/frequent_values.hh"

    # Data is parsed in 32-bit chunks
    chunk_size_bits = 32

    code_generation_ticks = Param.Unsigned(
        10000,
        "Number of elapsed ticks until the samples are analyzed and "
        "their codes are generated.",
    )
    # @todo The width of a counter is determined by the maximum number of
    # times a given value appears in the cache - i.e.,
    # log2(cache_size / chunk_size_bits).
    counter_bits = Param.Unsigned(
        18,
        "Number of bits per frequency counter.",
    )
    max_code_length = Param.Unsigned(
        18,
        "Maximum number of bits in a codeword. "
        "If 0, table indices are not encoded.",
    )
    num_samples = Param.Unsigned(
        100000,
        "Number of samples that must be taken before compression is "
        "effectively used.",
    )
    check_saturation = Param.Bool(
        False,
        "Whether the counters should be manipulated in case of "
        "saturation.",
    )

    # VFT organization. The default indexing policy is set-associative
    # and picks its associativity and size up from the two VFT
    # parameters declared right above it.
    vft_assoc = Param.Int(16, "Associativity of the VFT.")
    vft_entries = Param.MemorySize("1024", "Number of entries of the VFT.")
    vft_indexing_policy = Param.BaseIndexingPolicy(
        SetAssociative(
            entry_size=1,
            assoc=Parent.vft_assoc,
            size=Parent.vft_entries,
        ),
        "Indexing policy of the VFT.",
    )
    vft_replacement_policy = Param.BaseReplacementPolicy(
        LFURP(),
        "Replacement policy of the VFT.",
    )

    # One chunk per cycle in both directions; only compression pays an
    # extra cycle
    comp_chunks_per_cycle = 1
    comp_extra_latency = 1
    decomp_chunks_per_cycle = 1
    decomp_extra_latency = 0
| |
class MultiCompressor(BaseCacheCompressor):
    type = "MultiCompressor"
    cxx_class = "gem5::compression::Multi"
    cxx_header = "mem/cache/compressors/multi.hh"

    # Dummy default compressor list. This might not be an optimal choice,
    # since these compressors have many overlapping patterns.
    compressors = VectorParam.BaseCacheCompressor(
        [CPack(), FPCD()],
        "Array of compressors",
    )
    encoding_in_tags = Param.Bool(
        False,
        "If set the bits to inform which sub-compressor compressed some "
        "data are added to its corresponding tag entry.",
    )

    # Use the sub-compressors' latencies
    comp_chunks_per_cycle = 0
    decomp_chunks_per_cycle = 0

    # Assume 1 extra cycle to select the results of the winning
    # sub-compressor
    comp_extra_latency = 1

    # Multi-compressors may need a couple of extra cycles to select which
    # sub-compressor should be used to decompress the data
    decomp_extra_latency = 1
| |
class PerfectCompressor(BaseCacheCompressor):
    type = "PerfectCompressor"
    cxx_class = "gem5::compression::Perfect"
    cxx_header = "mem/cache/compressors/perfect.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Declared without a default value
    max_compression_ratio = Param.Int(
        "Maximum compression ratio allowed",
    )

    # In a perfect world compression and decompression happen in 1 cycle:
    # block_size is in bytes, so (8 * block_size) / chunk_size_bits is the
    # number of chunks in a whole block.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class RepeatedQwordsCompressor(BaseDictionaryCompressor):
    type = "RepeatedQwordsCompressor"
    cxx_class = "gem5::compression::RepeatedQwords"
    cxx_header = "mem/cache/compressors/repeated_qwords.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Assume 1-cycle latencies: block_size is in bytes, so
    # (8 * block_size) / chunk_size_bits is the number of chunks in a
    # whole block, and no extra latency is added.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class ZeroCompressor(BaseDictionaryCompressor):
    type = "ZeroCompressor"
    cxx_class = "gem5::compression::Zero"
    cxx_header = "mem/cache/compressors/zero.hh"

    # Data is parsed in 64-bit chunks
    chunk_size_bits = 64

    # Assume 1-cycle latencies: block_size is in bytes, so
    # (8 * block_size) / chunk_size_bits is the number of chunks in a
    # whole block, and no extra latency is added.
    comp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    comp_extra_latency = 0
    decomp_chunks_per_cycle = (8 * Self.block_size) / Self.chunk_size_bits
    decomp_extra_latency = 0
| |
class BDI(MultiCompressor):
    # A multi-compressor preset: one instance of each sub-compressor
    # below, in this order, every one created with a 99% size threshold.
    compressors = [
        sub_compressor(size_threshold_percentage=99)
        for sub_compressor in (
            ZeroCompressor,
            RepeatedQwordsCompressor,
            Base64Delta8,
            Base64Delta16,
            Base64Delta32,
            Base32Delta8,
            Base32Delta16,
            Base16Delta8,
        )
    ]

    # By default assume that the encoding is stored in the tags, and is
    # retrieved and decoded while (and ends before) the data is being read.
    decomp_extra_latency = 0
    encoding_in_tags = True