mem: Split the hit_latency into tag_latency and data_latency
If the cache access mode is parallel, i.e. the "sequential_access" parameter is set to "False", tags and data are accessed in parallel. Therefore, the hit_latency is the maximum of the tag_latency and the data_latency. On the other hand, if the cache access mode is sequential, i.e. the "sequential_access" parameter is set to "True", tags and data are accessed sequentially. Therefore, the hit_latency is the sum of the tag_latency and the data_latency. Signed-off-by: Jason Lowe-Power <jason@lowepower.com>
This commit is contained in:
@@ -48,7 +48,8 @@ from m5.objects import *
|
||||
|
||||
class L1Cache(Cache):
|
||||
assoc = 2
|
||||
hit_latency = 2
|
||||
tag_latency = 2
|
||||
data_latency = 2
|
||||
response_latency = 2
|
||||
mshrs = 4
|
||||
tgts_per_mshr = 20
|
||||
@@ -63,7 +64,8 @@ class L1_DCache(L1Cache):
|
||||
|
||||
class L2Cache(Cache):
|
||||
assoc = 8
|
||||
hit_latency = 20
|
||||
tag_latency = 20
|
||||
data_latency = 20
|
||||
response_latency = 20
|
||||
mshrs = 20
|
||||
tgts_per_mshr = 12
|
||||
@@ -71,7 +73,8 @@ class L2Cache(Cache):
|
||||
|
||||
class IOCache(Cache):
|
||||
assoc = 8
|
||||
hit_latency = 50
|
||||
tag_latency = 50
|
||||
data_latency = 50
|
||||
response_latency = 50
|
||||
mshrs = 20
|
||||
size = '1kB'
|
||||
@@ -79,7 +82,8 @@ class IOCache(Cache):
|
||||
|
||||
class PageTableWalkerCache(Cache):
|
||||
assoc = 2
|
||||
hit_latency = 2
|
||||
tag_latency = 2
|
||||
data_latency = 2
|
||||
response_latency = 2
|
||||
mshrs = 10
|
||||
size = '1kB'
|
||||
|
||||
@@ -147,7 +147,8 @@ class O3_ARM_v7a_3(DerivO3CPU):
|
||||
|
||||
# Instruction Cache
|
||||
class O3_ARM_v7a_ICache(Cache):
|
||||
hit_latency = 1
|
||||
tag_latency = 1
|
||||
data_latency = 1
|
||||
response_latency = 1
|
||||
mshrs = 2
|
||||
tgts_per_mshr = 8
|
||||
@@ -159,7 +160,8 @@ class O3_ARM_v7a_ICache(Cache):
|
||||
|
||||
# Data Cache
|
||||
class O3_ARM_v7a_DCache(Cache):
|
||||
hit_latency = 2
|
||||
tag_latency = 2
|
||||
data_latency = 2
|
||||
response_latency = 2
|
||||
mshrs = 6
|
||||
tgts_per_mshr = 8
|
||||
@@ -172,7 +174,8 @@ class O3_ARM_v7a_DCache(Cache):
|
||||
# TLB Cache
|
||||
# Use a cache as a L2 TLB
|
||||
class O3_ARM_v7aWalkCache(Cache):
|
||||
hit_latency = 4
|
||||
tag_latency = 4
|
||||
data_latency = 4
|
||||
response_latency = 4
|
||||
mshrs = 6
|
||||
tgts_per_mshr = 8
|
||||
@@ -185,7 +188,8 @@ class O3_ARM_v7aWalkCache(Cache):
|
||||
|
||||
# L2 Cache
|
||||
class O3_ARM_v7aL2(Cache):
|
||||
hit_latency = 12
|
||||
tag_latency = 12
|
||||
data_latency = 12
|
||||
response_latency = 12
|
||||
mshrs = 16
|
||||
tgts_per_mshr = 8
|
||||
|
||||
@@ -45,7 +45,8 @@ from common.Caches import *
|
||||
from common import CpuConfig
|
||||
|
||||
class L1I(L1_ICache):
|
||||
hit_latency = 1
|
||||
tag_latency = 1
|
||||
data_latency = 1
|
||||
response_latency = 1
|
||||
mshrs = 4
|
||||
tgts_per_mshr = 8
|
||||
@@ -54,7 +55,8 @@ class L1I(L1_ICache):
|
||||
|
||||
|
||||
class L1D(L1_DCache):
|
||||
hit_latency = 2
|
||||
tag_latency = 2
|
||||
data_latency = 2
|
||||
response_latency = 1
|
||||
mshrs = 16
|
||||
tgts_per_mshr = 16
|
||||
@@ -64,7 +66,8 @@ class L1D(L1_DCache):
|
||||
|
||||
|
||||
class WalkCache(PageTableWalkerCache):
|
||||
hit_latency = 4
|
||||
tag_latency = 4
|
||||
data_latency = 4
|
||||
response_latency = 4
|
||||
mshrs = 6
|
||||
tgts_per_mshr = 8
|
||||
@@ -74,7 +77,8 @@ class WalkCache(PageTableWalkerCache):
|
||||
|
||||
|
||||
class L2(L2Cache):
|
||||
hit_latency = 12
|
||||
tag_latency = 12
|
||||
data_latency = 12
|
||||
response_latency = 5
|
||||
mshrs = 32
|
||||
tgts_per_mshr = 8
|
||||
@@ -87,7 +91,8 @@ class L2(L2Cache):
|
||||
class L3(Cache):
|
||||
size = '16MB'
|
||||
assoc = 16
|
||||
hit_latency = 20
|
||||
tag_latency = 20
|
||||
data_latency = 20
|
||||
response_latency = 20
|
||||
mshrs = 20
|
||||
tgts_per_mshr = 12
|
||||
|
||||
@@ -153,7 +153,7 @@ for t, m in zip(testerspec, multiplier):
|
||||
|
||||
# Define a prototype L1 cache that we scale for all successive levels
|
||||
proto_l1 = Cache(size = '32kB', assoc = 4,
|
||||
hit_latency = 1, response_latency = 1,
|
||||
tag_latency = 1, data_latency = 1, response_latency = 1,
|
||||
tgts_per_mshr = 8)
|
||||
|
||||
if options.blocking:
|
||||
@@ -175,7 +175,8 @@ for scale in cachespec[:-1]:
|
||||
prev = cache_proto[0]
|
||||
next = prev()
|
||||
next.size = prev.size * scale
|
||||
next.hit_latency = prev.hit_latency * 10
|
||||
next.tag_latency = prev.tag_latency * 10
|
||||
next.data_latency = prev.data_latency * 10
|
||||
next.response_latency = prev.response_latency * 10
|
||||
next.assoc = prev.assoc * scale
|
||||
next.mshrs = prev.mshrs * scale
|
||||
|
||||
@@ -176,7 +176,7 @@ else:
|
||||
|
||||
# Define a prototype L1 cache that we scale for all successive levels
|
||||
proto_l1 = Cache(size = '32kB', assoc = 4,
|
||||
hit_latency = 1, response_latency = 1,
|
||||
tag_latency = 1, data_latency = 1, response_latency = 1,
|
||||
tgts_per_mshr = 8, clusivity = 'mostly_incl',
|
||||
writeback_clean = True)
|
||||
|
||||
@@ -194,7 +194,8 @@ for scale in cachespec[:-1]:
|
||||
prev = cache_proto[0]
|
||||
next = prev()
|
||||
next.size = prev.size * scale
|
||||
next.hit_latency = prev.hit_latency * 10
|
||||
next.tag_latency = prev.tag_latency * 10
|
||||
next.data_latency = prev.data_latency * 10
|
||||
next.response_latency = prev.response_latency * 10
|
||||
next.assoc = prev.assoc * scale
|
||||
next.mshrs = prev.mshrs * scale
|
||||
|
||||
@@ -45,7 +45,8 @@ class L1Cache(Cache):
|
||||
"""Simple L1 Cache with default values"""
|
||||
|
||||
assoc = 2
|
||||
hit_latency = 2
|
||||
tag_latency = 2
|
||||
data_latency = 2
|
||||
response_latency = 2
|
||||
mshrs = 4
|
||||
tgts_per_mshr = 20
|
||||
@@ -107,7 +108,8 @@ class L2Cache(Cache):
|
||||
# Default parameters
|
||||
size = '256kB'
|
||||
assoc = 8
|
||||
hit_latency = 20
|
||||
tag_latency = 20
|
||||
data_latency = 20
|
||||
response_latency = 20
|
||||
mshrs = 20
|
||||
tgts_per_mshr = 12
|
||||
|
||||
Reference in New Issue
Block a user