e553a7bfa7
this patch adds the source for mcpat, a power, area, and timing modeling framework.
1162 lines
66 KiB
C++
1162 lines
66 KiB
C++
/*****************************************************************************
|
|
* McPAT
|
|
* SOFTWARE LICENSE AGREEMENT
|
|
* Copyright 2012 Hewlett-Packard Development Company, L.P.
|
|
* All Rights Reserved
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are
|
|
* met: redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer;
|
|
* redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution;
|
|
* neither the name of the copyright holders nor the names of its
|
|
* contributors may be used to endorse or promote products derived from
|
|
* this software without specific prior written permission.
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.”
|
|
*
|
|
***************************************************************************/
|
|
|
|
#include <algorithm>
|
|
#include <cassert>
|
|
#include <cmath>
|
|
#include <cstring>
|
|
#include <iostream>
|
|
|
|
#include "XML_Parse.h"
|
|
#include "arbiter.h"
|
|
#include "array.h"
|
|
#include "basic_circuit.h"
|
|
#include "const.h"
|
|
#include "io.h"
|
|
#include "logic.h"
|
|
#include "parameter.h"
|
|
#include "sharedcache.h"
|
|
|
|
SharedCache::SharedCache(ParseXML* XML_interface, int ithCache_, InputParameter* interface_ip_, enum cache_level cacheL_)
|
|
:XML(XML_interface),
|
|
ithCache(ithCache_),
|
|
interface_ip(*interface_ip_),
|
|
cacheL(cacheL_),
|
|
dir_overhead(0)
|
|
{
|
|
int idx;
|
|
int tag, data;
|
|
bool is_default, debug;
|
|
enum Device_ty device_t;
|
|
enum Core_type core_t;
|
|
double size, line, assoc, banks;
|
|
if (cacheL==L2 && XML->sys.Private_L2)
|
|
{
|
|
device_t=Core_device;
|
|
core_t = (enum Core_type)XML->sys.core[ithCache].machine_type;
|
|
}
|
|
else
|
|
{
|
|
device_t=LLC_device;
|
|
core_t = Inorder;
|
|
}
|
|
|
|
debug = false;
|
|
is_default=true;//indication for default setup
|
|
if (XML->sys.Embedded)
|
|
{
|
|
interface_ip.wt =Global_30;
|
|
interface_ip.wire_is_mat_type = 0;
|
|
interface_ip.wire_os_mat_type = 1;
|
|
}
|
|
else
|
|
{
|
|
interface_ip.wt =Global;
|
|
interface_ip.wire_is_mat_type = 2;
|
|
interface_ip.wire_os_mat_type = 2;
|
|
}
|
|
set_cache_param();
|
|
|
|
//All lower level cache are physically indexed and tagged.
|
|
size = cachep.capacity;
|
|
line = cachep.blockW;
|
|
assoc = cachep.assoc;
|
|
banks = cachep.nbanks;
|
|
if ((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory))
|
|
{
|
|
assoc = 0;
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
interface_ip.num_search_ports = 1;
|
|
}
|
|
else
|
|
{
|
|
idx = debug?9:int(ceil(log2(size/line/assoc)));
|
|
tag = debug?51:XML->sys.physical_address_width-idx-int(ceil(log2(line))) + EXTRA_TAG_BITS;
|
|
interface_ip.num_search_ports = 0;
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
dir_overhead = ceil(XML->sys.number_of_cores/8.0)*8/(cachep.blockW*8);
|
|
line = cachep.blockW*(1+ dir_overhead) ;
|
|
size = cachep.capacity*(1+ dir_overhead);
|
|
|
|
}
|
|
}
|
|
// if (XML->sys.first_level_dir==2)
|
|
// tag += int(XML->sys.domain_size + 5);
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.cache_sz = (int)size;
|
|
interface_ip.line_sz = (int)line;
|
|
interface_ip.assoc = (int)assoc;
|
|
interface_ip.nbanks = (int)banks;
|
|
interface_ip.out_w = interface_ip.line_sz*8/2;
|
|
interface_ip.access_mode = 1;
|
|
interface_ip.throughput = cachep.throughput;
|
|
interface_ip.latency = cachep.latency;
|
|
interface_ip.is_cache = true;
|
|
interface_ip.pure_ram = false;
|
|
interface_ip.pure_cam = false;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;//lower level cache usually has one port.
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
// interface_ip.force_cache_config =true;
|
|
// interface_ip.ndwl = 4;
|
|
// interface_ip.ndbl = 8;
|
|
// interface_ip.nspd = 1;
|
|
// interface_ip.ndcm =1 ;
|
|
// interface_ip.ndsam1 =1;
|
|
// interface_ip.ndsam2 =1;
|
|
unicache.caches = new ArrayST(&interface_ip, cachep.name + "cache", device_t, true, core_t);
|
|
unicache.area.set_area(unicache.area.get_area()+ unicache.caches->local_result.area);
|
|
area.set_area(area.get_area()+ unicache.caches->local_result.area);
|
|
interface_ip.force_cache_config =false;
|
|
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = (XML->sys.physical_address_width) + int(ceil(log2(size/line))) + unicache.caches->l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = int(ceil(data/8.0));//int(ceil(pow(2.0,ceil(log2(data)))/8.0));
|
|
interface_ip.cache_sz = cachep.missb_size*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.is_cache = true;
|
|
interface_ip.pure_ram = false;
|
|
interface_ip.pure_cam = false;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8/2;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = cachep.throughput;//means cycle time
|
|
interface_ip.latency = cachep.latency;//means access time
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
interface_ip.num_search_ports = 1;
|
|
unicache.missb = new ArrayST(&interface_ip, cachep.name + "MissB", device_t, true, core_t);
|
|
unicache.area.set_area(unicache.area.get_area()+ unicache.missb->local_result.area);
|
|
area.set_area(area.get_area()+ unicache.missb->local_result.area);
|
|
//fill buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = unicache.caches->l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = data*cachep.fu_size ;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8/2;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = cachep.throughput;
|
|
interface_ip.latency = cachep.latency;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
unicache.ifb = new ArrayST(&interface_ip, cachep.name + "FillB", device_t, true, core_t);
|
|
unicache.area.set_area(unicache.area.get_area()+ unicache.ifb->local_result.area);
|
|
area.set_area(area.get_area()+ unicache.ifb->local_result.area);
|
|
//prefetch buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;//check with previous entries to decide wthether to merge.
|
|
data = unicache.caches->l_ip.line_sz;//separate queue to prevent from cache polution.
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = cachep.prefetchb_size*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8/2;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = cachep.throughput;
|
|
interface_ip.latency = cachep.latency;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
unicache.prefetchb = new ArrayST(&interface_ip, cachep.name + "PrefetchB", device_t, true, core_t);
|
|
unicache.area.set_area(unicache.area.get_area()+ unicache.prefetchb->local_result.area);
|
|
area.set_area(area.get_area()+ unicache.prefetchb->local_result.area);
|
|
//WBB
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = unicache.caches->l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;
|
|
interface_ip.cache_sz = cachep.wbb_size*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8/2;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = cachep.throughput;
|
|
interface_ip.latency = cachep.latency;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
unicache.wbb = new ArrayST(&interface_ip, cachep.name + "WBB", device_t, true, core_t);
|
|
unicache.area.set_area(unicache.area.get_area()+ unicache.wbb->local_result.area);
|
|
area.set_area(area.get_area()+ unicache.wbb->local_result.area);
|
|
}
|
|
// //pipeline
|
|
// interface_ip.pipeline_stages = int(ceil(llCache.caches.local_result.access_time/llCache.caches.local_result.cycle_time));
|
|
// interface_ip.per_stage_vector = llCache.caches.l_ip.out_w + llCache.caches.l_ip.tag_w ;
|
|
// pipeLogicCache.init_pipeline(is_default, &interface_ip);
|
|
// pipeLogicCache.compute_pipeline();
|
|
|
|
/*
|
|
if (!((XML->sys.number_of_dir_levels==1 && XML->sys.first_level_dir ==1)
|
|
||(XML->sys.number_of_dir_levels==1 && XML->sys.first_level_dir ==2)))//not single level IC and DIC
|
|
{
|
|
//directory Now assuming one directory per bank, TODO:should change it later
|
|
size = XML->sys.L2directory.L2Dir_config[0];
|
|
line = XML->sys.L2directory.L2Dir_config[1];
|
|
assoc = XML->sys.L2directory.L2Dir_config[2];
|
|
banks = XML->sys.L2directory.L2Dir_config[3];
|
|
tag = debug?51:XML->sys.physical_address_width + EXTRA_TAG_BITS;//TODO: a little bit over estimate
|
|
interface_ip.specific_tag = 0;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.cache_sz = XML->sys.L2directory.L2Dir_config[0];
|
|
interface_ip.line_sz = XML->sys.L2directory.L2Dir_config[1];
|
|
interface_ip.assoc = XML->sys.L2directory.L2Dir_config[2];
|
|
interface_ip.nbanks = XML->sys.L2directory.L2Dir_config[3];
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;//debug?0:XML->sys.core[ithCore].icache.icache_config[5];
|
|
interface_ip.throughput = XML->sys.L2directory.L2Dir_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2directory.L2Dir_config[5]/clockRate;
|
|
interface_ip.is_cache = true;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;//lower level cache usually has one port.
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
|
|
strcpy(directory.caches.name,"L2 Directory");
|
|
directory.caches.init_cache(&interface_ip);
|
|
directory.caches.optimize_array();
|
|
directory.area += directory.caches.local_result.area;
|
|
//output_data_csv(directory.caches.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//miss buffer Each MSHR contains enough state to handle one or more accesses of any type to a single memory line.
|
|
//Due to the generality of the MSHR mechanism, the amount of state involved is non-trivial,
|
|
//including the address, pointers to the cache entry and destination register, written data, and various other pieces of state.
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = (XML->sys.physical_address_width) + int(ceil(log2(size/line))) + directory.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = int(ceil(data/8.0));//int(ceil(pow(2.0,ceil(log2(data)))/8.0));
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[0]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;//means cycle time
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;//means access time
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory.missb.name,"directoryMissB");
|
|
directory.missb.init_cache(&interface_ip);
|
|
directory.missb.optimize_array();
|
|
directory.area += directory.missb.local_result.area;
|
|
//output_data_csv(directory.missb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//fill buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = directory.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = data*XML->sys.L2[ithCache].buffer_sizes[1];
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory.ifb.name,"directoryFillB");
|
|
directory.ifb.init_cache(&interface_ip);
|
|
directory.ifb.optimize_array();
|
|
directory.area += directory.ifb.local_result.area;
|
|
//output_data_csv(directory.ifb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//prefetch buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;//check with previous entries to decide wthether to merge.
|
|
data = directory.caches.l_ip.line_sz;//separate queue to prevent from cache polution.
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[2]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory.prefetchb.name,"directoryPrefetchB");
|
|
directory.prefetchb.init_cache(&interface_ip);
|
|
directory.prefetchb.optimize_array();
|
|
directory.area += directory.prefetchb.local_result.area;
|
|
//output_data_csv(directory.prefetchb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//WBB
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = directory.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[3]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory.wbb.name,"directoryWBB");
|
|
directory.wbb.init_cache(&interface_ip);
|
|
directory.wbb.optimize_array();
|
|
directory.area += directory.wbb.local_result.area;
|
|
}
|
|
|
|
if (XML->sys.number_of_dir_levels ==2 && XML->sys.first_level_dir==0)
|
|
{
|
|
//first level directory
|
|
size = XML->sys.L2directory.L2Dir_config[0]*XML->sys.domain_size/128;
|
|
line = int(ceil(XML->sys.domain_size/8.0));
|
|
assoc = XML->sys.L2directory.L2Dir_config[2];
|
|
banks = XML->sys.L2directory.L2Dir_config[3];
|
|
tag = debug?51:XML->sys.physical_address_width + EXTRA_TAG_BITS;//TODO: a little bit over estimate
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.cache_sz = XML->sys.L2directory.L2Dir_config[0];
|
|
interface_ip.line_sz = XML->sys.L2directory.L2Dir_config[1];
|
|
interface_ip.assoc = XML->sys.L2directory.L2Dir_config[2];
|
|
interface_ip.nbanks = XML->sys.L2directory.L2Dir_config[3];
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;//debug?0:XML->sys.core[ithCore].icache.icache_config[5];
|
|
interface_ip.throughput = XML->sys.L2directory.L2Dir_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2directory.L2Dir_config[5]/clockRate;
|
|
interface_ip.is_cache = true;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;//lower level cache usually has one port.
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
|
|
strcpy(directory1.caches.name,"first level Directory");
|
|
directory1.caches.init_cache(&interface_ip);
|
|
directory1.caches.optimize_array();
|
|
directory1.area += directory1.caches.local_result.area;
|
|
//output_data_csv(directory.caches.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//miss buffer Each MSHR contains enough state to handle one or more accesses of any type to a single memory line.
|
|
//Due to the generality of the MSHR mechanism, the amount of state involved is non-trivial,
|
|
//including the address, pointers to the cache entry and destination register, written data, and various other pieces of state.
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = (XML->sys.physical_address_width) + int(ceil(log2(size/line))) + directory1.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = int(ceil(data/8.0));//int(ceil(pow(2.0,ceil(log2(data)))/8.0));
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[0]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;//means cycle time
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;//means access time
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory1.missb.name,"directory1MissB");
|
|
directory1.missb.init_cache(&interface_ip);
|
|
directory1.missb.optimize_array();
|
|
directory1.area += directory1.missb.local_result.area;
|
|
//output_data_csv(directory.missb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//fill buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = directory1.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = data*XML->sys.L2[ithCache].buffer_sizes[1];
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory1.ifb.name,"directory1FillB");
|
|
directory1.ifb.init_cache(&interface_ip);
|
|
directory1.ifb.optimize_array();
|
|
directory1.area += directory1.ifb.local_result.area;
|
|
//output_data_csv(directory.ifb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//prefetch buffer
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;//check with previous entries to decide wthether to merge.
|
|
data = directory1.caches.l_ip.line_sz;//separate queue to prevent from cache polution.
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;//int(pow(2.0,ceil(log2(data))));
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[2]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory1.prefetchb.name,"directory1PrefetchB");
|
|
directory1.prefetchb.init_cache(&interface_ip);
|
|
directory1.prefetchb.optimize_array();
|
|
directory1.area += directory1.prefetchb.local_result.area;
|
|
//output_data_csv(directory.prefetchb.local_result);
|
|
///cout<<"area="<<area<<endl;
|
|
|
|
//WBB
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = directory1.caches.l_ip.line_sz;
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;
|
|
interface_ip.cache_sz = XML->sys.L2[ithCache].buffer_sizes[3]*interface_ip.line_sz;
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(directory1.wbb.name,"directoryWBB");
|
|
directory1.wbb.init_cache(&interface_ip);
|
|
directory1.wbb.optimize_array();
|
|
directory1.area += directory1.wbb.local_result.area;
|
|
}
|
|
|
|
if (XML->sys.first_level_dir==1)//IC
|
|
{
|
|
tag = XML->sys.physical_address_width + EXTRA_TAG_BITS;
|
|
data = int(ceil(XML->sys.domain_size/8.0));
|
|
interface_ip.specific_tag = 1;
|
|
interface_ip.tag_w = tag;
|
|
interface_ip.line_sz = data;
|
|
interface_ip.cache_sz = XML->sys.domain_size*data*XML->sys.L2[ithCache].L2_config[0]/XML->sys.L2[ithCache].L2_config[1];
|
|
interface_ip.assoc = 0;
|
|
interface_ip.nbanks = 1024;
|
|
interface_ip.out_w = interface_ip.line_sz*8;
|
|
interface_ip.access_mode = 0;
|
|
interface_ip.throughput = XML->sys.L2[ithCache].L2_config[4]/clockRate;
|
|
interface_ip.latency = XML->sys.L2[ithCache].L2_config[5]/clockRate;
|
|
interface_ip.obj_func_dyn_energy = 0;
|
|
interface_ip.obj_func_dyn_power = 0;
|
|
interface_ip.obj_func_leak_power = 0;
|
|
interface_ip.obj_func_cycle_t = 1;
|
|
interface_ip.num_rw_ports = 1;
|
|
interface_ip.num_rd_ports = 0;
|
|
interface_ip.num_wr_ports = 0;
|
|
interface_ip.num_se_rd_ports = 0;
|
|
strcpy(inv_dir.caches.name,"inv_dir");
|
|
inv_dir.caches.init_cache(&interface_ip);
|
|
inv_dir.caches.optimize_array();
|
|
inv_dir.area = inv_dir.caches.local_result.area;
|
|
|
|
}
|
|
*/
|
|
// //pipeline
|
|
// interface_ip.pipeline_stages = int(ceil(directory.caches.local_result.access_time/directory.caches.local_result.cycle_time));
|
|
// interface_ip.per_stage_vector = directory.caches.l_ip.out_w + directory.caches.l_ip.tag_w ;
|
|
// pipeLogicDirectory.init_pipeline(is_default, &interface_ip);
|
|
// pipeLogicDirectory.compute_pipeline();
|
|
//
|
|
// //clock power
|
|
// clockNetwork.init_wire_external(is_default, &interface_ip);
|
|
// clockNetwork.clk_area =area*1.1;//10% of placement overhead. rule of thumb
|
|
// clockNetwork.end_wiring_level =5;//toplevel metal
|
|
// clockNetwork.start_wiring_level =5;//toplevel metal
|
|
// clockNetwork.num_regs = pipeLogicCache.tot_stage_vector + pipeLogicDirectory.tot_stage_vector;
|
|
// clockNetwork.optimize_wire();
|
|
|
|
}
|
|
|
|
|
|
void SharedCache::computeEnergy(bool is_tdp)
|
|
{
|
|
double homenode_data_access = (cachep.dir_ty==SBT)? 0.9:1.0;
|
|
if (is_tdp)
|
|
{
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{
|
|
//init stats for Peak
|
|
unicache.caches->stats_t.readAc.access = .67*unicache.caches->l_ip.num_rw_ports*cachep.duty_cycle*homenode_data_access;
|
|
unicache.caches->stats_t.readAc.miss = 0;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = .33*unicache.caches->l_ip.num_rw_ports*cachep.duty_cycle*homenode_data_access;
|
|
unicache.caches->stats_t.writeAc.miss = 0;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->tdp_stats = unicache.caches->stats_t;
|
|
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
homenode_stats_t.readAc.access = .67*unicache.caches->l_ip.num_rw_ports*cachep.dir_duty_cycle*(1-homenode_data_access);
|
|
homenode_stats_t.readAc.miss = 0;
|
|
homenode_stats_t.readAc.hit = homenode_stats_t.readAc.access - homenode_stats_t.readAc.miss;
|
|
homenode_stats_t.writeAc.access = .67*unicache.caches->l_ip.num_rw_ports*cachep.dir_duty_cycle*(1-homenode_data_access);
|
|
homenode_stats_t.writeAc.miss = 0;
|
|
homenode_stats_t.writeAc.hit = homenode_stats_t.writeAc.access - homenode_stats_t.writeAc.miss;
|
|
homenode_tdp_stats = homenode_stats_t;
|
|
}
|
|
|
|
unicache.missb->stats_t.readAc.access = unicache.missb->l_ip.num_search_ports;
|
|
unicache.missb->stats_t.writeAc.access = unicache.missb->l_ip.num_search_ports;
|
|
unicache.missb->tdp_stats = unicache.missb->stats_t;
|
|
|
|
unicache.ifb->stats_t.readAc.access = unicache.ifb->l_ip.num_search_ports;
|
|
unicache.ifb->stats_t.writeAc.access = unicache.ifb->l_ip.num_search_ports;
|
|
unicache.ifb->tdp_stats = unicache.ifb->stats_t;
|
|
|
|
unicache.prefetchb->stats_t.readAc.access = unicache.prefetchb->l_ip.num_search_ports;
|
|
unicache.prefetchb->stats_t.writeAc.access = unicache.ifb->l_ip.num_search_ports;
|
|
unicache.prefetchb->tdp_stats = unicache.prefetchb->stats_t;
|
|
|
|
unicache.wbb->stats_t.readAc.access = unicache.wbb->l_ip.num_search_ports;
|
|
unicache.wbb->stats_t.writeAc.access = unicache.wbb->l_ip.num_search_ports;
|
|
unicache.wbb->tdp_stats = unicache.wbb->stats_t;
|
|
}
|
|
else
|
|
{
|
|
unicache.caches->stats_t.readAc.access = unicache.caches->l_ip.num_search_ports*cachep.duty_cycle;
|
|
unicache.caches->stats_t.readAc.miss = 0;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = 0;
|
|
unicache.caches->stats_t.writeAc.miss = 0;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->tdp_stats = unicache.caches->stats_t;
|
|
|
|
}
|
|
|
|
}
|
|
else
|
|
{
|
|
//init stats for runtime power (RTP)
|
|
if (cacheL==L2)
|
|
{
|
|
unicache.caches->stats_t.readAc.access = XML->sys.L2[ithCache].read_accesses;
|
|
unicache.caches->stats_t.readAc.miss = XML->sys.L2[ithCache].read_misses;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = XML->sys.L2[ithCache].write_accesses;
|
|
unicache.caches->stats_t.writeAc.miss = XML->sys.L2[ithCache].write_misses;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->rtp_stats = unicache.caches->stats_t;
|
|
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
homenode_rtp_stats.readAc.access = XML->sys.L2[ithCache].homenode_read_accesses;
|
|
homenode_rtp_stats.readAc.miss = XML->sys.L2[ithCache].homenode_read_misses;
|
|
homenode_rtp_stats.readAc.hit = homenode_rtp_stats.readAc.access - homenode_rtp_stats.readAc.miss;
|
|
homenode_rtp_stats.writeAc.access = XML->sys.L2[ithCache].homenode_write_accesses;
|
|
homenode_rtp_stats.writeAc.miss = XML->sys.L2[ithCache].homenode_write_misses;
|
|
homenode_rtp_stats.writeAc.hit = homenode_rtp_stats.writeAc.access - homenode_rtp_stats.writeAc.miss;
|
|
}
|
|
}
|
|
else if (cacheL==L3)
|
|
{
|
|
unicache.caches->stats_t.readAc.access = XML->sys.L3[ithCache].read_accesses;
|
|
unicache.caches->stats_t.readAc.miss = XML->sys.L3[ithCache].read_misses;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = XML->sys.L3[ithCache].write_accesses;
|
|
unicache.caches->stats_t.writeAc.miss = XML->sys.L3[ithCache].write_misses;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->rtp_stats = unicache.caches->stats_t;
|
|
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
homenode_rtp_stats.readAc.access = XML->sys.L3[ithCache].homenode_read_accesses;
|
|
homenode_rtp_stats.readAc.miss = XML->sys.L3[ithCache].homenode_read_misses;
|
|
homenode_rtp_stats.readAc.hit = homenode_rtp_stats.readAc.access - homenode_rtp_stats.readAc.miss;
|
|
homenode_rtp_stats.writeAc.access = XML->sys.L3[ithCache].homenode_write_accesses;
|
|
homenode_rtp_stats.writeAc.miss = XML->sys.L3[ithCache].homenode_write_misses;
|
|
homenode_rtp_stats.writeAc.hit = homenode_rtp_stats.writeAc.access - homenode_rtp_stats.writeAc.miss;
|
|
}
|
|
}
|
|
else if (cacheL==L1Directory)
|
|
{
|
|
unicache.caches->stats_t.readAc.access = XML->sys.L1Directory[ithCache].read_accesses;
|
|
unicache.caches->stats_t.readAc.miss = XML->sys.L1Directory[ithCache].read_misses;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = XML->sys.L1Directory[ithCache].write_accesses;
|
|
unicache.caches->stats_t.writeAc.miss = XML->sys.L1Directory[ithCache].write_misses;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->rtp_stats = unicache.caches->stats_t;
|
|
}
|
|
else if (cacheL==L2Directory)
|
|
{
|
|
unicache.caches->stats_t.readAc.access = XML->sys.L2Directory[ithCache].read_accesses;
|
|
unicache.caches->stats_t.readAc.miss = XML->sys.L2Directory[ithCache].read_misses;
|
|
unicache.caches->stats_t.readAc.hit = unicache.caches->stats_t.readAc.access - unicache.caches->stats_t.readAc.miss;
|
|
unicache.caches->stats_t.writeAc.access = XML->sys.L2Directory[ithCache].write_accesses;
|
|
unicache.caches->stats_t.writeAc.miss = XML->sys.L2Directory[ithCache].write_misses;
|
|
unicache.caches->stats_t.writeAc.hit = unicache.caches->stats_t.writeAc.access - unicache.caches->stats_t.writeAc.miss;
|
|
unicache.caches->rtp_stats = unicache.caches->stats_t;
|
|
}
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{ //Assuming write back and write-allocate cache
|
|
|
|
unicache.missb->stats_t.readAc.access = unicache.caches->stats_t.writeAc.miss ;
|
|
unicache.missb->stats_t.writeAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.missb->rtp_stats = unicache.missb->stats_t;
|
|
|
|
unicache.ifb->stats_t.readAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.ifb->stats_t.writeAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.ifb->rtp_stats = unicache.ifb->stats_t;
|
|
|
|
unicache.prefetchb->stats_t.readAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.prefetchb->stats_t.writeAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.prefetchb->rtp_stats = unicache.prefetchb->stats_t;
|
|
|
|
unicache.wbb->stats_t.readAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
unicache.wbb->stats_t.writeAc.access = unicache.caches->stats_t.writeAc.miss;
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
unicache.missb->stats_t.readAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.missb->stats_t.writeAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.missb->rtp_stats = unicache.missb->stats_t;
|
|
|
|
unicache.missb->stats_t.readAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.missb->stats_t.writeAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.missb->rtp_stats = unicache.missb->stats_t;
|
|
|
|
unicache.ifb->stats_t.readAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.ifb->stats_t.writeAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.ifb->rtp_stats = unicache.ifb->stats_t;
|
|
|
|
unicache.prefetchb->stats_t.readAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.prefetchb->stats_t.writeAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.prefetchb->rtp_stats = unicache.prefetchb->stats_t;
|
|
|
|
unicache.wbb->stats_t.readAc.access += homenode_rtp_stats.writeAc.miss;
|
|
unicache.wbb->stats_t.writeAc.access += homenode_rtp_stats.writeAc.miss;
|
|
}
|
|
unicache.wbb->rtp_stats = unicache.wbb->stats_t;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
unicache.power_t.reset();
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{
|
|
unicache.power_t.readOp.dynamic += (unicache.caches->stats_t.readAc.hit*unicache.caches->local_result.power.readOp.dynamic+
|
|
unicache.caches->stats_t.readAc.miss*unicache.caches->local_result.tag_array2->power.readOp.dynamic+
|
|
unicache.caches->stats_t.writeAc.miss*unicache.caches->local_result.tag_array2->power.writeOp.dynamic+
|
|
unicache.caches->stats_t.writeAc.access*unicache.caches->local_result.power.writeOp.dynamic);//write miss will also generate a write later
|
|
|
|
if (cachep.dir_ty==SBT)
|
|
{
|
|
unicache.power_t.readOp.dynamic += homenode_stats_t.readAc.hit * (unicache.caches->local_result.data_array2->power.readOp.dynamic*dir_overhead +
|
|
unicache.caches->local_result.tag_array2->power.readOp.dynamic) +
|
|
homenode_stats_t.readAc.miss*unicache.caches->local_result.tag_array2->power.readOp.dynamic +
|
|
homenode_stats_t.writeAc.miss*unicache.caches->local_result.tag_array2->power.readOp.dynamic +
|
|
homenode_stats_t.writeAc.hit*(unicache.caches->local_result.data_array2->power.writeOp.dynamic*dir_overhead +
|
|
unicache.caches->local_result.tag_array2->power.readOp.dynamic+
|
|
homenode_stats_t.writeAc.miss*unicache.caches->local_result.power.writeOp.dynamic);//write miss on dynamic home node will generate a replacement write on whole cache block
|
|
|
|
|
|
}
|
|
|
|
unicache.power_t.readOp.dynamic += unicache.missb->stats_t.readAc.access*unicache.missb->local_result.power.searchOp.dynamic +
|
|
unicache.missb->stats_t.writeAc.access*unicache.missb->local_result.power.writeOp.dynamic;//each access to missb involves a CAM and a write
|
|
unicache.power_t.readOp.dynamic += unicache.ifb->stats_t.readAc.access*unicache.ifb->local_result.power.searchOp.dynamic +
|
|
unicache.ifb->stats_t.writeAc.access*unicache.ifb->local_result.power.writeOp.dynamic;
|
|
unicache.power_t.readOp.dynamic += unicache.prefetchb->stats_t.readAc.access*unicache.prefetchb->local_result.power.searchOp.dynamic +
|
|
unicache.prefetchb->stats_t.writeAc.access*unicache.prefetchb->local_result.power.writeOp.dynamic;
|
|
unicache.power_t.readOp.dynamic += unicache.wbb->stats_t.readAc.access*unicache.wbb->local_result.power.searchOp.dynamic +
|
|
unicache.wbb->stats_t.writeAc.access*unicache.wbb->local_result.power.writeOp.dynamic;
|
|
}
|
|
else
|
|
{
|
|
unicache.power_t.readOp.dynamic += (unicache.caches->stats_t.readAc.access*unicache.caches->local_result.power.searchOp.dynamic+
|
|
unicache.caches->stats_t.writeAc.access*unicache.caches->local_result.power.writeOp.dynamic);
|
|
}
|
|
|
|
if (is_tdp)
|
|
{
|
|
unicache.power = unicache.power_t + (unicache.caches->local_result.power)*pppm_lkg;
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{
|
|
unicache.power = unicache.power+
|
|
(unicache.missb->local_result.power +
|
|
unicache.ifb->local_result.power +
|
|
unicache.prefetchb->local_result.power +
|
|
unicache.wbb->local_result.power)*pppm_lkg;
|
|
}
|
|
power = power + unicache.power;
|
|
// cout<<"unicache.caches->local_result.power.readOp.dynamic"<<unicache.caches->local_result.power.readOp.dynamic<<endl;
|
|
// cout<<"unicache.caches->local_result.power.writeOp.dynamic"<<unicache.caches->local_result.power.writeOp.dynamic<<endl;
|
|
}
|
|
else
|
|
{
|
|
unicache.rt_power = unicache.power_t + (unicache.caches->local_result.power)*pppm_lkg;
|
|
if (!((cachep.dir_ty==ST&& cacheL==L1Directory)||(cachep.dir_ty==ST&& cacheL==L2Directory)))
|
|
{
|
|
(unicache.rt_power = unicache.rt_power +
|
|
unicache.missb->local_result.power +
|
|
unicache.ifb->local_result.power +
|
|
unicache.prefetchb->local_result.power +
|
|
unicache.wbb->local_result.power)*pppm_lkg;
|
|
}
|
|
rt_power = rt_power + unicache.rt_power;
|
|
}
|
|
}
|
|
|
|
void SharedCache::displayEnergy(uint32_t indent,bool is_tdp)
|
|
{
|
|
string indent_str(indent, ' ');
|
|
string indent_str_next(indent+2, ' ');
|
|
bool long_channel = XML->sys.longer_channel_device;
|
|
|
|
if (is_tdp)
|
|
{
|
|
cout << (XML->sys.Private_L2? indent_str:"")<< cachep.name << endl;
|
|
cout << indent_str << "Area = " << area.get_area()*1e-6<< " mm^2" << endl;
|
|
cout << indent_str << "Peak Dynamic = " << power.readOp.dynamic*cachep.clockRate << " W" << endl;
|
|
cout << indent_str << "Subthreshold Leakage = "
|
|
<< (long_channel? power.readOp.longer_channel_leakage:power.readOp.leakage) <<" W" << endl;
|
|
//cout << indent_str << "Subthreshold Leakage = " << power.readOp.longer_channel_leakage <<" W" << endl;
|
|
cout << indent_str << "Gate Leakage = " << power.readOp.gate_leakage << " W" << endl;
|
|
cout << indent_str << "Runtime Dynamic = " << rt_power.readOp.dynamic/cachep.executionTime << " W" << endl;
|
|
cout <<endl;
|
|
}
|
|
else
|
|
{
|
|
}
|
|
}
|
|
|
|
//void SharedCache::computeMaxPower()
|
|
//{
|
|
// //Compute maximum power and runtime power.
|
|
// //When computing runtime power, McPAT gets or reasons out the statistics based on XML input.
|
|
// maxPower = 0.0;
|
|
// //llCache,itlb
|
|
// llCache.maxPower = 0.0;
|
|
// llCache.maxPower += (llCache.caches.l_ip.num_rw_ports*(0.67*llCache.caches.local_result.power.readOp.dynamic+0.33*llCache.caches.local_result.power.writeOp.dynamic)
|
|
// +llCache.caches.l_ip.num_rd_ports*llCache.caches.local_result.power.readOp.dynamic+llCache.caches.l_ip.num_wr_ports*llCache.caches.local_result.power.writeOp.dynamic
|
|
// +llCache.caches.l_ip.num_se_rd_ports*llCache.caches.local_result.power.readOp.dynamic)*clockRate;
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
// llCache.maxPower += llCache.missb.l_ip.num_search_ports*llCache.missb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
// llCache.maxPower += llCache.ifb.l_ip.num_search_ports*llCache.ifb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
// llCache.maxPower += llCache.prefetchb.l_ip.num_search_ports*llCache.prefetchb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
// llCache.maxPower += llCache.wbb.l_ip.num_search_ports*llCache.wbb.local_result.power.searchOp.dynamic*clockRate;
|
|
// //llCache.maxPower *= scktRatio; //TODO: this calculation should be self-contained
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
//// directory_power = (directory.caches.l_ip.num_rw_ports*(0.67*directory.caches.local_result.power.readOp.dynamic+0.33*directory.caches.local_result.power.writeOp.dynamic)
|
|
//// +directory.caches.l_ip.num_rd_ports*directory.caches.local_result.power.readOp.dynamic+directory.caches.l_ip.num_wr_ports*directory.caches.local_result.power.writeOp.dynamic
|
|
//// +directory.caches.l_ip.num_se_rd_ports*directory.caches.local_result.power.readOp.dynamic)*clockRate;
|
|
//
|
|
// L2Tot.power.readOp.dynamic = llCache.maxPower;
|
|
// L2Tot.power.readOp.leakage = llCache.caches.local_result.power.readOp.leakage +
|
|
// llCache.missb.local_result.power.readOp.leakage +
|
|
// llCache.ifb.local_result.power.readOp.leakage +
|
|
// llCache.prefetchb.local_result.power.readOp.leakage +
|
|
// llCache.wbb.local_result.power.readOp.leakage;
|
|
//
|
|
// L2Tot.area.set_area(llCache.area*1.1*1e-6);//placement and routing overhead
|
|
//
|
|
// if (XML->sys.number_of_dir_levels==1)
|
|
// {
|
|
// if (XML->sys.first_level_dir==0)
|
|
// {
|
|
// directory.maxPower = 0.0;
|
|
// directory.maxPower += (directory.caches.l_ip.num_rw_ports*(0.67*directory.caches.local_result.power.readOp.dynamic+0.33*directory.caches.local_result.power.writeOp.dynamic)
|
|
// +directory.caches.l_ip.num_rd_ports*directory.caches.local_result.power.readOp.dynamic+directory.caches.l_ip.num_wr_ports*directory.caches.local_result.power.writeOp.dynamic
|
|
// +directory.caches.l_ip.num_se_rd_ports*directory.caches.local_result.power.readOp.dynamic)*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.missb.l_ip.num_search_ports*directory.missb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.ifb.l_ip.num_search_ports*directory.ifb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.prefetchb.l_ip.num_search_ports*directory.prefetchb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.wbb.l_ip.num_search_ports*directory.wbb.local_result.power.searchOp.dynamic*clockRate;
|
|
//
|
|
// cc.power.readOp.dynamic = directory.maxPower*scktRatio*8;//8 is the memory controller counts
|
|
// cc.power.readOp.leakage = directory.caches.local_result.power.readOp.leakage +
|
|
// directory.missb.local_result.power.readOp.leakage +
|
|
// directory.ifb.local_result.power.readOp.leakage +
|
|
// directory.prefetchb.local_result.power.readOp.leakage +
|
|
// directory.wbb.local_result.power.readOp.leakage;
|
|
//
|
|
// cc.power.readOp.leakage *=8;
|
|
//
|
|
// cc.area.set_area(directory.area*8);
|
|
// cout<<"CC area="<<cc.area.get_area()*1e-6<<endl;
|
|
// cout<<"CC Power="<<cc.power.readOp.dynamic<<endl;
|
|
// ccTot.area.set_area(cc.area.get_area()*1e-6);
|
|
// ccTot.power = cc.power;
|
|
// cout<<"DC energy per access" << cc.power.readOp.dynamic/clockRate/8;
|
|
// }
|
|
// else if (XML->sys.first_level_dir==1)
|
|
// {
|
|
// inv_dir.maxPower = inv_dir.caches.local_result.power.searchOp.dynamic*clockRate*XML->sys.domain_size;
|
|
// cc.power.readOp.dynamic = inv_dir.maxPower*scktRatio*64/XML->sys.domain_size;
|
|
// cc.power.readOp.leakage = inv_dir.caches.local_result.power.readOp.leakage*inv_dir.caches.l_ip.nbanks*64/XML->sys.domain_size;
|
|
//
|
|
// cc.area.set_area(inv_dir.area*64/XML->sys.domain_size);
|
|
// cout<<"CC area="<<cc.area.get_area()*1e-6<<endl;
|
|
// cout<<"CC Power="<<cc.power.readOp.dynamic<<endl;
|
|
// ccTot.area.set_area(cc.area.get_area()*1e-6);
|
|
// cout<<"DC energy per access" << cc.power.readOp.dynamic/clockRate/8;
|
|
// ccTot.power = cc.power;
|
|
// }
|
|
// }
|
|
//
|
|
// else if (XML->sys.number_of_dir_levels==2)
|
|
// {
|
|
//
|
|
// directory.maxPower = 0.0;
|
|
// directory.maxPower += (directory.caches.l_ip.num_rw_ports*(0.67*directory.caches.local_result.power.readOp.dynamic+0.33*directory.caches.local_result.power.writeOp.dynamic)
|
|
// +directory.caches.l_ip.num_rd_ports*directory.caches.local_result.power.readOp.dynamic+directory.caches.l_ip.num_wr_ports*directory.caches.local_result.power.writeOp.dynamic
|
|
// +directory.caches.l_ip.num_se_rd_ports*directory.caches.local_result.power.readOp.dynamic)*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.missb.l_ip.num_search_ports*directory.missb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.ifb.l_ip.num_search_ports*directory.ifb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.prefetchb.l_ip.num_search_ports*directory.prefetchb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory.maxPower=" <<directory.maxPower<<endl;
|
|
//
|
|
// directory.maxPower += directory.wbb.l_ip.num_search_ports*directory.wbb.local_result.power.searchOp.dynamic*clockRate;
|
|
//
|
|
// cc.power.readOp.dynamic = directory.maxPower*scktRatio*8;//8 is the memory controller counts
|
|
// cc.power.readOp.leakage = directory.caches.local_result.power.readOp.leakage +
|
|
// directory.missb.local_result.power.readOp.leakage +
|
|
// directory.ifb.local_result.power.readOp.leakage +
|
|
// directory.prefetchb.local_result.power.readOp.leakage +
|
|
// directory.wbb.local_result.power.readOp.leakage;
|
|
// cc.power.readOp.leakage *=8;
|
|
// cc.area.set_area(directory.area*8);
|
|
//
|
|
// if (XML->sys.first_level_dir==0)
|
|
// {
|
|
// directory1.maxPower = 0.0;
|
|
// directory1.maxPower += (directory1.caches.l_ip.num_rw_ports*(0.67*directory1.caches.local_result.power.readOp.dynamic+0.33*directory1.caches.local_result.power.writeOp.dynamic)
|
|
// +directory1.caches.l_ip.num_rd_ports*directory1.caches.local_result.power.readOp.dynamic+directory1.caches.l_ip.num_wr_ports*directory1.caches.local_result.power.writeOp.dynamic
|
|
// +directory1.caches.l_ip.num_se_rd_ports*directory1.caches.local_result.power.readOp.dynamic)*clockRate;
|
|
// ///cout<<"directory1.maxPower=" <<directory1.maxPower<<endl;
|
|
//
|
|
// directory1.maxPower += directory1.missb.l_ip.num_search_ports*directory1.missb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory1.maxPower=" <<directory1.maxPower<<endl;
|
|
//
|
|
// directory1.maxPower += directory1.ifb.l_ip.num_search_ports*directory1.ifb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory1.maxPower=" <<directory1.maxPower<<endl;
|
|
//
|
|
// directory1.maxPower += directory1.prefetchb.l_ip.num_search_ports*directory1.prefetchb.local_result.power.searchOp.dynamic*clockRate;
|
|
// ///cout<<"directory1.maxPower=" <<directory1.maxPower<<endl;
|
|
//
|
|
// directory1.maxPower += directory1.wbb.l_ip.num_search_ports*directory1.wbb.local_result.power.searchOp.dynamic*clockRate;
|
|
//
|
|
// cc1.power.readOp.dynamic = directory1.maxPower*scktRatio*64/XML->sys.domain_size;
|
|
// cc1.power.readOp.leakage = directory1.caches.local_result.power.readOp.leakage +
|
|
// directory1.missb.local_result.power.readOp.leakage +
|
|
// directory1.ifb.local_result.power.readOp.leakage +
|
|
// directory1.prefetchb.local_result.power.readOp.leakage +
|
|
// directory1.wbb.local_result.power.readOp.leakage;
|
|
// cc1.power.readOp.leakage *= 64/XML->sys.domain_size;
|
|
// cc1.area.set_area(directory1.area*64/XML->sys.domain_size);
|
|
//
|
|
// cout<<"CC area="<<(cc.area.get_area()+cc1.area.get_area())*1e-6<<endl;
|
|
// cout<<"CC Power="<<cc.power.readOp.dynamic + cc1.power.readOp.dynamic <<endl;
|
|
// ccTot.area.set_area((cc.area.get_area()+cc1.area.get_area())*1e-6);
|
|
// ccTot.power = cc.power + cc1.power;
|
|
// }
|
|
// else if (XML->sys.first_level_dir==1)
|
|
// {
|
|
// inv_dir.maxPower = inv_dir.caches.local_result.power.searchOp.dynamic*clockRate*XML->sys.domain_size;
|
|
// cc1.power.readOp.dynamic = inv_dir.maxPower*scktRatio*(64/XML->sys.domain_size);
|
|
// cc1.power.readOp.leakage = inv_dir.caches.local_result.power.readOp.leakage*inv_dir.caches.l_ip.nbanks*XML->sys.domain_size;
|
|
//
|
|
// cc1.area.set_area(inv_dir.area*64/XML->sys.domain_size);
|
|
// cout<<"CC area="<<(cc.area.get_area()+cc1.area.get_area())*1e-6<<endl;
|
|
// cout<<"CC Power="<<cc.power.readOp.dynamic + cc1.power.readOp.dynamic <<endl;
|
|
// ccTot.area.set_area((cc.area.get_area()+cc1.area.get_area())*1e-6);
|
|
// ccTot.power = cc.power + cc1.power;
|
|
//
|
|
// }
|
|
// else if (XML->sys.first_level_dir==2)
|
|
// {
|
|
// cout<<"CC area="<<cc.area.get_area()*1e-6<<endl;
|
|
// cout<<"CC Power="<<cc.power.readOp.dynamic<<endl;
|
|
// ccTot.area.set_area(cc.area.get_area()*1e-6);
|
|
// ccTot.power = cc.power;
|
|
// }
|
|
// }
|
|
//
|
|
//cout<<"L2cache size="<<L2Tot.area.get_area()*1e-6<<endl;
|
|
//cout<<"L2cache dynamic power="<<L2Tot.power.readOp.dynamic<<endl;
|
|
//cout<<"L2cache laeakge power="<<L2Tot.power.readOp.leakage<<endl;
|
|
//
|
|
// ///cout<<"llCache.maxPower=" <<llCache.maxPower<<endl;
|
|
//
|
|
//
|
|
// maxPower += llCache.maxPower;
|
|
// ///cout<<"maxpower=" <<maxPower<<endl;
|
|
//
|
|
//// maxPower += pipeLogicCache.power.readOp.dynamic*clockRate;
|
|
//// ///cout<<"pipeLogic.power="<<pipeLogicCache.power.readOp.dynamic*clockRate<<endl;
|
|
//// ///cout<<"maxpower=" <<maxPower<<endl;
|
|
////
|
|
//// maxPower += pipeLogicDirectory.power.readOp.dynamic*clockRate;
|
|
//// ///cout<<"pipeLogic.power="<<pipeLogicDirectory.power.readOp.dynamic*clockRate<<endl;
|
|
//// ///cout<<"maxpower=" <<maxPower<<endl;
|
|
////
|
|
//// //clock power
|
|
//// maxPower += clockNetwork.total_power.readOp.dynamic*clockRate;
|
|
//// ///cout<<"clockNetwork.total_power="<<clockNetwork.total_power.readOp.dynamic*clockRate<<endl;
|
|
//// ///cout<<"maxpower=" <<maxPower<<endl;
|
|
//
|
|
//}
|
|
|
|
void SharedCache::set_cache_param()
|
|
{
|
|
if (cacheL==L2)
|
|
{
|
|
cachep.name = "L2";
|
|
cachep.clockRate = XML->sys.L2[ithCache].clockrate;
|
|
cachep.clockRate *= 1e6;
|
|
cachep.executionTime = XML->sys.total_cycles/(XML->sys.target_core_clockrate*1e6);
|
|
interface_ip.data_arr_ram_cell_tech_type = XML->sys.L2[ithCache].device_type;//long channel device LSTP
|
|
interface_ip.data_arr_peri_global_tech_type = XML->sys.L2[ithCache].device_type;
|
|
interface_ip.tag_arr_ram_cell_tech_type = XML->sys.L2[ithCache].device_type;
|
|
interface_ip.tag_arr_peri_global_tech_type = XML->sys.L2[ithCache].device_type;
|
|
cachep.capacity = XML->sys.L2[ithCache].L2_config[0];
|
|
cachep.blockW = XML->sys.L2[ithCache].L2_config[1];
|
|
cachep.assoc = XML->sys.L2[ithCache].L2_config[2];
|
|
cachep.nbanks = XML->sys.L2[ithCache].L2_config[3];
|
|
cachep.throughput = XML->sys.L2[ithCache].L2_config[4]/cachep.clockRate;
|
|
cachep.latency = XML->sys.L2[ithCache].L2_config[5]/cachep.clockRate;
|
|
cachep.missb_size = XML->sys.L2[ithCache].buffer_sizes[0];
|
|
cachep.fu_size = XML->sys.L2[ithCache].buffer_sizes[1];
|
|
cachep.prefetchb_size= XML->sys.L2[ithCache].buffer_sizes[2];
|
|
cachep.wbb_size = XML->sys.L2[ithCache].buffer_sizes[3];
|
|
cachep.duty_cycle = XML->sys.L2[ithCache].duty_cycle;
|
|
if (!XML->sys.L2[ithCache].merged_dir)
|
|
{
|
|
cachep.dir_ty = NonDir;
|
|
}
|
|
else
|
|
{
|
|
cachep.dir_ty = SBT;
|
|
cachep.dir_duty_cycle = XML->sys.L2[ithCache].dir_duty_cycle;
|
|
}
|
|
}
|
|
else if (cacheL==L3)
|
|
{
|
|
cachep.name = "L3";
|
|
cachep.clockRate = XML->sys.L3[ithCache].clockrate;
|
|
cachep.clockRate *= 1e6;
|
|
cachep.executionTime = XML->sys.total_cycles/(XML->sys.target_core_clockrate*1e6);
|
|
interface_ip.data_arr_ram_cell_tech_type = XML->sys.L3[ithCache].device_type;//long channel device LSTP
|
|
interface_ip.data_arr_peri_global_tech_type = XML->sys.L3[ithCache].device_type;
|
|
interface_ip.tag_arr_ram_cell_tech_type = XML->sys.L3[ithCache].device_type;
|
|
interface_ip.tag_arr_peri_global_tech_type = XML->sys.L3[ithCache].device_type;
|
|
cachep.capacity = XML->sys.L3[ithCache].L3_config[0];
|
|
cachep.blockW = XML->sys.L3[ithCache].L3_config[1];
|
|
cachep.assoc = XML->sys.L3[ithCache].L3_config[2];
|
|
cachep.nbanks = XML->sys.L3[ithCache].L3_config[3];
|
|
cachep.throughput = XML->sys.L3[ithCache].L3_config[4]/cachep.clockRate;
|
|
cachep.latency = XML->sys.L3[ithCache].L3_config[5]/cachep.clockRate;
|
|
cachep.missb_size = XML->sys.L3[ithCache].buffer_sizes[0];
|
|
cachep.fu_size = XML->sys.L3[ithCache].buffer_sizes[1];
|
|
cachep.prefetchb_size= XML->sys.L3[ithCache].buffer_sizes[2];
|
|
cachep.wbb_size = XML->sys.L3[ithCache].buffer_sizes[3];
|
|
cachep.duty_cycle = XML->sys.L3[ithCache].duty_cycle;
|
|
if (!XML->sys.L2[ithCache].merged_dir)
|
|
{
|
|
cachep.dir_ty = NonDir;
|
|
}
|
|
else
|
|
{
|
|
cachep.dir_ty = SBT;
|
|
cachep.dir_duty_cycle = XML->sys.L2[ithCache].dir_duty_cycle;
|
|
}
|
|
}
|
|
else if (cacheL==L1Directory)
|
|
{
|
|
cachep.name = "First Level Directory";
|
|
cachep.dir_ty = (enum Dir_type) XML->sys.L1Directory[ithCache].Directory_type;
|
|
cachep.clockRate = XML->sys.L1Directory[ithCache].clockrate;
|
|
cachep.clockRate *= 1e6;
|
|
cachep.executionTime = XML->sys.total_cycles/(XML->sys.target_core_clockrate*1e6);
|
|
interface_ip.data_arr_ram_cell_tech_type = XML->sys.L1Directory[ithCache].device_type;//long channel device LSTP
|
|
interface_ip.data_arr_peri_global_tech_type = XML->sys.L1Directory[ithCache].device_type;
|
|
interface_ip.tag_arr_ram_cell_tech_type = XML->sys.L1Directory[ithCache].device_type;
|
|
interface_ip.tag_arr_peri_global_tech_type = XML->sys.L1Directory[ithCache].device_type;
|
|
cachep.capacity = XML->sys.L1Directory[ithCache].Dir_config[0];
|
|
cachep.blockW = XML->sys.L1Directory[ithCache].Dir_config[1];
|
|
cachep.assoc = XML->sys.L1Directory[ithCache].Dir_config[2];
|
|
cachep.nbanks = XML->sys.L1Directory[ithCache].Dir_config[3];
|
|
cachep.throughput = XML->sys.L1Directory[ithCache].Dir_config[4]/cachep.clockRate;
|
|
cachep.latency = XML->sys.L1Directory[ithCache].Dir_config[5]/cachep.clockRate;
|
|
cachep.missb_size = XML->sys.L1Directory[ithCache].buffer_sizes[0];
|
|
cachep.fu_size = XML->sys.L1Directory[ithCache].buffer_sizes[1];
|
|
cachep.prefetchb_size= XML->sys.L1Directory[ithCache].buffer_sizes[2];
|
|
cachep.wbb_size = XML->sys.L1Directory[ithCache].buffer_sizes[3];
|
|
cachep.duty_cycle = XML->sys.L1Directory[ithCache].duty_cycle;
|
|
}
|
|
else if (cacheL==L2Directory)
|
|
{
|
|
cachep.name = "Second Level Directory";
|
|
cachep.dir_ty = (enum Dir_type) XML->sys.L2Directory[ithCache].Directory_type;
|
|
cachep.clockRate = XML->sys.L2Directory[ithCache].clockrate;
|
|
cachep.clockRate *= 1e6;
|
|
cachep.executionTime = XML->sys.total_cycles/(XML->sys.target_core_clockrate*1e6);
|
|
interface_ip.data_arr_ram_cell_tech_type = XML->sys.L2Directory[ithCache].device_type;//long channel device LSTP
|
|
interface_ip.data_arr_peri_global_tech_type = XML->sys.L2Directory[ithCache].device_type;
|
|
interface_ip.tag_arr_ram_cell_tech_type = XML->sys.L2Directory[ithCache].device_type;
|
|
interface_ip.tag_arr_peri_global_tech_type = XML->sys.L2Directory[ithCache].device_type;
|
|
cachep.capacity = XML->sys.L2Directory[ithCache].Dir_config[0];
|
|
cachep.blockW = XML->sys.L2Directory[ithCache].Dir_config[1];
|
|
cachep.assoc = XML->sys.L2Directory[ithCache].Dir_config[2];
|
|
cachep.nbanks = XML->sys.L2Directory[ithCache].Dir_config[3];
|
|
cachep.throughput = XML->sys.L2Directory[ithCache].Dir_config[4]/cachep.clockRate;
|
|
cachep.latency = XML->sys.L2Directory[ithCache].Dir_config[5]/cachep.clockRate;
|
|
cachep.missb_size = XML->sys.L2Directory[ithCache].buffer_sizes[0];
|
|
cachep.fu_size = XML->sys.L2Directory[ithCache].buffer_sizes[1];
|
|
cachep.prefetchb_size= XML->sys.L2Directory[ithCache].buffer_sizes[2];
|
|
cachep.wbb_size = XML->sys.L2Directory[ithCache].buffer_sizes[3];
|
|
cachep.duty_cycle = XML->sys.L2Directory[ithCache].duty_cycle;
|
|
}
|
|
//cachep.cache_duty_cycle=cachep.dir_duty_cycle = 0.35;
|
|
}
|
|
|