2014-04-01 18:44:30 +02:00
|
|
|
/*****************************************************************************
|
|
|
|
* McPAT/CACTI
|
|
|
|
* SOFTWARE LICENSE AGREEMENT
|
|
|
|
* Copyright 2012 Hewlett-Packard Development Company, L.P.
|
2014-06-03 22:32:59 +02:00
|
|
|
* Copyright (c) 2010-2013 Advanced Micro Devices, Inc.
|
2014-04-01 18:44:30 +02:00
|
|
|
* All Rights Reserved
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions are
|
|
|
|
* met: redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer;
|
|
|
|
* redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution;
|
|
|
|
* neither the name of the copyright holders nor the names of its
|
|
|
|
* contributors may be used to endorse or promote products derived from
|
|
|
|
* this software without specific prior written permission.
|
|
|
|
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
|
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
|
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
|
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
2014-06-03 22:32:59 +02:00
|
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
2014-04-01 18:44:30 +02:00
|
|
|
*
|
|
|
|
***************************************************************************/
|
|
|
|
|
|
|
|
#include "crossbar.h"
|
|
|
|
|
|
|
|
#define ASPECT_THRESHOLD .8
|
|
|
|
#define ADJ 1
|
|
|
|
|
|
|
|
Crossbar::Crossbar(
|
|
|
|
double n_inp_,
|
|
|
|
double n_out_,
|
|
|
|
double flit_size_,
|
|
|
|
TechnologyParameter::DeviceType *dt
|
2014-06-03 22:32:59 +02:00
|
|
|
): n_inp(n_inp_), n_out(n_out_), flit_size(flit_size_), deviceType(dt) {
|
|
|
|
min_w_pmos = deviceType->n_to_p_eff_curr_drv_ratio * g_tp.min_w_nmos_;
|
|
|
|
Vdd = dt->Vdd;
|
|
|
|
CB_ADJ = 1;
|
2014-04-01 18:44:30 +02:00
|
|
|
}
|
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
Crossbar::~Crossbar() {}
|
2014-04-01 18:44:30 +02:00
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
double Crossbar::output_buffer() {
|
2014-04-01 18:44:30 +02:00
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
//Wire winit(4, 4);
|
|
|
|
double l_eff = n_inp * flit_size * g_tp.wire_outside_mat.pitch;
|
|
|
|
Wire w1(g_ip->wt, l_eff);
|
|
|
|
//double s1 = w1.repeater_size *l_eff*ADJ/w1.repeater_spacing;
|
|
|
|
double s1 = w1.repeater_size * (l_eff < w1.repeater_spacing ?
|
|
|
|
l_eff * ADJ / w1.repeater_spacing : ADJ);
|
|
|
|
double pton_size = deviceType->n_to_p_eff_curr_drv_ratio;
|
|
|
|
// the model assumes input capacitance of the wire driver = input capacitance of nand + nor = input cap of the driver transistor
|
|
|
|
TriS1 = s1 * (1 + pton_size) / (2 + pton_size + 1 + 2 * pton_size);
|
|
|
|
TriS2 = s1; //driver transistor
|
2014-04-01 18:44:30 +02:00
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
if (TriS1 < 1)
|
|
|
|
TriS1 = 1;
|
2014-04-01 18:44:30 +02:00
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
double input_cap = gate_C(TriS1 * (2 * min_w_pmos + g_tp.min_w_nmos_), 0) +
|
|
|
|
gate_C(TriS1 * (min_w_pmos + 2 * g_tp.min_w_nmos_), 0);
|
2014-04-01 18:44:30 +02:00
|
|
|
// input_cap += drain_C_(TriS1*g_tp.min_w_nmos_, NCH, 1, 1, g_tp.cell_h_def) +
|
|
|
|
// drain_C_(TriS1*min_w_pmos, PCH, 1, 1, g_tp.cell_h_def)*2 +
|
|
|
|
// gate_C(TriS2*g_tp.min_w_nmos_, 0)+
|
|
|
|
// drain_C_(TriS1*min_w_pmos, NCH, 1, 1, g_tp.cell_h_def)*2 +
|
|
|
|
// drain_C_(TriS1*min_w_pmos, PCH, 1, 1, g_tp.cell_h_def) +
|
|
|
|
// gate_C(TriS2*min_w_pmos, 0);
|
2014-06-03 22:32:59 +02:00
|
|
|
tri_int_cap = drain_C_(TriS1 * g_tp.min_w_nmos_, NCH, 1, 1, g_tp.cell_h_def) +
|
|
|
|
drain_C_(TriS1 * min_w_pmos, PCH, 1, 1, g_tp.cell_h_def) * 2 +
|
|
|
|
gate_C(TriS2 * g_tp.min_w_nmos_, 0) +
|
|
|
|
drain_C_(TriS1 * min_w_pmos, NCH, 1, 1, g_tp.cell_h_def) * 2 +
|
|
|
|
drain_C_(TriS1 * min_w_pmos, PCH, 1, 1, g_tp.cell_h_def) +
|
|
|
|
gate_C(TriS2 * min_w_pmos, 0);
|
|
|
|
double output_cap = drain_C_(TriS2 * g_tp.min_w_nmos_, NCH, 1, 1,
|
|
|
|
g_tp.cell_h_def) +
|
|
|
|
drain_C_(TriS2 * min_w_pmos, PCH, 1, 1, g_tp.cell_h_def);
|
|
|
|
double ctr_cap = gate_C(TriS2 * (min_w_pmos + g_tp.min_w_nmos_), 0);
|
|
|
|
|
|
|
|
tri_inp_cap = input_cap;
|
|
|
|
tri_out_cap = output_cap;
|
|
|
|
tri_ctr_cap = ctr_cap;
|
|
|
|
return input_cap + output_cap + ctr_cap;
|
2014-04-01 18:44:30 +02:00
|
|
|
}
|
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
void Crossbar::compute_power() {
|
|
|
|
|
|
|
|
Wire winit(4, 4);
|
|
|
|
double tri_cap = output_buffer();
|
|
|
|
assert(tri_cap > 0);
|
|
|
|
//area of a tristate logic
|
|
|
|
double g_area = compute_gate_area(INV, 1, TriS2 * g_tp.min_w_nmos_,
|
|
|
|
TriS2 * min_w_pmos, g_tp.cell_h_def);
|
|
|
|
g_area *= 2; // to model area of output transistors
|
|
|
|
g_area += compute_gate_area (NAND, 2, TriS1 * 2 * g_tp.min_w_nmos_,
|
|
|
|
TriS1 * min_w_pmos, g_tp.cell_h_def);
|
|
|
|
g_area += compute_gate_area (NOR, 2, TriS1 * g_tp.min_w_nmos_,
|
|
|
|
TriS1 * 2 * min_w_pmos, g_tp.cell_h_def);
|
|
|
|
double width /*per tristate*/ = g_area / (CB_ADJ * g_tp.cell_h_def);
|
|
|
|
// effective no. of tristate buffers that need to be laid side by side
|
|
|
|
int ntri = (int)ceil(g_tp.cell_h_def / (g_tp.wire_outside_mat.pitch));
|
|
|
|
double wire_len = MAX(width * ntri * n_out,
|
|
|
|
flit_size * g_tp.wire_outside_mat.pitch * n_out);
|
|
|
|
Wire w1(g_ip->wt, wire_len);
|
|
|
|
|
|
|
|
area.w = wire_len;
|
|
|
|
area.h = g_tp.wire_outside_mat.pitch * n_inp * flit_size * CB_ADJ;
|
|
|
|
Wire w2(g_ip->wt, area.h);
|
|
|
|
|
|
|
|
double aspect_ratio_cb = (area.h / area.w) * (n_out / n_inp);
|
|
|
|
if (aspect_ratio_cb > 1) aspect_ratio_cb = 1 / aspect_ratio_cb;
|
|
|
|
|
|
|
|
if (aspect_ratio_cb < ASPECT_THRESHOLD) {
|
|
|
|
if (n_out > 2 && n_inp > 2) {
|
|
|
|
CB_ADJ += 0.2;
|
|
|
|
//cout << "CB ADJ " << CB_ADJ << endl;
|
|
|
|
if (CB_ADJ < 4) {
|
|
|
|
this->compute_power();
|
|
|
|
}
|
|
|
|
}
|
2014-04-01 18:44:30 +02:00
|
|
|
}
|
2014-06-03 22:32:59 +02:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
power.readOp.dynamic =
|
|
|
|
(w1.power.readOp.dynamic + w2.power.readOp.dynamic +
|
|
|
|
(tri_inp_cap * n_out + tri_out_cap * n_inp + tri_ctr_cap +
|
|
|
|
tri_int_cap) * Vdd * Vdd) * flit_size;
|
|
|
|
power.readOp.leakage = n_inp * n_out * flit_size * (
|
|
|
|
cmos_Isub_leakage(g_tp.min_w_nmos_ * TriS2 * 2, min_w_pmos * TriS2 * 2,
|
|
|
|
1, inv) * Vdd +
|
|
|
|
cmos_Isub_leakage(g_tp.min_w_nmos_ * TriS1 * 3, min_w_pmos * TriS1 * 3,
|
|
|
|
2, nand) * Vdd +
|
|
|
|
cmos_Isub_leakage(g_tp.min_w_nmos_ * TriS1 * 3, min_w_pmos * TriS1 * 3,
|
|
|
|
2, nor) * Vdd +
|
|
|
|
w1.power.readOp.leakage + w2.power.readOp.leakage);
|
|
|
|
power.readOp.gate_leakage = n_inp * n_out * flit_size * (
|
|
|
|
cmos_Ig_leakage(g_tp.min_w_nmos_ * TriS2 * 2, min_w_pmos * TriS2 * 2,
|
|
|
|
1, inv) * Vdd +
|
|
|
|
cmos_Ig_leakage(g_tp.min_w_nmos_ * TriS1 * 3, min_w_pmos * TriS1 * 3,
|
|
|
|
2, nand) * Vdd +
|
|
|
|
cmos_Ig_leakage(g_tp.min_w_nmos_ * TriS1 * 3, min_w_pmos * TriS1 * 3,
|
|
|
|
2, nor) * Vdd +
|
|
|
|
w1.power.readOp.gate_leakage + w2.power.readOp.gate_leakage);
|
|
|
|
|
|
|
|
// delay calculation
|
|
|
|
double l_eff = n_inp * flit_size * g_tp.wire_outside_mat.pitch;
|
|
|
|
Wire wdriver(g_ip->wt, l_eff);
|
|
|
|
double res = g_tp.wire_outside_mat.R_per_um * (area.w + area.h) +
|
|
|
|
tr_R_on(g_tp.min_w_nmos_ * wdriver.repeater_size, NCH, 1);
|
|
|
|
double cap = g_tp.wire_outside_mat.C_per_um * (area.w + area.h) + n_out *
|
|
|
|
tri_inp_cap + n_inp * tri_out_cap;
|
|
|
|
delay = horowitz(w1.signal_rise_time(), res * cap, deviceType->Vth /
|
|
|
|
deviceType->Vdd, deviceType->Vth / deviceType->Vdd, RISE);
|
|
|
|
|
|
|
|
Wire wreset();
|
2014-04-01 18:44:30 +02:00
|
|
|
}
|
|
|
|
|
2014-06-03 22:32:59 +02:00
|
|
|
void Crossbar::print_crossbar() {
|
|
|
|
cout << "\nCrossbar Stats (" << n_inp << "x" << n_out << ")\n\n";
|
|
|
|
cout << "Flit size : " << flit_size << " bits" << endl;
|
|
|
|
cout << "Width : " << area.w << " u" << endl;
|
|
|
|
cout << "Height : " << area.h << " u" << endl;
|
|
|
|
cout << "Dynamic Power : " << power.readOp.dynamic*1e9 *
|
|
|
|
MIN(n_inp, n_out) << " (nJ)" << endl;
|
|
|
|
cout << "Leakage Power : " << power.readOp.leakage*1e3 << " (mW)"
|
|
|
|
<< endl;
|
|
|
|
cout << "Gate Leakage Power : " << power.readOp.gate_leakage*1e3
|
|
|
|
<< " (mW)" << endl;
|
|
|
|
cout << "Crossbar Delay : " << delay*1e12 << " ps\n";
|
2014-04-01 18:44:30 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|