rr_graph area estimator adopted RRGraph object

This commit is contained in:
tangxifan 2020-02-01 21:53:31 -07:00
parent 12a8f79869
commit a99835e1c1
3 changed files with 60 additions and 65 deletions

View File

@ -33,7 +33,7 @@ static void count_unidir_routing_transistors(std::vector<t_segment_inf>& segment
float R_minW_pmos, float R_minW_pmos,
const float trans_sram_bit); const float trans_sram_bit);
static float get_cblock_trans(int* num_inputs_to_cblock, int wire_to_ipin_switch, int max_inputs_to_cblock, float trans_sram_bit); static float get_cblock_trans(const vtr::vector<RRNodeId, int>& num_inputs_to_cblock, int wire_to_ipin_switch, int max_inputs_to_cblock, float trans_sram_bit);
static float* alloc_and_load_unsharable_switch_trans(int num_switch, static float* alloc_and_load_unsharable_switch_trans(int num_switch,
float trans_sram_bit, float trans_sram_bit,
@ -101,7 +101,7 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
* optimistic (but I still think it's pretty reasonable). */ * optimistic (but I still think it's pretty reasonable). */
auto& device_ctx = g_vpr_ctx.device(); auto& device_ctx = g_vpr_ctx.device();
int* num_inputs_to_cblock; /* [0..device_ctx.rr_nodes.size()-1], but all entries not */ vtr::vector<RRNodeId, int> num_inputs_to_cblock; /* [0..device_ctx.rr_nodes.size()-1], but all entries not */
/* corresponding to IPINs will be 0. */ /* corresponding to IPINs will be 0. */
@ -110,7 +110,7 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
float *unsharable_switch_trans, *sharable_switch_trans; /* [0..num_switch-1] */ float *unsharable_switch_trans, *sharable_switch_trans; /* [0..num_switch-1] */
t_rr_type from_rr_type, to_rr_type; t_rr_type from_rr_type, to_rr_type;
int iedge, num_edges, maxlen; int maxlen;
int iswitch, i, j, iseg, max_inputs_to_cblock; int iswitch, i, j, iseg, max_inputs_to_cblock;
float input_cblock_trans, shared_opin_buffer_trans; float input_cblock_trans, shared_opin_buffer_trans;
@ -144,7 +144,7 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
trans_track_to_cblock_buf = 0; trans_track_to_cblock_buf = 0;
} }
num_inputs_to_cblock = (int*)vtr::calloc(device_ctx.rr_nodes.size(), sizeof(int)); num_inputs_to_cblock.resize(device_ctx.rr_graph.nodes().size(), 0);
maxlen = std::max(device_ctx.grid.width(), device_ctx.grid.height()); maxlen = std::max(device_ctx.grid.width(), device_ctx.grid.height());
cblock_counted = (bool*)vtr::calloc(maxlen, sizeof(bool)); cblock_counted = (bool*)vtr::calloc(maxlen, sizeof(bool));
@ -156,29 +156,27 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
sharable_switch_trans = alloc_and_load_sharable_switch_trans(num_switch, sharable_switch_trans = alloc_and_load_sharable_switch_trans(num_switch,
R_minW_nmos, R_minW_pmos); R_minW_nmos, R_minW_pmos);
for (size_t from_node = 0; from_node < device_ctx.rr_nodes.size(); from_node++) { for (const RRNodeId& from_node : device_ctx.rr_graph.nodes()) {
from_rr_type = device_ctx.rr_nodes[from_node].type(); from_rr_type = device_ctx.rr_graph.node_type(from_node);
switch (from_rr_type) { switch (from_rr_type) {
case CHANX: case CHANX:
case CHANY: case CHANY:
num_edges = device_ctx.rr_nodes[from_node].num_edges(); for (const RREdgeId& iedge : device_ctx.rr_graph.node_out_edges(from_node)) {
RRNodeId to_node = device_ctx.rr_graph.edge_sink_node(iedge);
for (iedge = 0; iedge < num_edges; iedge++) { to_rr_type = device_ctx.rr_graph.node_type(to_node);
size_t to_node = device_ctx.rr_nodes[from_node].edge_sink_node(iedge);
to_rr_type = device_ctx.rr_nodes[to_node].type();
/* Ignore any uninitialized rr_graph nodes */ /* Ignore any uninitialized rr_graph nodes */
if ((device_ctx.rr_nodes[to_node].type() == SOURCE) if ((device_ctx.rr_graph.node_type(to_node) == SOURCE)
&& (device_ctx.rr_nodes[to_node].xlow() == 0) && (device_ctx.rr_nodes[to_node].ylow() == 0) && (device_ctx.rr_graph.node_xlow(to_node) == 0) && (device_ctx.rr_graph.node_ylow(to_node) == 0)
&& (device_ctx.rr_nodes[to_node].xhigh() == 0) && (device_ctx.rr_nodes[to_node].yhigh() == 0)) { && (device_ctx.rr_graph.node_xhigh(to_node) == 0) && (device_ctx.rr_graph.node_yhigh(to_node) == 0)) {
continue; continue;
} }
switch (to_rr_type) { switch (to_rr_type) {
case CHANX: case CHANX:
case CHANY: case CHANY:
iswitch = device_ctx.rr_nodes[from_node].edge_switch(iedge); iswitch = (short)size_t(device_ctx.rr_graph.edge_switch(iedge));
if (device_ctx.rr_switch_inf[iswitch].buffered()) { if (device_ctx.rr_switch_inf[iswitch].buffered()) {
iseg = seg_index_of_sblock(from_node, to_node); iseg = seg_index_of_sblock(from_node, to_node);
@ -214,8 +212,8 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
default: default:
VPR_ERROR(VPR_ERROR_ROUTE, VPR_ERROR(VPR_ERROR_ROUTE,
"in count_routing_transistors:\n" "in count_routing_transistors:\n"
"\tUnexpected connection from node %d (type %s) to node %d (type %s).\n", "\tUnexpected connection from node %ld (type %s) to node %ld (type %s).\n",
from_node, rr_node_typename[from_rr_type], to_node, rr_node_typename[to_rr_type]); size_t(from_node), rr_node_typename[from_rr_type], size_t(to_node), rr_node_typename[to_rr_type]);
break; break;
} /* End switch on to_rr_type. */ } /* End switch on to_rr_type. */
@ -225,35 +223,34 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
/* Now add in the shared buffer transistors, and reset some flags. */ /* Now add in the shared buffer transistors, and reset some flags. */
if (from_rr_type == CHANX) { if (from_rr_type == CHANX) {
for (i = device_ctx.rr_nodes[from_node].xlow() - 1; for (i = device_ctx.rr_graph.node_xlow(from_node) - 1;
i <= device_ctx.rr_nodes[from_node].xhigh(); i++) { i <= device_ctx.rr_graph.node_xhigh(from_node); i++) {
ntrans_sharing += shared_buffer_trans[i]; ntrans_sharing += shared_buffer_trans[i];
shared_buffer_trans[i] = 0.; shared_buffer_trans[i] = 0.;
} }
for (i = device_ctx.rr_nodes[from_node].xlow(); i <= device_ctx.rr_nodes[from_node].xhigh(); for (i = device_ctx.rr_graph.node_xlow(from_node); i <= device_ctx.rr_graph.node_xhigh(from_node);
i++) i++)
cblock_counted[i] = false; cblock_counted[i] = false;
} else { /* CHANY */ } else { /* CHANY */
for (j = device_ctx.rr_nodes[from_node].ylow() - 1; for (j = device_ctx.rr_graph.node_ylow(from_node) - 1;
j <= device_ctx.rr_nodes[from_node].yhigh(); j++) { j <= device_ctx.rr_graph.node_yhigh(from_node); j++) {
ntrans_sharing += shared_buffer_trans[j]; ntrans_sharing += shared_buffer_trans[j];
shared_buffer_trans[j] = 0.; shared_buffer_trans[j] = 0.;
} }
for (j = device_ctx.rr_nodes[from_node].ylow(); j <= device_ctx.rr_nodes[from_node].yhigh(); for (j = device_ctx.rr_graph.node_ylow(from_node); j <= device_ctx.rr_graph.node_yhigh(from_node);
j++) j++)
cblock_counted[j] = false; cblock_counted[j] = false;
} }
break; break;
case OPIN: case OPIN:
num_edges = device_ctx.rr_nodes[from_node].num_edges();
shared_opin_buffer_trans = 0.; shared_opin_buffer_trans = 0.;
for (iedge = 0; iedge < num_edges; iedge++) { for (const RREdgeId& iedge : device_ctx.rr_graph.node_out_edges(from_node)) {
iswitch = device_ctx.rr_nodes[from_node].edge_switch(iedge); iswitch = (short)size_t(device_ctx.rr_graph.edge_switch(iedge));
ntrans_no_sharing += unsharable_switch_trans[iswitch] ntrans_no_sharing += unsharable_switch_trans[iswitch]
+ sharable_switch_trans[iswitch]; + sharable_switch_trans[iswitch];
ntrans_sharing += unsharable_switch_trans[iswitch]; ntrans_sharing += unsharable_switch_trans[iswitch];
@ -281,7 +278,7 @@ void count_bidir_routing_transistors(int num_switch, int wire_to_ipin_switch, fl
input_cblock_trans = get_cblock_trans(num_inputs_to_cblock, wire_to_ipin_switch, input_cblock_trans = get_cblock_trans(num_inputs_to_cblock, wire_to_ipin_switch,
max_inputs_to_cblock, trans_sram_bit); max_inputs_to_cblock, trans_sram_bit);
free(num_inputs_to_cblock); num_inputs_to_cblock.clear();
ntrans_sharing += input_cblock_trans; ntrans_sharing += input_cblock_trans;
ntrans_no_sharing += input_cblock_trans; ntrans_no_sharing += input_cblock_trans;
@ -303,13 +300,12 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
auto& device_ctx = g_vpr_ctx.device(); auto& device_ctx = g_vpr_ctx.device();
bool* cblock_counted; /* [0..max(device_ctx.grid.width(),device_ctx.grid.height())] -- 0th element unused. */ bool* cblock_counted; /* [0..max(device_ctx.grid.width(),device_ctx.grid.height())] -- 0th element unused. */
int* num_inputs_to_cblock; /* [0..device_ctx.rr_nodes.size()-1], but all entries not */ vtr::vector<RRNodeId, int> num_inputs_to_cblock; /* [0..device_ctx.rr_nodes.size()-1], but all entries not */
/* corresponding to IPINs will be 0. */ /* corresponding to IPINs will be 0. */
t_rr_type from_rr_type, to_rr_type; t_rr_type from_rr_type, to_rr_type;
int i, j, iseg, iedge, num_edges, maxlen; int i, j, iseg, maxlen;
RRNodeId to_node;
int max_inputs_to_cblock; int max_inputs_to_cblock;
float input_cblock_trans; float input_cblock_trans;
@ -318,8 +314,7 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
* a single mux. We should count this mux only once as we look at the outgoing * a single mux. We should count this mux only once as we look at the outgoing
* switches of all rr nodes. Thus we keep track of which muxes we have already * switches of all rr nodes. Thus we keep track of which muxes we have already
* counted via the variable below. */ * counted via the variable below. */
bool* chan_node_switch_done; vtr::vector<RRNodeId, bool> chan_node_switch_done(device_ctx.rr_graph.nodes().size(), false);
chan_node_switch_done = (bool*)vtr::calloc(device_ctx.rr_graph.nodes().size(), sizeof(bool));
/* The variable below is an accumulator variable that will add up all the * /* The variable below is an accumulator variable that will add up all the *
* transistors in the routing. Make double so that it doesn't stop * * transistors in the routing. Make double so that it doesn't stop *
@ -349,7 +344,7 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
trans_track_to_cblock_buf = 0; trans_track_to_cblock_buf = 0;
} }
num_inputs_to_cblock = (int*)vtr::calloc(device_ctx.rr_graph.nodes().size(), sizeof(int)); num_inputs_to_cblock.resize(device_ctx.rr_graph.nodes().size(), 0);
maxlen = std::max(device_ctx.grid.width(), device_ctx.grid.height()); maxlen = std::max(device_ctx.grid.width(), device_ctx.grid.height());
cblock_counted = (bool*)vtr::calloc(maxlen, sizeof(bool)); cblock_counted = (bool*)vtr::calloc(maxlen, sizeof(bool));
@ -376,10 +371,10 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
case CHANX: case CHANX:
case CHANY: case CHANY:
if (!chan_node_switch_done[to_node]) { if (!chan_node_switch_done[to_node]) {
int switch_index = device_ctx.rr_nodes[from_node].edge_switch(iedge); int switch_index = (int)size_t(device_ctx.rr_graph.edge_switch(iedge));
auto switch_type = device_ctx.rr_switch_inf[switch_index].type(); auto switch_type = device_ctx.rr_switch_inf[switch_index].type();
int fan_in = device_ctx.rr_nodes[to_node].fan_in(); int fan_in = device_ctx.rr_graph.node_in_edges(to_node).size();
if (device_ctx.rr_switch_inf[switch_index].type() == SwitchType::MUX) { if (device_ctx.rr_switch_inf[switch_index].type() == SwitchType::MUX) {
/* Each wire segment begins with a multipexer followed by a driver for unidirectional */ /* Each wire segment begins with a multipexer followed by a driver for unidirectional */
@ -433,8 +428,8 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
default: default:
VPR_ERROR(VPR_ERROR_ROUTE, VPR_ERROR(VPR_ERROR_ROUTE,
"in count_routing_transistors:\n" "in count_routing_transistors:\n"
"\tUnexpected connection from node %d (type %d) to node %d (type %d).\n", "\tUnexpected connection from node %ld (type %d) to node %ld (type %d).\n",
from_node, from_rr_type, to_node, to_rr_type); size_t(from_node), from_rr_type, size_t(to_node), to_rr_type);
break; break;
} /* End switch on to_rr_type. */ } /* End switch on to_rr_type. */
@ -443,11 +438,11 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
/* Reset some flags */ /* Reset some flags */
if (from_rr_type == CHANX) { if (from_rr_type == CHANX) {
for (i = device_ctx.rr_nodes[from_node].xlow(); i <= device_ctx.rr_nodes[from_node].xhigh(); i++) for (i = device_ctx.rr_graph.node_xlow(from_node); i <= device_ctx.rr_graph.node_xhigh(from_node); i++)
cblock_counted[i] = false; cblock_counted[i] = false;
} else { /* CHANY */ } else { /* CHANY */
for (j = device_ctx.rr_nodes[from_node].ylow(); j <= device_ctx.rr_nodes[from_node].yhigh(); for (j = device_ctx.rr_graph.node_ylow(from_node); j <= device_ctx.rr_graph.node_yhigh(from_node);
j++) j++)
cblock_counted[j] = false; cblock_counted[j] = false;
} }
@ -467,8 +462,8 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
max_inputs_to_cblock, trans_sram_bit); max_inputs_to_cblock, trans_sram_bit);
free(cblock_counted); free(cblock_counted);
free(num_inputs_to_cblock); num_inputs_to_cblock.clear();
free(chan_node_switch_done); chan_node_switch_done.clear();
ntrans += input_cblock_trans; ntrans += input_cblock_trans;
@ -477,7 +472,7 @@ void count_unidir_routing_transistors(std::vector<t_segment_inf>& /*segment_inf*
VTR_LOG("\tTotal routing area: %#g, per logic tile: %#g\n", ntrans, ntrans / (float)(device_ctx.grid.width() * device_ctx.grid.height())); VTR_LOG("\tTotal routing area: %#g, per logic tile: %#g\n", ntrans, ntrans / (float)(device_ctx.grid.width() * device_ctx.grid.height()));
} }
static float get_cblock_trans(int* num_inputs_to_cblock, int wire_to_ipin_switch, int max_inputs_to_cblock, float trans_sram_bit) { static float get_cblock_trans(const vtr::vector<RRNodeId, int>& num_inputs_to_cblock, int wire_to_ipin_switch, int max_inputs_to_cblock, float trans_sram_bit) {
/* Computes the transistors in the input connection block multiplexers and * /* Computes the transistors in the input connection block multiplexers and *
* the buffers from connection block outputs to the logic block input pins. * * the buffers from connection block outputs to the logic block input pins. *
* For speed, I precompute the number of transistors in the multiplexers of * * For speed, I precompute the number of transistors in the multiplexers of *
@ -505,7 +500,7 @@ static float get_cblock_trans(int* num_inputs_to_cblock, int wire_to_ipin_switch
trans_count = 0.; trans_count = 0.;
for (size_t i = 0; i < device_ctx.rr_nodes.size(); i++) { for (const RRNodeId& i : device_ctx.rr_graph.nodes()) {
num_inputs = num_inputs_to_cblock[i]; num_inputs = num_inputs_to_cblock[i];
trans_count += trans_per_cblock[num_inputs]; trans_count += trans_per_cblock[num_inputs];
} }

View File

@ -6,20 +6,20 @@
#include "globals.h" #include "globals.h"
#include "rr_graph_util.h" #include "rr_graph_util.h"
int seg_index_of_cblock(t_rr_type from_rr_type, int to_node) { int seg_index_of_cblock(t_rr_type from_rr_type, const RRNodeId& to_node) {
/* Returns the segment number (distance along the channel) of the connection * /* Returns the segment number (distance along the channel) of the connection *
* box from from_rr_type (CHANX or CHANY) to to_node (IPIN). */ * box from from_rr_type (CHANX or CHANY) to to_node (IPIN). */
auto& device_ctx = g_vpr_ctx.device(); auto& device_ctx = g_vpr_ctx.device();
if (from_rr_type == CHANX) if (from_rr_type == CHANX)
return (device_ctx.rr_nodes[to_node].xlow()); return (device_ctx.rr_graph.node_xlow(to_node));
else else
/* CHANY */ /* CHANY */
return (device_ctx.rr_nodes[to_node].ylow()); return (device_ctx.rr_graph.node_ylow(to_node));
} }
int seg_index_of_sblock(int from_node, int to_node) { int seg_index_of_sblock(const RRNodeId& from_node, const RRNodeId& to_node) {
/* Returns the segment number (distance along the channel) of the switch box * /* Returns the segment number (distance along the channel) of the switch box *
* box from from_node (CHANX or CHANY) to to_node (CHANX or CHANY). The * * box from from_node (CHANX or CHANY) to to_node (CHANX or CHANY). The *
* switch box on the left side of a CHANX segment at (i,j) has seg_index = * * switch box on the left side of a CHANX segment at (i,j) has seg_index = *
@ -31,47 +31,47 @@ int seg_index_of_sblock(int from_node, int to_node) {
auto& device_ctx = g_vpr_ctx.device(); auto& device_ctx = g_vpr_ctx.device();
from_rr_type = device_ctx.rr_nodes[from_node].type(); from_rr_type = device_ctx.rr_graph.node_type(from_node);
to_rr_type = device_ctx.rr_nodes[to_node].type(); to_rr_type = device_ctx.rr_graph.node_type(to_node);
if (from_rr_type == CHANX) { if (from_rr_type == CHANX) {
if (to_rr_type == CHANY) { if (to_rr_type == CHANY) {
return (device_ctx.rr_nodes[to_node].xlow()); return (device_ctx.rr_graph.node_xlow(to_node));
} else if (to_rr_type == CHANX) { } else if (to_rr_type == CHANX) {
if (device_ctx.rr_nodes[to_node].xlow() > device_ctx.rr_nodes[from_node].xlow()) { /* Going right */ if (device_ctx.rr_graph.node_xlow(to_node) > device_ctx.rr_graph.node_xlow(from_node)) { /* Going right */
return (device_ctx.rr_nodes[from_node].xhigh()); return (device_ctx.rr_graph.node_xhigh(from_node));
} else { /* Going left */ } else { /* Going left */
return (device_ctx.rr_nodes[to_node].xhigh()); return (device_ctx.rr_graph.node_xhigh(to_node));
} }
} else { } else {
VPR_FATAL_ERROR(VPR_ERROR_ROUTE, VPR_FATAL_ERROR(VPR_ERROR_ROUTE,
"in seg_index_of_sblock: to_node %d is of type %d.\n", "in seg_index_of_sblock: to_node %ld is of type %d.\n",
to_node, to_rr_type); size_t(to_node), to_rr_type);
return OPEN; //Should not reach here once thrown return OPEN; //Should not reach here once thrown
} }
} }
/* End from_rr_type is CHANX */ /* End from_rr_type is CHANX */
else if (from_rr_type == CHANY) { else if (from_rr_type == CHANY) {
if (to_rr_type == CHANX) { if (to_rr_type == CHANX) {
return (device_ctx.rr_nodes[to_node].ylow()); return (device_ctx.rr_graph.node_ylow(to_node));
} else if (to_rr_type == CHANY) { } else if (to_rr_type == CHANY) {
if (device_ctx.rr_nodes[to_node].ylow() > device_ctx.rr_nodes[from_node].ylow()) { /* Going up */ if (device_ctx.rr_graph.node_ylow(to_node) > device_ctx.rr_graph.node_ylow(from_node)) { /* Going up */
return (device_ctx.rr_nodes[from_node].yhigh()); return (device_ctx.rr_graph.node_yhigh(from_node));
} else { /* Going down */ } else { /* Going down */
return (device_ctx.rr_nodes[to_node].yhigh()); return (device_ctx.rr_graph.node_yhigh(to_node));
} }
} else { } else {
VPR_FATAL_ERROR(VPR_ERROR_ROUTE, VPR_FATAL_ERROR(VPR_ERROR_ROUTE,
"in seg_index_of_sblock: to_node %d is of type %d.\n", "in seg_index_of_sblock: to_node %ld is of type %d.\n",
to_node, to_rr_type); size_t(to_node), to_rr_type);
return OPEN; //Should not reach here once thrown return OPEN; //Should not reach here once thrown
} }
} }
/* End from_rr_type is CHANY */ /* End from_rr_type is CHANY */
else { else {
VPR_FATAL_ERROR(VPR_ERROR_ROUTE, VPR_FATAL_ERROR(VPR_ERROR_ROUTE,
"in seg_index_of_sblock: from_node %d is of type %d.\n", "in seg_index_of_sblock: from_node %ld is of type %d.\n",
from_node, from_rr_type); size_t(from_node), from_rr_type);
return OPEN; //Should not reach here once thrown return OPEN; //Should not reach here once thrown
} }
} }

View File

@ -1,8 +1,8 @@
#ifndef RR_GRAPH_UTIL_H #ifndef RR_GRAPH_UTIL_H
#define RR_GRAPH_UTIL_H #define RR_GRAPH_UTIL_H
int seg_index_of_cblock(t_rr_type from_rr_type, int to_node); int seg_index_of_cblock(t_rr_type from_rr_type, const RRNodeId& to_node);
int seg_index_of_sblock(int from_node, int to_node); int seg_index_of_sblock(const RRNodeId& from_node, const RRNodeId& to_node);
#endif #endif