/*
|
/*
|
Asynchronous SDM NoC
|
Asynchronous SDM NoC
|
(C)2011 Wei Song
|
(C)2011 Wei Song
|
Advanced Processor Technologies Group
|
Advanced Processor Technologies Group
|
Computer Science, the Univ. of Manchester, UK
|
Computer Science, the Univ. of Manchester, UK
|
|
|
Authors:
|
Authors:
|
Wei Song wsong83@gmail.com
|
Wei Song wsong83@gmail.com
|
|
|
License: LGPL 3.0 or later
|
License: LGPL 3.0 or later
|
|
|
The port driver between NI and router.
|
The port driver between NI and router.
|
|
|
History:
|
History:
|
27/04/2010 Initial version. <wsong83@gmail.com>
|
27/04/2010 Initial version. <wsong83@gmail.com>
|
16/10/2010 Support SDM. <wsong83@gmail.com>
|
16/10/2010 Support SDM. <wsong83@gmail.com>
|
31/05/2011 Remove the sc_unit datatype to support data width larger than 64. <wsong83@gmail.com>
|
31/05/2011 Remove the sc_unit datatype to support data width larger than 64. <wsong83@gmail.com>
|
|
|
*/
|
*/
|
|
|
#include "rtdriver.h"
|
#include "rtdriver.h"
|
|
|
RTDriver::RTDriver(sc_module_name mname)
|
RTDriver::RTDriver(sc_module_name mname)
|
: sc_module(mname),
|
: sc_module(mname),
|
NI2P("NI2P"),
|
NI2P("NI2P"),
|
P2NI("P2NI")
|
P2NI("P2NI")
|
{
|
{
|
SC_METHOD(IPdetect);
|
SC_METHOD(IPdetect);
|
sensitive << rtia;
|
sensitive << rtia;
|
|
|
SC_METHOD(OPdetect);
|
SC_METHOD(OPdetect);
|
sensitive << rtod[0] << rtod[1] << rtod[2] << rtod[3] << rtod4;
|
sensitive << rtod[0] << rtod[1] << rtod[2] << rtod[3] << rtod4;
|
|
|
SC_THREAD(send);
|
SC_THREAD(send);
|
SC_THREAD(recv);
|
SC_THREAD(recv);
|
|
|
rtinp_sig = false;
|
rtinp_sig = false;
|
rtoutp_sig = false;
|
rtoutp_sig = false;
|
}
|
}
|
|
|
void RTDriver::IPdetect() {
|
void RTDriver::IPdetect() {
|
sc_logic ack_lv_high, ack_lv_low; // the sc_logic ack
|
sc_logic ack_lv_high, ack_lv_low; // the sc_logic ack
|
|
|
// read the ack
|
// read the ack
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
ack_lv_high = rtia.read().and_reduce();
|
ack_lv_high = rtia.read().and_reduce();
|
ack_lv_low = rtia.read().or_reduce();
|
ack_lv_low = rtia.read().or_reduce();
|
#else
|
#else
|
ack_lv_high = rtia.read();
|
ack_lv_high = rtia.read();
|
ack_lv_low = rtia.read();
|
ack_lv_low = rtia.read();
|
#endif
|
#endif
|
|
|
if(ack_lv_high.is_01() && ack_lv_high.to_bool())
|
if(ack_lv_high.is_01() && ack_lv_high.to_bool())
|
rtinp_sig = true;
|
rtinp_sig = true;
|
|
|
if(ack_lv_low.is_01() && (!ack_lv_low.to_bool()))
|
if(ack_lv_low.is_01() && (!ack_lv_low.to_bool()))
|
rtinp_sig = false;
|
rtinp_sig = false;
|
}
|
}
|
|
|
void RTDriver::OPdetect() {
|
void RTDriver::OPdetect() {
|
sc_lv<ChBW*4> data_lv; // the ORed data
|
sc_lv<ChBW*4> data_lv; // the ORed data
|
sc_logic data_lv_high, data_lv_low;
|
sc_logic data_lv_high, data_lv_low;
|
|
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
data_lv = rtod[0].read() | rtod[1].read() | rtod[2].read() | rtod[3].read() | rtod4.read();
|
data_lv = rtod[0].read() | rtod[1].read() | rtod[2].read() | rtod[3].read() | rtod4.read();
|
data_lv_high = data_lv.and_reduce();
|
data_lv_high = data_lv.and_reduce();
|
data_lv_low = data_lv.or_reduce();
|
data_lv_low = data_lv.or_reduce();
|
#else
|
#else
|
data_lv = rtod[0].read() | rtod[1].read() | rtod[2].read() | rtod[3].read();
|
data_lv = rtod[0].read() | rtod[1].read() | rtod[2].read() | rtod[3].read();
|
data_lv_high = data_lv.and_reduce() | rtod4.read();
|
data_lv_high = data_lv.and_reduce() | rtod4.read();
|
data_lv_low = data_lv.or_reduce() | rtod4.read();
|
data_lv_low = data_lv.or_reduce() | rtod4.read();
|
#endif
|
#endif
|
|
|
if(data_lv_high.is_01() && data_lv_high.to_bool())
|
if(data_lv_high.is_01() && data_lv_high.to_bool())
|
rtoutp_sig = true;
|
rtoutp_sig = true;
|
|
|
if(data_lv_high.is_01() && (!data_lv_low.to_bool()))
|
if(data_lv_high.is_01() && (!data_lv_low.to_bool()))
|
rtoutp_sig = false;
|
rtoutp_sig = false;
|
}
|
}
|
|
|
void RTDriver::send() {
|
void RTDriver::send() {
|
FLIT mflit; // the local flit buffer
|
FLIT mflit; // the local flit buffer
|
unsigned int i, j; // local loop index
|
unsigned int i, j; // local loop index
|
sc_lv<ChBW*4> mdata[4]; // local data copy
|
sc_lv<ChBW*4> mdata[4]; // local data copy
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
sc_lv<ChBW*4> mdata4; // local copy of eof
|
sc_lv<ChBW*4> mdata4; // local copy of eof
|
#else
|
#else
|
sc_logic mdata4; // local copy of eof
|
sc_logic mdata4; // local copy of eof
|
#endif
|
#endif
|
|
|
// initialize the output ports
|
// initialize the output ports
|
mdata[0] = 0;
|
mdata[0] = 0;
|
mdata[1] = 0;
|
mdata[1] = 0;
|
mdata[2] = 0;
|
mdata[2] = 0;
|
mdata[3] = 0;
|
mdata[3] = 0;
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
mdata4 = 0;
|
mdata4 = 0;
|
#else
|
#else
|
mdata4 = false;
|
mdata4 = false;
|
#endif
|
#endif
|
|
|
rtid[0].write(mdata[0]);
|
rtid[0].write(mdata[0]);
|
rtid[1].write(mdata[1]);
|
rtid[1].write(mdata[1]);
|
rtid[2].write(mdata[2]);
|
rtid[2].write(mdata[2]);
|
rtid[3].write(mdata[3]);
|
rtid[3].write(mdata[3]);
|
rtid4.write(mdata4);
|
rtid4.write(mdata4);
|
|
|
while(true) {
|
while(true) {
|
mflit = NI2P->read(); // read in the flit
|
mflit = NI2P->read(); // read in the flit
|
|
|
// write the flit
|
// write the flit
|
if(mflit.ftype == F_HD) {
|
if(mflit.ftype == F_HD) {
|
// the target address
|
// the target address
|
mdata[mflit.addrx&0x3][0] = SC_LOGIC_1;
|
mdata[mflit.addrx&0x3][0] = SC_LOGIC_1;
|
mdata[(mflit.addrx&0xc)>>2][1] = SC_LOGIC_1;
|
mdata[(mflit.addrx&0xc)>>2][1] = SC_LOGIC_1;
|
mdata[mflit.addry&0x3][2] = SC_LOGIC_1;
|
mdata[mflit.addry&0x3][2] = SC_LOGIC_1;
|
mdata[(mflit.addry&0xc)>>2][3] = SC_LOGIC_1;
|
mdata[(mflit.addry&0xc)>>2][3] = SC_LOGIC_1;
|
|
|
for(i=0,j=4; i<(ChBW-1)*4; i++, j++) {
|
for(i=0,j=4; i<(ChBW-1)*4; i++, j++) {
|
switch((mflit[i/4] >> ((i%4)*2)) & 0x3) {
|
switch((mflit[i/4] >> ((i%4)*2)) & 0x3) {
|
case 0: mdata[0][j] = SC_LOGIC_1; break;
|
case 0: mdata[0][j] = SC_LOGIC_1; break;
|
case 1: mdata[1][j] = SC_LOGIC_1; break;
|
case 1: mdata[1][j] = SC_LOGIC_1; break;
|
case 2: mdata[2][j] = SC_LOGIC_1; break;
|
case 2: mdata[2][j] = SC_LOGIC_1; break;
|
case 3: mdata[3][j] = SC_LOGIC_1; break;
|
case 3: mdata[3][j] = SC_LOGIC_1; break;
|
}
|
}
|
}
|
}
|
} else {
|
} else {
|
for(i=0; i<ChBW*4; i++) {
|
for(i=0; i<ChBW*4; i++) {
|
switch((mflit[i/4] >> ((i%4)*2)) & 0x3) {
|
switch((mflit[i/4] >> ((i%4)*2)) & 0x3) {
|
case 0: mdata[0][i] = SC_LOGIC_1; break;
|
case 0: mdata[0][i] = SC_LOGIC_1; break;
|
case 1: mdata[1][i] = SC_LOGIC_1; break;
|
case 1: mdata[1][i] = SC_LOGIC_1; break;
|
case 2: mdata[2][i] = SC_LOGIC_1; break;
|
case 2: mdata[2][i] = SC_LOGIC_1; break;
|
case 3: mdata[3][i] = SC_LOGIC_1; break;
|
case 3: mdata[3][i] = SC_LOGIC_1; break;
|
}
|
}
|
}
|
}
|
}
|
}
|
|
|
// write to the port
|
// write to the port
|
rtid[0].write(mdata[0]);
|
rtid[0].write(mdata[0]);
|
rtid[1].write(mdata[1]);
|
rtid[1].write(mdata[1]);
|
rtid[2].write(mdata[2]);
|
rtid[2].write(mdata[2]);
|
rtid[3].write(mdata[3]);
|
rtid[3].write(mdata[3]);
|
|
|
// wait for the router to capture the data
|
// wait for the router to capture the data
|
wait(rtinp_sig.posedge_event());
|
wait(rtinp_sig.posedge_event());
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
|
|
// clear the data
|
// clear the data
|
mdata[0] = 0;
|
mdata[0] = 0;
|
mdata[1] = 0;
|
mdata[1] = 0;
|
mdata[2] = 0;
|
mdata[2] = 0;
|
mdata[3] = 0;
|
mdata[3] = 0;
|
|
|
rtid[0].write(mdata[0]);
|
rtid[0].write(mdata[0]);
|
rtid[1].write(mdata[1]);
|
rtid[1].write(mdata[1]);
|
rtid[2].write(mdata[2]);
|
rtid[2].write(mdata[2]);
|
rtid[3].write(mdata[3]);
|
rtid[3].write(mdata[3]);
|
|
|
// wait for the input port be ready again
|
// wait for the input port be ready again
|
wait(rtinp_sig.negedge_event());
|
wait(rtinp_sig.negedge_event());
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
|
|
// check whether a tailf flit is needed
|
// check whether a tailf flit is needed
|
if(mflit.ftype == F_TL) {
|
if(mflit.ftype == F_TL) {
|
// write the eof
|
// write the eof
|
rtid4.write(~mdata4);
|
rtid4.write(~mdata4);
|
|
|
// wait for the router to capture the data
|
// wait for the router to capture the data
|
wait(rtinp_sig.posedge_event());
|
wait(rtinp_sig.posedge_event());
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
|
|
// clear the eof
|
// clear the eof
|
rtid4.write(mdata4);
|
rtid4.write(mdata4);
|
|
|
// wait for the input port be ready again
|
// wait for the input port be ready again
|
wait(rtinp_sig.negedge_event());
|
wait(rtinp_sig.negedge_event());
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
}
|
}
|
}
|
}
|
}
|
}
|
|
|
void RTDriver::recv() {
|
void RTDriver::recv() {
|
FLIT mflit; // the local flit buffer
|
FLIT mflit; // the local flit buffer
|
sc_lv<ChBW*4> mdata[4]; // local data copy
|
sc_lv<ChBW*4> mdata[4]; // local data copy
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
sc_lv<ChBW*4> mdata4; // local copy of eof
|
sc_lv<ChBW*4> mdata4; // local copy of eof
|
sc_lv<ChBW*4> mack = 0; // local copy of ack
|
sc_lv<ChBW*4> mack = 0; // local copy of ack
|
#else
|
#else
|
sc_logic mdata4; // local copy of eof
|
sc_logic mdata4; // local copy of eof
|
sc_logic mack = SC_LOGIC_0; // local copy of ack
|
sc_logic mack = SC_LOGIC_0; // local copy of ack
|
#endif
|
#endif
|
sc_lv<4> dd; // the current 1-of-4 data under process
|
sc_lv<4> dd; // the current 1-of-4 data under process
|
unsigned int i, j; // local loop index
|
unsigned int i, j; // local loop index
|
|
|
bool is_hd = true; // the current flit is a header flit
|
bool is_hd = true; // the current flit is a header flit
|
|
|
// initialize the ack signal
|
// initialize the ack signal
|
rtoa.write(mack);
|
rtoa.write(mack);
|
|
|
while(true) {
|
while(true) {
|
// clear the flit
|
// clear the flit
|
mflit.clear();
|
mflit.clear();
|
|
|
// wait for an incoming flit
|
// wait for an incoming flit
|
wait(rtoutp_sig.posedge_event());
|
wait(rtoutp_sig.posedge_event());
|
|
|
// analyse the flit
|
// analyse the flit
|
mdata[0] = rtod[0].read();
|
mdata[0] = rtod[0].read();
|
mdata[1] = rtod[1].read();
|
mdata[1] = rtod[1].read();
|
mdata[2] = rtod[2].read();
|
mdata[2] = rtod[2].read();
|
mdata[3] = rtod[3].read();
|
mdata[3] = rtod[3].read();
|
mdata4 = rtod4.read();
|
mdata4 = rtod4.read();
|
|
|
if(is_hd) {
|
if(is_hd) {
|
mflit.ftype = F_HD;
|
mflit.ftype = F_HD;
|
is_hd = false;
|
is_hd = false;
|
}
|
}
|
#ifdef ENABLE_CHANNEL_CLISING
|
#ifdef ENABLE_CHANNEL_CLISING
|
else if(mdata4[0].to_bool()) {
|
else if(mdata4[0].to_bool()) {
|
mflit.ftype = F_TL;
|
mflit.ftype = F_TL;
|
is_hd = true;
|
is_hd = true;
|
}
|
}
|
#else
|
#else
|
else if(mdata4.to_bool()) {
|
else if(mdata4.to_bool()) {
|
mflit.ftype = F_TL;
|
mflit.ftype = F_TL;
|
is_hd = true;
|
is_hd = true;
|
}
|
}
|
#endif
|
#endif
|
else {
|
else {
|
mflit.ftype = F_DAT;
|
mflit.ftype = F_DAT;
|
}
|
}
|
|
|
if(mflit.ftype == F_HD) {
|
if(mflit.ftype == F_HD) {
|
// fetch the address
|
// fetch the address
|
dd[0] = mdata[0][0]; dd[1] = mdata[1][0]; dd[2] = mdata[2][0]; dd[3] = mdata[3][0];
|
dd[0] = mdata[0][0]; dd[1] = mdata[1][0]; dd[2] = mdata[2][0]; dd[3] = mdata[3][0];
|
mflit.addrx |= (c1o42b(dd.to_uint()) << 0);
|
mflit.addrx |= (c1o42b(dd.to_uint()) << 0);
|
dd[0] = mdata[0][1]; dd[1] = mdata[1][1]; dd[2] = mdata[2][1]; dd[3] = mdata[3][1];
|
dd[0] = mdata[0][1]; dd[1] = mdata[1][1]; dd[2] = mdata[2][1]; dd[3] = mdata[3][1];
|
mflit.addrx |= (c1o42b(dd.to_uint()) << 2);
|
mflit.addrx |= (c1o42b(dd.to_uint()) << 2);
|
dd[0] = mdata[0][2]; dd[1] = mdata[1][2]; dd[2] = mdata[2][2]; dd[3] = mdata[3][2];
|
dd[0] = mdata[0][2]; dd[1] = mdata[1][2]; dd[2] = mdata[2][2]; dd[3] = mdata[3][2];
|
mflit.addry |= (c1o42b(dd.to_uint()) << 0);
|
mflit.addry |= (c1o42b(dd.to_uint()) << 0);
|
dd[0] = mdata[0][3]; dd[1] = mdata[1][3]; dd[2] = mdata[2][3]; dd[3] = mdata[3][3];
|
dd[0] = mdata[0][3]; dd[1] = mdata[1][3]; dd[2] = mdata[2][3]; dd[3] = mdata[3][3];
|
mflit.addry |= (c1o42b(dd.to_uint()) << 2);
|
mflit.addry |= (c1o42b(dd.to_uint()) << 2);
|
|
|
// fill in data
|
// fill in data
|
for(i=1; i<ChBW; i++) {
|
for(i=1; i<ChBW; i++) {
|
for(j=0; j<4; j++) {
|
for(j=0; j<4; j++) {
|
dd[0] = mdata[0][i*4+j];
|
dd[0] = mdata[0][i*4+j];
|
dd[1] = mdata[1][i*4+j];
|
dd[1] = mdata[1][i*4+j];
|
dd[2] = mdata[2][i*4+j];
|
dd[2] = mdata[2][i*4+j];
|
dd[3] = mdata[3][i*4+j];
|
dd[3] = mdata[3][i*4+j];
|
mflit[i-1] |= c1o42b(dd.to_uint()) << j*2;
|
mflit[i-1] |= c1o42b(dd.to_uint()) << j*2;
|
}
|
}
|
}
|
}
|
} else if (mflit.ftype != F_TL) {
|
} else if (mflit.ftype != F_TL) {
|
// fill in data
|
// fill in data
|
for(i=0; i<ChBW; i++) {
|
for(i=0; i<ChBW; i++) {
|
for(j=0; j<4; j++) {
|
for(j=0; j<4; j++) {
|
dd[0] = mdata[0][i*4+j];
|
dd[0] = mdata[0][i*4+j];
|
dd[1] = mdata[1][i*4+j];
|
dd[1] = mdata[1][i*4+j];
|
dd[2] = mdata[2][i*4+j];
|
dd[2] = mdata[2][i*4+j];
|
dd[3] = mdata[3][i*4+j];
|
dd[3] = mdata[3][i*4+j];
|
mflit[i] |= c1o42b(dd.to_uint()) << j*2;
|
mflit[i] |= c1o42b(dd.to_uint()) << j*2;
|
}
|
}
|
}
|
}
|
}
|
}
|
|
|
// send the flit to the NI
|
// send the flit to the NI
|
P2NI->write(mflit);
|
P2NI->write(mflit);
|
|
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
rtoa.write(~mack); // notify that data is captured
|
rtoa.write(~mack); // notify that data is captured
|
|
|
// wait for the data withdrawal
|
// wait for the data withdrawal
|
wait(rtoutp_sig.negedge_event());
|
wait(rtoutp_sig.negedge_event());
|
wait(0.2, SC_NS); // a delay to avoid data override
|
wait(0.2, SC_NS); // a delay to avoid data override
|
rtoa.write(mack); // notify that data is captured
|
rtoa.write(mack); // notify that data is captured
|
|
|
}
|
}
|
}
|
}
|
|
|
unsigned int RTDriver::c1o42b(unsigned int dd) {
|
unsigned int RTDriver::c1o42b(unsigned int dd) {
|
switch(dd) {
|
switch(dd) {
|
case 1: return 0;
|
case 1: return 0;
|
case 2: return 1;
|
case 2: return 1;
|
case 4: return 2;
|
case 4: return 2;
|
case 8: return 3;
|
case 8: return 3;
|
default: return 0xff;
|
default: return 0xff;
|
}
|
}
|
}
|
}
|
|
|