“…Blocking instructions are also supported with minor modification. CAS cas0(clk, net[0], net [1], net [4], net [5]); 29 CAS cas1(clk, net[2], net [3], net [6], net [7]); 30 31 CAS cas2(clk, net [4], net [7], net [8], net [11]); 32 CAS cas3(clk, net [5], net [6], net [9], net [10]); 33 34 CAS cas4(clk, net [8], net [9], net [12], net [13]); 35 CAS cas5(clk, net [10], net [11], net [14], net [15]); 36 37 // Assigning input and output to wires in the sorting network 38 // (only using 1 input and 1 output reg. for this instruction) 39 for (i=0; i<4; i=i+i) assign net[i]=in_vdata1[32*(i+1)-1-:32]; 40 assign out_vdata1={net [12], net [13], net [14], net [15]}; The example instruction implementation in Algorithm 1 is a bitonic sorter of 4 inputs.…”