You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

468 lines
15 KiB
Verilog

// © IBM Corp. 2020
// Licensed under the Apache License, Version 2.0 (the "License"), as modified by
// the terms below; you may not use the files in this repository except in
// compliance with the License as modified.
// You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0
//
// Modified Terms:
//
// 1) For the purpose of the patent license granted to you in Section 3 of the
// License, the "Work" hereby includes implementations of the work of authorship
// in physical form.
//
// 2) Notwithstanding any terms to the contrary in the License, any licenses
// necessary for implementation of the Work that are available from OpenPOWER
// via the Power ISA End User License Agreement (EULA) are explicitly excluded
// hereunder, and may be obtained from OpenPOWER under the terms and conditions
// of the EULA.
//
// Unless required by applicable law or agreed to in writing, the reference design
// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License
// for the specific language governing permissions and limitations under the License.
//
// Additional rights, including the ability to physically implement a softcore that
// is compliant with the required sections of the Power ISA Specification, are
// available at no cost under the terms of the OpenPOWER Power ISA EULA, which can be
// obtained (along with the Power ISA) here: https://openpowerfoundation.org.
`timescale 1 ns / 1 ns
//*****************************************************************************
// Description: XU Population Count
//
//*****************************************************************************
`include "tri_a2o.vh"
module tri_st_popcnt(
clk,
rst,
vdd,
gnd,
delay_lclkr_dc,
mpw1_dc_b,
mpw2_dc_b,
d_mode_dc,
func_sl_force,
func_sl_thold_0_b,
sg_0,
scan_in,
scan_out,
ex1_act,
ex1_instr,
ex2_popcnt_rs1,
ex4_popcnt_rt
);
//-------------------------------------------------------------------
// Clocks & Power
//-------------------------------------------------------------------
input clk;
input rst;
inout vdd;
inout gnd;
//-------------------------------------------------------------------
// Pervasive
//-------------------------------------------------------------------
input delay_lclkr_dc;
input mpw1_dc_b;
input mpw2_dc_b;
input d_mode_dc;
input func_sl_force;
input func_sl_thold_0_b;
input sg_0;
(* pin_data="PIN_FUNCTION=/SCAN_IN/" *) // scan_in
input scan_in;
(* pin_data="PIN_FUNCTION=/SCAN_OUT/" *) // scan_out
output scan_out;
input ex1_act;
input [22:23] ex1_instr;
input [0:63] ex2_popcnt_rs1;
output [0:63] ex4_popcnt_rt;
// Latches
wire [2:3] exx_act_q; // input=>exx_act_d ,act=>1
wire [2:3] exx_act_d;
wire [22:23] ex2_instr_q; // input=>ex1_instr ,act=>exx_act(1)
wire [0:2] ex3_popcnt_sel_q; // input=>ex2_popcnt_sel ,act=>exx_act(2)
wire [0:2] ex2_popcnt_sel;
wire [0:7] ex3_b3_q; // input=>ex2_b3 ,act=>exx_act(2)
wire [0:7] ex2_b3;
wire [0:7] ex3_b2_q; // input=>ex2_b2 ,act=>exx_act(2)
wire [0:7] ex2_b2;
wire [0:7] ex3_b1_q; // input=>ex2_b1 ,act=>exx_act(2)
wire [0:7] ex2_b1;
wire [0:7] ex3_b0_q; // input=>ex2_b0 ,act=>exx_act(2)
wire [0:7] ex2_b0;
wire [0:7] ex4_b3_q; // input=>ex3_b3_q ,act=>exx_act(3)
wire [0:7] ex4_b2_q; // input=>ex3_b2_q ,act=>exx_act(3)
wire [0:7] ex4_b1_q; // input=>ex3_b1_q ,act=>exx_act(3)
wire [0:7] ex4_b0_q; // input=>ex3_b0_q ,act=>exx_act(3)
wire [0:5] ex4_word0_q; // input=>ex3_word0 ,act=>exx_act(3)
wire [0:5] ex3_word0;
wire [0:5] ex4_word1_q; // input=>ex3_word1 ,act=>exx_act(3)
wire [0:5] ex3_word1;
wire [0:2] ex4_popcnt_sel_q; // input=>ex3_popcnt_sel_q ,act=>exx_act(3)
// Scanchain
parameter exx_act_offset = 0;
parameter ex2_instr_offset = exx_act_offset + 2;
parameter ex3_popcnt_sel_offset = ex2_instr_offset + 2;
parameter ex3_b3_offset = ex3_popcnt_sel_offset + 3;
parameter ex3_b2_offset = ex3_b3_offset + 8;
parameter ex3_b1_offset = ex3_b2_offset + 8;
parameter ex3_b0_offset = ex3_b1_offset + 8;
parameter ex4_b3_offset = ex3_b0_offset + 8;
parameter ex4_b2_offset = ex4_b3_offset + 8;
parameter ex4_b1_offset = ex4_b2_offset + 8;
parameter ex4_b0_offset = ex4_b1_offset + 8;
parameter ex4_word0_offset = ex4_b0_offset + 8;
parameter ex4_word1_offset = ex4_word0_offset + 6;
parameter ex4_popcnt_sel_offset = ex4_word1_offset + 6;
parameter scan_right = ex4_popcnt_sel_offset + 3;
wire [0:scan_right-1] siv;
wire [0:scan_right-1] sov;
// Signals
wire [0:63] ex4_popcnt_byte;
wire [0:63] ex4_popcnt_word;
wire [0:63] ex4_popcnt_dword;
wire [1:3] exx_act;
assign exx_act_d[2:3] = exx_act[1:2];
assign exx_act[1:3] = {ex1_act, exx_act_q[2:3]};
generate
genvar i;
for (i = 0; i <= 7; i = i + 1)
begin : byte_gen
tri_st_popcnt_byte bytes(
.b0(ex2_popcnt_rs1[8*i:8*i+7]),
.y({ex2_b3[i],ex2_b2[i],ex2_b1[i],ex2_b0[i]}),
.vdd(vdd),
.gnd(gnd)
);
assign ex4_popcnt_byte[8*i+0:8*i+3] = 0;
assign ex4_popcnt_byte[8*i+4] = ex4_b3_q[i];
assign ex4_popcnt_byte[8*i+5] = ex4_b2_q[i];
assign ex4_popcnt_byte[8*i+6] = ex4_b1_q[i];
assign ex4_popcnt_byte[8*i+7] = ex4_b0_q[i];
end
endgenerate
tri_st_popcnt_word word0(
.b0(ex3_b0_q[0:3]),
.b1(ex3_b1_q[0:3]),
.b2(ex3_b2_q[0:3]),
.b3(ex3_b3_q[0:3]),
.y(ex3_word0),
.vdd(vdd),
.gnd(gnd)
);
tri_st_popcnt_word word1(
.b0(ex3_b0_q[4:7]),
.b1(ex3_b1_q[4:7]),
.b2(ex3_b2_q[4:7]),
.b3(ex3_b3_q[4:7]),
.y(ex3_word1),
.vdd(vdd),
.gnd(gnd)
);
assign ex4_popcnt_word[00:25] = {26{1'b0}};
assign ex4_popcnt_word[26:31] = ex4_word0_q;
assign ex4_popcnt_word[32:57] = {26{1'b0}};
assign ex4_popcnt_word[58:63] = ex4_word1_q;
assign ex4_popcnt_dword[00:56] = {57{1'b0}};
assign ex4_popcnt_dword[57:63] = {1'b0, ex4_word0_q} + {1'b0, ex4_word1_q};
assign ex2_popcnt_sel[0] = (ex2_instr_q == 2'b00) ? 1'b1 : 1'b0;
assign ex2_popcnt_sel[1] = (ex2_instr_q == 2'b10) ? 1'b1 : 1'b0;
assign ex2_popcnt_sel[2] = (ex2_instr_q == 2'b11) ? 1'b1 : 1'b0;
assign ex4_popcnt_rt = (ex4_popcnt_byte & {64{ex4_popcnt_sel_q[0]}}) |
(ex4_popcnt_word & {64{ex4_popcnt_sel_q[1]}}) |
(ex4_popcnt_dword & {64{ex4_popcnt_sel_q[2]}});
//-------------------------------------------------------------------
// Latch instances
//-------------------------------------------------------------------
tri_rlmreg_p #(.WIDTH(2), .INIT(0), .NEEDS_SRESET(1)) exx_act_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(1'b1),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[exx_act_offset:exx_act_offset + 2 - 1]),
.scout(sov[exx_act_offset:exx_act_offset + 2 - 1]),
.din(exx_act_d),
.dout(exx_act_q)
);
tri_rlmreg_p #(.WIDTH(2), .INIT(0), .NEEDS_SRESET(1)) ex2_instr_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[1]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex2_instr_offset:ex2_instr_offset + 2 - 1]),
.scout(sov[ex2_instr_offset:ex2_instr_offset + 2 - 1]),
.din(ex1_instr),
.dout(ex2_instr_q)
);
tri_rlmreg_p #(.WIDTH(3), .INIT(0), .NEEDS_SRESET(1)) ex3_popcnt_sel_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[2]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex3_popcnt_sel_offset:ex3_popcnt_sel_offset + 3 - 1]),
.scout(sov[ex3_popcnt_sel_offset:ex3_popcnt_sel_offset + 3 - 1]),
.din(ex2_popcnt_sel),
.dout(ex3_popcnt_sel_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex3_b3_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[2]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex3_b3_offset:ex3_b3_offset + 8 - 1]),
.scout(sov[ex3_b3_offset:ex3_b3_offset + 8 - 1]),
.din(ex2_b3),
.dout(ex3_b3_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex3_b2_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[2]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex3_b2_offset:ex3_b2_offset + 8 - 1]),
.scout(sov[ex3_b2_offset:ex3_b2_offset + 8 - 1]),
.din(ex2_b2),
.dout(ex3_b2_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex3_b1_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[2]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex3_b1_offset:ex3_b1_offset + 8 - 1]),
.scout(sov[ex3_b1_offset:ex3_b1_offset + 8 - 1]),
.din(ex2_b1),
.dout(ex3_b1_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex3_b0_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[2]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex3_b0_offset:ex3_b0_offset + 8 - 1]),
.scout(sov[ex3_b0_offset:ex3_b0_offset + 8 - 1]),
.din(ex2_b0),
.dout(ex3_b0_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex4_b3_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_b3_offset:ex4_b3_offset + 8 - 1]),
.scout(sov[ex4_b3_offset:ex4_b3_offset + 8 - 1]),
.din(ex3_b3_q),
.dout(ex4_b3_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex4_b2_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_b2_offset:ex4_b2_offset + 8 - 1]),
.scout(sov[ex4_b2_offset:ex4_b2_offset + 8 - 1]),
.din(ex3_b2_q),
.dout(ex4_b2_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex4_b1_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_b1_offset:ex4_b1_offset + 8 - 1]),
.scout(sov[ex4_b1_offset:ex4_b1_offset + 8 - 1]),
.din(ex3_b1_q),
.dout(ex4_b1_q)
);
tri_rlmreg_p #(.WIDTH(8), .INIT(0), .NEEDS_SRESET(1)) ex4_b0_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_b0_offset:ex4_b0_offset + 8 - 1]),
.scout(sov[ex4_b0_offset:ex4_b0_offset + 8 - 1]),
.din(ex3_b0_q),
.dout(ex4_b0_q)
);
tri_rlmreg_p #(.WIDTH(6), .INIT(0), .NEEDS_SRESET(1)) ex4_word0_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_word0_offset:ex4_word0_offset + 6 - 1]),
.scout(sov[ex4_word0_offset:ex4_word0_offset + 6 - 1]),
.din(ex3_word0),
.dout(ex4_word0_q)
);
tri_rlmreg_p #(.WIDTH(6), .INIT(0), .NEEDS_SRESET(1)) ex4_word1_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_word1_offset:ex4_word1_offset + 6 - 1]),
.scout(sov[ex4_word1_offset:ex4_word1_offset + 6 - 1]),
.din(ex3_word1),
.dout(ex4_word1_q)
);
tri_rlmreg_p #(.WIDTH(3), .INIT(0), .NEEDS_SRESET(1)) ex4_popcnt_sel_latch(
.clk(clk),
.rst(rst),
.vd(vdd),
.gd(gnd),
.act(exx_act[3]),
.force_t(func_sl_force),
.d_mode(d_mode_dc),
.delay_lclkr(delay_lclkr_dc),
.mpw1_b(mpw1_dc_b),
.mpw2_b(mpw2_dc_b),
.thold_b(func_sl_thold_0_b),
.sg(sg_0),
.scin(siv[ex4_popcnt_sel_offset:ex4_popcnt_sel_offset + 3 - 1]),
.scout(sov[ex4_popcnt_sel_offset:ex4_popcnt_sel_offset + 3 - 1]),
.din(ex3_popcnt_sel_q),
.dout(ex4_popcnt_sel_q)
);
assign siv[0:scan_right-1] = {sov[1:scan_right-1], scan_in};
assign scan_out = sov[0];
endmodule