diff options
Diffstat (limited to 'techlibs')
-rw-r--r-- | techlibs/fabulous/Makefile.inc | 10 | ||||
-rw-r--r-- | techlibs/fabulous/cells_map.v | 29 | ||||
-rw-r--r-- | techlibs/fabulous/cells_map_ff.v | 54 | ||||
-rw-r--r-- | techlibs/fabulous/ff_map.v | 26 | ||||
-rw-r--r-- | techlibs/fabulous/latches_map.v | 11 | ||||
-rw-r--r-- | techlibs/fabulous/prims.v | 335 | ||||
-rw-r--r-- | techlibs/fabulous/prims_ff.v | 575 | ||||
-rw-r--r-- | techlibs/fabulous/synth_fabulous.cc | 242 |
8 files changed, 1282 insertions, 0 deletions
diff --git a/techlibs/fabulous/Makefile.inc b/techlibs/fabulous/Makefile.inc new file mode 100644 index 000000000..eb5adc0eb --- /dev/null +++ b/techlibs/fabulous/Makefile.inc @@ -0,0 +1,10 @@ + +OBJS += techlibs/fabulous/synth_fabulous.o + +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/cells_map.v)) +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/cells_map_ff.v)) +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/prims.v)) +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/prims_ff.v)) +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/latches_map.v)) +$(eval $(call add_share_file,share/fabulous,techlibs/fabulous/ff_map.v)) + diff --git a/techlibs/fabulous/cells_map.v b/techlibs/fabulous/cells_map.v new file mode 100644 index 000000000..eadd18b6f --- /dev/null +++ b/techlibs/fabulous/cells_map.v @@ -0,0 +1,29 @@ +module \$lut (A, Y); + parameter WIDTH = 0; + parameter LUT = 0; + + input [WIDTH-1:0] A; + output Y; + + generate + if (WIDTH == 1) begin + LUT1 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0])); + + end else + if (WIDTH == 2) begin + LUT2 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1])); + + end else + if (WIDTH == 3) begin + LUT3 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1]), .I2(A[2])); + + end else + if (WIDTH == 4) begin + LUT4 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1]), .I2(A[2]), .I3(A[3])); + end else begin + wire _TECHMAP_FAIL_ = 1; + end + endgenerate +endmodule + +module \$_DFF_P_ (input D, C, output Q); LUTFF _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C)); endmodule diff --git a/techlibs/fabulous/cells_map_ff.v b/techlibs/fabulous/cells_map_ff.v new file mode 100644 index 000000000..6df001d21 --- /dev/null +++ b/techlibs/fabulous/cells_map_ff.v @@ -0,0 +1,54 @@ +module \$lut (A, Y); + parameter WIDTH = 0; + parameter LUT = 0; + + input [WIDTH-1:0] A; + output Y; + + generate + if (WIDTH == 1) begin + LUT1 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0])); + + end else + if (WIDTH == 2) begin + LUT2 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1])); + + end else + if (WIDTH == 3) begin + LUT3 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1]), .I2(A[2])); + + end else + if (WIDTH == 4) begin + LUT4 #(.INIT(LUT)) _TECHMAP_REPLACE_ (.O(Y), .I0(A[0]), .I1(A[1]), .I2(A[2]), .I3(A[3])); + end else begin + wire _TECHMAP_FAIL_ = 1; + end + endgenerate +endmodule + +/* module \$_DFF_P_ (input D, C, output Q); LUTFF _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C)); endmodule +module \$_DFF_N_ (input D, C, output Q); SB_DFFN _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C)); endmodule +module \$_DFF_P_ (input D, C, output Q); SB_DFF _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C)); endmodule + +module \$_DFFE_NP_ (input D, C, E, output Q); SB_DFFNE _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E)); endmodule +module \$_DFFE_PP_ (input D, C, E, output Q); SB_DFFE _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E)); endmodule + +module \$_DFF_NP0_ (input D, C, R, output Q); SB_DFFNR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .R(R)); endmodule +module \$_DFF_NP1_ (input D, C, R, output Q); SB_DFFNS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .S(R)); endmodule +module \$_DFF_PP0_ (input D, C, R, output Q); SB_DFFR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .R(R)); endmodule +module \$_DFF_PP1_ (input D, C, R, output Q); SB_DFFS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .S(R)); endmodule + +module \$_DFFE_NP0P_ (input D, C, E, R, output Q); SB_DFFNER _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .R(R)); endmodule +module \$_DFFE_NP1P_ (input D, C, E, R, output Q); SB_DFFNES _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .S(R)); endmodule +module \$_DFFE_PP0P_ (input D, C, E, R, output Q); SB_DFFER _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .R(R)); endmodule +module \$_DFFE_PP1P_ (input D, C, E, R, output Q); SB_DFFES _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .S(R)); endmodule + +module \$_SDFF_NP0_ (input D, C, R, output Q); SB_DFFNSR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .R(R)); endmodule +module \$_SDFF_NP1_ (input D, C, R, output Q); SB_DFFNSS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .S(R)); endmodule +module \$_SDFF_PP0_ (input D, C, R, output Q); SB_DFFSR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .R(R)); endmodule +module \$_SDFF_PP1_ (input D, C, R, output Q); SB_DFFSS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .S(R)); endmodule + +module \$_SDFFCE_NP0P_ (input D, C, E, R, output Q); SB_DFFNESR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .R(R)); endmodule +module \$_SDFFCE_NP1P_ (input D, C, E, R, output Q); SB_DFFNESS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .S(R)); endmodule +module \$_SDFFCE_PP0P_ (input D, C, E, R, output Q); SB_DFFESR _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .R(R)); endmodule +module \$_SDFFCE_PP1P_ (input D, C, E, R, output Q); SB_DFFESS _TECHMAP_REPLACE_ (.D(D), .Q(Q), .C(C), .E(E), .S(R)); endmodule */
\ No newline at end of file diff --git a/techlibs/fabulous/ff_map.v b/techlibs/fabulous/ff_map.v new file mode 100644 index 000000000..d623063c9 --- /dev/null +++ b/techlibs/fabulous/ff_map.v @@ -0,0 +1,26 @@ +module \$_DFF_P_ (input D, C, output Q); LUTFF _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C)); endmodule +//module \$_DFF_N_ (input D, C, output Q); SB_DFFN _TECHMAP_REPLACE_ (.D(D), .O(Q), .C(C)); endmodule +//module \$_DFF_P_ (input D, C, output Q); SB_DFF _TECHMAP_REPLACE_ (.D(D), .O(Q), .C(C)); endmodule + +//module \$_DFFE_NP_ (input D, C, E, output Q); SB_DFFNE _TECHMAP_REPLACE_ (.D(D), .O(Q), .C(C), .E(E)); endmodule +module \$_DFFE_PP_ (input D, C, E, output Q); LUTFF_E _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E)); endmodule + +//module \$_DFF_NP0_ (input D, C, R, output Q); SB_DFFNR _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .R(R)); endmodule +//module \$_DFF_NP1_ (input D, C, R, output Q); SB_DFFNS _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .S(R)); endmodule +//module \$_DFF_PP0_ (input D, C, R, output Q); LUTFF_R _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .R(R)); endmodule +//module \$_DFF_PP1_ (input D, C, R, output Q); LUTFF_S _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .S(R)); endmodule + +//module \$_DFFE_NP0P_ (input D, C, E, R, output Q); SB_DFFNER _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .R(R)); endmodule +//module \$_DFFE_NP1P_ (input D, C, E, R, output Q); SB_DFFNES _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .S(R)); endmodule +//module \$_DFFE_PP0P_ (input D, C, E, R, output Q); LUTFF_ER _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .R(R)); endmodule +//module \$_DFFE_PP1P_ (input D, C, E, R, output Q); LUTFF_ES _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .S(R)); endmodule + +//module \$_SDFF_NP0_ (input D, C, R, output Q); SB_DFFNSR _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .R(R)); endmodule +//module \$_SDFF_NP1_ (input D, C, R, output Q); SB_DFFNSS _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .S(R)); endmodule +module \$_SDFF_PP0_ (input D, C, R, output Q); LUTFF_SR _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .R(R)); endmodule +module \$_SDFF_PP1_ (input D, C, R, output Q); LUTFF_SS _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .S(R)); endmodule + +//module \$_SDFFCE_NP0P_ (input D, C, E, R, output Q); SB_DFFNESR _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .R(R)); endmodule +//module \$_SDFFCE_NP1P_ (input D, C, E, R, output Q); SB_DFFNESS _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .S(R)); endmodule +module \$_SDFFCE_PP0P_ (input D, C, E, R, output Q); LUTFF_ESR _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .R(R)); endmodule +module \$_SDFFCE_PP1P_ (input D, C, E, R, output Q); LUTFF_ESS _TECHMAP_REPLACE_ (.D(D), .O(Q), .CLK(C), .E(E), .S(R)); endmodule
\ No newline at end of file diff --git a/techlibs/fabulous/latches_map.v b/techlibs/fabulous/latches_map.v new file mode 100644 index 000000000..c28f88cf7 --- /dev/null +++ b/techlibs/fabulous/latches_map.v @@ -0,0 +1,11 @@ +module \$_DLATCH_N_ (E, D, Q); + wire [1023:0] _TECHMAP_DO_ = "simplemap; opt"; + input E, D; + output Q = !E ? D : Q; +endmodule + +module \$_DLATCH_P_ (E, D, Q); + wire [1023:0] _TECHMAP_DO_ = "simplemap; opt"; + input E, D; + output Q = E ? D : Q; +endmodule diff --git a/techlibs/fabulous/prims.v b/techlibs/fabulous/prims.v new file mode 100644 index 000000000..e9a525502 --- /dev/null +++ b/techlibs/fabulous/prims.v @@ -0,0 +1,335 @@ +// LUT and DFF are combined to a GENERIC_SLICE + +/*module LUT #( + parameter K = 4, + parameter [2**K-1:0] INIT = 0 +) ( + input [K-1:0] I, + output Q +); + wire [K-1:0] I_pd; + + genvar ii; + generate + for (ii = 0; ii < K; ii = ii + 1'b1) + assign I_pd[ii] = (I[ii] === 1'bz) ? 1'b0 : I[ii]; + endgenerate + + assign Q = INIT[I_pd]; +endmodule*/ + +module LUT1(output O, input I0); + parameter [1:0] INIT = 0; + assign O = I0 ? INIT[1] : INIT[0]; +endmodule + +module LUT2(output O, input I0, I1); + parameter [3:0] INIT = 0; + wire [ 1: 0] s1 = I1 ? INIT[ 3: 2] : INIT[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUT3(output O, input I0, I1, I2); + parameter [7:0] INIT = 0; + wire [ 3: 0] s2 = I2 ? INIT[ 7: 4] : INIT[ 3: 0]; + wire [ 1: 0] s1 = I1 ? s2[ 3: 2] : s2[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUT4(output O, input I0, I1, I2, I3); + parameter [15:0] INIT = 0; + wire [ 7: 0] s3 = I3 ? INIT[15: 8] : INIT[ 7: 0]; + wire [ 3: 0] s2 = I2 ? s3[ 7: 4] : s3[ 3: 0]; + wire [ 1: 0] s1 = I1 ? s2[ 3: 2] : s2[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUTFF(input CLK, D, output reg O); +initial O = 1'b0; +always @ (posedge CLK) begin + O <= D; +end +endmodule + +module FABULOUS_LC #( + parameter K = 4, + parameter [2**K-1:0] INIT = 0, + parameter DFF_ENABLE = 1'b0 +) ( + input CLK, + input [K-1:0] I, + output O, + output Q +); + wire f_wire; + + //LUT #(.K(K), .INIT(INIT)) lut_i(.I(I), .Q(f_wire)); + generate + if (K == 1) begin + LUT1 #(.INIT(INIT)) lut1 (.O(f_wire), .I0(A[0])); + end else + if (K == 2) begin + LUT2 #(.INIT(INIT)) lut2 (.O(f_wire), .I0(A[0]), .I1(A[1])); + end else + if (K == 3) begin + LUT3 #(.INIT(INIT)) lut3 (.O(f_wire), .I0(A[0]), .I1(A[1]), .I2(A[2])); + end else + if (K == 4) begin + LUT4 #(.INIT(INIT)) lut4 (.O(f_wire), .I0(A[0]), .I1(A[1]), .I2(A[2]), .I3(A[3])); + end + endgenerate + + LUTFF dff_i(.CLK(CLK), .D(f_wire), .Q(Q)); + + assign O = f_wire; +endmodule + +(* blackbox *) +module Global_Clock (output CLK); + //initial CLK = 0; + //always #10 CLK = ~CLK; +endmodule + +(* blackbox *) +module InPass4_frame_config (output O0, O1, O2, O3); + +endmodule + + +(* blackbox *) +module OutPass4_frame_config (input I0, I1, I2, I3); + +endmodule + +(* blackbox *) +module IO_1_bidirectional_frame_config_pass (input T, I, output Q, O); +endmodule + + +module MULADD (A7, A6, A5, A4, A3, A2, A1, A0, B7, B6, B5, B4, B3, B2, B1, B0, C19, C18, C17, C16, C15, C14, C13, C12, C11, C10, C9, C8, C7, C6, C5, C4, C3, C2, C1, C0, Q19, Q18, Q17, Q16, Q15, Q14, Q13, Q12, Q11, Q10, Q9, Q8, Q7, Q6, Q5, Q4, Q3, Q2, Q1, Q0, clr, CLK); + parameter ConfigBits = 6'b000000; + //parameter NoConfigBits = 6;// has to be adjusted manually (we don't use an arithmetic parser for the value) + // IMPORTANT: this has to be in a dedicated line + input A7;// operand A + input A6; + input A5; + input A4; + input A3; + input A2; + input A1; + input A0; + input B7;// operand B + input B6; + input B5; + input B4; + input B3; + input B2; + input B1; + input B0; + input C19;// operand C + input C18; + input C17; + input C16; + input C15; + input C14; + input C13; + input C12; + input C11; + input C10; + input C9; + input C8; + input C7; + input C6; + input C5; + input C4; + input C3; + input C2; + input C1; + input C0; + output Q19;// result + output Q18; + output Q17; + output Q16; + output Q15; + output Q14; + output Q13; + output Q12; + output Q11; + output Q10; + output Q9; + output Q8; + output Q7; + output Q6; + output Q5; + output Q4; + output Q3; + output Q2; + output Q1; + output Q0; + + input clr; + input CLK; // EXTERNAL // SHARED_PORT // ## the EXTERNAL keyword will send this sisgnal all the way to top and the //SHARED Allows multiple BELs using the same port (e.g. for exporting a clock to the top) + // GLOBAL all primitive pins that are connected to the switch matrix have to go before the GLOBAL label + + + wire [7:0] A; // port A read data + wire [7:0] B; // port B read data + wire [19:0] C; // port B read data + reg [7:0] A_reg; // port A read data register + reg [7:0] B_reg; // port B read data register + reg [19:0] C_reg; // port B read data register + wire [7:0] OPA; // port A + wire [7:0] OPB; // port B + wire [19:0] OPC; // port B + reg [19:0] ACC ; // accumulator register + wire [19:0] sum;// port B read data register + wire [19:0] sum_in;// port B read data register + wire [15:0] product; + wire [19:0] product_extended; + + assign A = {A7,A6,A5,A4,A3,A2,A1,A0}; + assign B = {B7,B6,B5,B4,B3,B2,B1,B0}; + assign C = {C19,C18,C17,C16,C15,C14,C13,C12,C11,C10,C9,C8,C7,C6,C5,C4,C3,C2,C1,C0}; + + assign OPA = ConfigBits[0] ? A_reg : A; + assign OPB = ConfigBits[1] ? B_reg : B; + assign OPC = ConfigBits[2] ? C_reg : C; + + assign sum_in = ConfigBits[3] ? ACC : OPC;// we can + + assign product = OPA * OPB; + +// The sign extension was not tested + assign product_extended = ConfigBits[4] ? {product[15],product[15],product[15],product[15],product} : {4'b0000,product}; + + assign sum = product_extended + sum_in; + + assign Q19 = ConfigBits[5] ? ACC[19] : sum[19]; + assign Q18 = ConfigBits[5] ? ACC[18] : sum[18]; + assign Q17 = ConfigBits[5] ? ACC[17] : sum[17]; + assign Q16 = ConfigBits[5] ? ACC[16] : sum[16]; + assign Q15 = ConfigBits[5] ? ACC[15] : sum[15]; + assign Q14 = ConfigBits[5] ? ACC[14] : sum[14]; + assign Q13 = ConfigBits[5] ? ACC[13] : sum[13]; + assign Q12 = ConfigBits[5] ? ACC[12] : sum[12]; + assign Q11 = ConfigBits[5] ? ACC[11] : sum[11]; + assign Q10 = ConfigBits[5] ? ACC[10] : sum[10]; + assign Q9 = ConfigBits[5] ? ACC[9] : sum[9]; + assign Q8 = ConfigBits[5] ? ACC[8] : sum[8]; + assign Q7 = ConfigBits[5] ? ACC[7] : sum[7]; + assign Q6 = ConfigBits[5] ? ACC[6] : sum[6]; + assign Q5 = ConfigBits[5] ? ACC[5] : sum[5]; + assign Q4 = ConfigBits[5] ? ACC[4] : sum[4]; + assign Q3 = ConfigBits[5] ? ACC[3] : sum[3]; + assign Q2 = ConfigBits[5] ? ACC[2] : sum[2]; + assign Q1 = ConfigBits[5] ? ACC[1] : sum[1]; + assign Q0 = ConfigBits[5] ? ACC[0] : sum[0]; + + always @ (posedge CLK) + begin + A_reg <= A; + B_reg <= B; + C_reg <= C; + if (clr == 1'b1) begin + ACC <= 20'b00000000000000000000; + end else begin + ACC <= sum; + end + end + +endmodule + +module RegFile_32x4 (D0, D1, D2, D3, W_ADR0, W_ADR1, W_ADR2, W_ADR3, W_ADR4, W_en, AD0, AD1, AD2, AD3, A_ADR0, A_ADR1, A_ADR2, A_ADR3, A_ADR4, BD0, BD1, BD2, BD3, B_ADR0, B_ADR1, B_ADR2, B_ADR3, B_ADR4, CLK); + //parameter NoConfigBits = 2;// has to be adjusted manually (we don't use an arithmetic parser for the value) + parameter ConfigBits = 2'b00; + // IMPORTANT: this has to be in a dedicated line + input D0; // Register File write port + input D1; + input D2; + input D3; + input W_ADR0; + input W_ADR1; + input W_ADR2; + input W_ADR3; + input W_ADR4; + input W_en; + + output AD0;// Register File read port A + output AD1; + output AD2; + output AD3; + input A_ADR0; + input A_ADR1; + input A_ADR2; + input A_ADR3; + input A_ADR4; + + output BD0;//Register File read port B + output BD1; + output BD2; + output BD3; + input B_ADR0; + input B_ADR1; + input B_ADR2; + input B_ADR3; + input B_ADR4; + + input CLK;// EXTERNAL // SHARED_PORT // ## the EXTERNAL keyword will send this sisgnal all the way to top and the //SHARED Allows multiple BELs using the same port (e.g. for exporting a clock to the top) + + // GLOBAL all primitive pins that are connected to the switch matrix have to go before the GLOBAL label + + + //type memtype is array (31 downto 0) of std_logic_vector(3 downto 0); // 32 entries of 4 bit + //signal mem : memtype := (others => (others => '0')); + reg [3:0] mem [31:0]; + + wire [4:0] W_ADR;// write address + wire [4:0] A_ADR;// port A read address + wire [4:0] B_ADR;// port B read address + + wire [3:0] D; // write data + wire [3:0] AD; // port A read data + wire [3:0] BD; // port B read data + + reg [3:0] AD_reg; // port A read data register + reg [3:0] BD_reg; // port B read data register + + integer i; + + assign W_ADR = {W_ADR4,W_ADR3,W_ADR2,W_ADR1,W_ADR0}; + assign A_ADR = {A_ADR4,A_ADR3,A_ADR2,A_ADR1,A_ADR0}; + assign B_ADR = {B_ADR4,B_ADR3,B_ADR2,B_ADR1,B_ADR0}; + + assign D = {D3,D2,D1,D0}; + + initial begin + for (i=0; i<32; i=i+1) begin + mem[i] = 4'b0000; + end + end + + always @ (posedge CLK) begin : P_write + if (W_en == 1'b1) begin + mem[W_ADR] <= D ; + end + end + + assign AD = mem[A_ADR]; + assign BD = mem[B_ADR]; + + always @ (posedge UserCLK) begin + AD_reg <= AD; + BD_reg <= BD; + end + + assign AD0 = ConfigBits[0] ? AD_reg[0] : AD[0]; + assign AD1 = ConfigBits[0] ? AD_reg[1] : AD[1]; + assign AD2 = ConfigBits[0] ? AD_reg[2] : AD[2]; + assign AD3 = ConfigBits[0] ? AD_reg[3] : AD[3]; + + assign BD0 = ConfigBits[1] ? BD_reg[0] : BD[0]; + assign BD1 = ConfigBits[1] ? BD_reg[1] : BD[1]; + assign BD2 = ConfigBits[1] ? BD_reg[2] : BD[2]; + assign BD3 = ConfigBits[1] ? BD_reg[3] : BD[3]; + +endmodule
\ No newline at end of file diff --git a/techlibs/fabulous/prims_ff.v b/techlibs/fabulous/prims_ff.v new file mode 100644 index 000000000..01eddb150 --- /dev/null +++ b/techlibs/fabulous/prims_ff.v @@ -0,0 +1,575 @@ +// LUT and DFF are combined to a GENERIC_SLICE + +/*module LUT #( + parameter K = 4, + parameter [2**K-1:0] INIT = 0 +) ( + input [K-1:0] I, + output Q +); + wire [K-1:0] I_pd; + + genvar ii; + generate + for (ii = 0; ii < K; ii = ii + 1'b1) + assign I_pd[ii] = (I[ii] === 1'bz) ? 1'b0 : I[ii]; + endgenerate + + assign Q = INIT[I_pd]; +endmodule*/ + +module LUT1(output O, input I0); + parameter [1:0] INIT = 0; + assign O = I0 ? INIT[1] : INIT[0]; +endmodule + +module LUT2(output O, input I0, I1); + parameter [3:0] INIT = 0; + wire [ 1: 0] s1 = I1 ? INIT[ 3: 2] : INIT[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUT3(output O, input I0, I1, I2); + parameter [7:0] INIT = 0; + wire [ 3: 0] s2 = I2 ? INIT[ 7: 4] : INIT[ 3: 0]; + wire [ 1: 0] s1 = I1 ? s2[ 3: 2] : s2[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUT4(output O, input I0, I1, I2, I3); + parameter [15:0] INIT = 0; + wire [ 7: 0] s3 = I3 ? INIT[15: 8] : INIT[ 7: 0]; + wire [ 3: 0] s2 = I2 ? s3[ 7: 4] : s3[ 3: 0]; + wire [ 1: 0] s1 = I1 ? s2[ 3: 2] : s2[ 1: 0]; + assign O = I0 ? s1[1] : s1[0]; +endmodule + +module LUTFF(input CLK, D, output reg O); +initial O = 1'b0; +always @ (posedge CLK) begin + O <= D; +end +endmodule + +module FABULOUS_LC #( + parameter K = 4, + parameter [2**K-1:0] INIT = 0, + parameter DFF_ENABLE = 1'b0, + parameter IOmux = 1'b0, + parameter SET_NORESET = 1'b0 +) ( + input CLK, + input I0, + input I1, + input I2, + input I3, + input SR, + input EN, + output O, + output Q, + input Ci, + output Co +); + wire f_wire; + wire I0_mux; + + assign I0_mux = IOmux ? Ci : I0; + + //LUT #(.K(K), .INIT(INIT)) lut_i(.I(I), .Q(f_wire)); + generate + if (K == 1) begin + LUT1 #(.INIT(INIT)) lut1 (.O(f_wire), .I0(I0_mux)); + end else + if (K == 2) begin + LUT2 #(.INIT(INIT)) lut2 (.O(f_wire), .I0(I0_mux), .I1(I1)); + end else + if (K == 3) begin + LUT3 #(.INIT(INIT)) lut3 (.O(f_wire), .I0(I0_mux), .I1(I2), .I2(I2)); + end else + if (K == 4) begin + LUT4 #(.INIT(INIT)) lut4 (.O(f_wire), .I0(I0_mux), .I1(I1), .I2(I2), .I3(I3)); + end + endgenerate + + + assign Co = (Ci & A[1]) | (Ci & A[2]) | (A[1] & A[2]); + + if (SET_NORESET) begin + LUTFF_ESS dffs_i(.CLK(CLK), .E(EN), .S(SR), .D(f_wire), .O(Q)); + end else begin + LUTFF_ESR dffr_i(.CLK(CLK), .E(EN), .R(SR), .D(f_wire), .O(Q)); + end + + assign O = f_wire; +endmodule + +(* blackbox *) +module Global_Clock (output CLK); + //initial CLK = 0; + //always #10 CLK = ~CLK; +endmodule + +(* blackbox *) +module InPass4_frame_config (output O0, O1, O2, O3); + +endmodule + + +(* blackbox *) +module OutPass4_frame_config (input I0, I1, I2, I3); + +endmodule + +(* blackbox *) +module IO_1_bidirectional_frame_config_pass (input T, I, output Q, O); +endmodule + + +module MULADD (A7, A6, A5, A4, A3, A2, A1, A0, B7, B6, B5, B4, B3, B2, B1, B0, C19, C18, C17, C16, C15, C14, C13, C12, C11, C10, C9, C8, C7, C6, C5, C4, C3, C2, C1, C0, Q19, Q18, Q17, Q16, Q15, Q14, Q13, Q12, Q11, Q10, Q9, Q8, Q7, Q6, Q5, Q4, Q3, Q2, Q1, Q0, clr, CLK); + parameter ConfigBits = 6'b000000; + //parameter NoConfigBits = 6;// has to be adjusted manually (we don't use an arithmetic parser for the value) + // IMPORTANT: this has to be in a dedicated line + input A7;// operand A + input A6; + input A5; + input A4; + input A3; + input A2; + input A1; + input A0; + input B7;// operand B + input B6; + input B5; + input B4; + input B3; + input B2; + input B1; + input B0; + input C19;// operand C + input C18; + input C17; + input C16; + input C15; + input C14; + input C13; + input C12; + input C11; + input C10; + input C9; + input C8; + input C7; + input C6; + input C5; + input C4; + input C3; + input C2; + input C1; + input C0; + output Q19;// result + output Q18; + output Q17; + output Q16; + output Q15; + output Q14; + output Q13; + output Q12; + output Q11; + output Q10; + output Q9; + output Q8; + output Q7; + output Q6; + output Q5; + output Q4; + output Q3; + output Q2; + output Q1; + output Q0; + + input clr; + input CLK; // EXTERNAL // SHARED_PORT // ## the EXTERNAL keyword will send this sisgnal all the way to top and the //SHARED Allows multiple BELs using the same port (e.g. for exporting a clock to the top) + // GLOBAL all primitive pins that are connected to the switch matrix have to go before the GLOBAL label + + + wire [7:0] A; // port A read data + wire [7:0] B; // port B read data + wire [19:0] C; // port B read data + reg [7:0] A_reg; // port A read data register + reg [7:0] B_reg; // port B read data register + reg [19:0] C_reg; // port B read data register + wire [7:0] OPA; // port A + wire [7:0] OPB; // port B + wire [19:0] OPC; // port B + reg [19:0] ACC ; // accumulator register + wire [19:0] sum;// port B read data register + wire [19:0] sum_in;// port B read data register + wire [15:0] product; + wire [19:0] product_extended; + + assign A = {A7,A6,A5,A4,A3,A2,A1,A0}; + assign B = {B7,B6,B5,B4,B3,B2,B1,B0}; + assign C = {C19,C18,C17,C16,C15,C14,C13,C12,C11,C10,C9,C8,C7,C6,C5,C4,C3,C2,C1,C0}; + + assign OPA = ConfigBits[0] ? A_reg : A; + assign OPB = ConfigBits[1] ? B_reg : B; + assign OPC = ConfigBits[2] ? C_reg : C; + + assign sum_in = ConfigBits[3] ? ACC : OPC;// we can + + assign product = OPA * OPB; + +// The sign extension was not tested + assign product_extended = ConfigBits[4] ? {product[15],product[15],product[15],product[15],product} : {4'b0000,product}; + + assign sum = product_extended + sum_in; + + assign Q19 = ConfigBits[5] ? ACC[19] : sum[19]; + assign Q18 = ConfigBits[5] ? ACC[18] : sum[18]; + assign Q17 = ConfigBits[5] ? ACC[17] : sum[17]; + assign Q16 = ConfigBits[5] ? ACC[16] : sum[16]; + assign Q15 = ConfigBits[5] ? ACC[15] : sum[15]; + assign Q14 = ConfigBits[5] ? ACC[14] : sum[14]; + assign Q13 = ConfigBits[5] ? ACC[13] : sum[13]; + assign Q12 = ConfigBits[5] ? ACC[12] : sum[12]; + assign Q11 = ConfigBits[5] ? ACC[11] : sum[11]; + assign Q10 = ConfigBits[5] ? ACC[10] : sum[10]; + assign Q9 = ConfigBits[5] ? ACC[9] : sum[9]; + assign Q8 = ConfigBits[5] ? ACC[8] : sum[8]; + assign Q7 = ConfigBits[5] ? ACC[7] : sum[7]; + assign Q6 = ConfigBits[5] ? ACC[6] : sum[6]; + assign Q5 = ConfigBits[5] ? ACC[5] : sum[5]; + assign Q4 = ConfigBits[5] ? ACC[4] : sum[4]; + assign Q3 = ConfigBits[5] ? ACC[3] : sum[3]; + assign Q2 = ConfigBits[5] ? ACC[2] : sum[2]; + assign Q1 = ConfigBits[5] ? ACC[1] : sum[1]; + assign Q0 = ConfigBits[5] ? ACC[0] : sum[0]; + + always @ (posedge CLK) + begin + A_reg <= A; + B_reg <= B; + C_reg <= C; + if (clr == 1'b1) begin + ACC <= 20'b00000000000000000000; + end else begin + ACC <= sum; + end + end + +endmodule + +module RegFile_32x4 (D0, D1, D2, D3, W_ADR0, W_ADR1, W_ADR2, W_ADR3, W_ADR4, W_en, AD0, AD1, AD2, AD3, A_ADR0, A_ADR1, A_ADR2, A_ADR3, A_ADR4, BD0, BD1, BD2, BD3, B_ADR0, B_ADR1, B_ADR2, B_ADR3, B_ADR4, CLK); + //parameter NoConfigBits = 2;// has to be adjusted manually (we don't use an arithmetic parser for the value) + parameter ConfigBits = 2'b00; + // IMPORTANT: this has to be in a dedicated line + input D0; // Register File write port + input D1; + input D2; + input D3; + input W_ADR0; + input W_ADR1; + input W_ADR2; + input W_ADR3; + input W_ADR4; + input W_en; + + output AD0;// Register File read port A + output AD1; + output AD2; + output AD3; + input A_ADR0; + input A_ADR1; + input A_ADR2; + input A_ADR3; + input A_ADR4; + + output BD0;//Register File read port B + output BD1; + output BD2; + output BD3; + input B_ADR0; + input B_ADR1; + input B_ADR2; + input B_ADR3; + input B_ADR4; + + input CLK;// EXTERNAL // SHARED_PORT // ## the EXTERNAL keyword will send this sisgnal all the way to top and the //SHARED Allows multiple BELs using the same port (e.g. for exporting a clock to the top) + + // GLOBAL all primitive pins that are connected to the switch matrix have to go before the GLOBAL label + + + //type memtype is array (31 downto 0) of std_logic_vector(3 downto 0); // 32 entries of 4 bit + //signal mem : memtype := (others => (others => '0')); + reg [3:0] mem [31:0]; + + wire [4:0] W_ADR;// write address + wire [4:0] A_ADR;// port A read address + wire [4:0] B_ADR;// port B read address + + wire [3:0] D; // write data + wire [3:0] AD; // port A read data + wire [3:0] BD; // port B read data + + reg [3:0] AD_reg; // port A read data register + reg [3:0] BD_reg; // port B read data register + + integer i; + + assign W_ADR = {W_ADR4,W_ADR3,W_ADR2,W_ADR1,W_ADR0}; + assign A_ADR = {A_ADR4,A_ADR3,A_ADR2,A_ADR1,A_ADR0}; + assign B_ADR = {B_ADR4,B_ADR3,B_ADR2,B_ADR1,B_ADR0}; + + assign D = {D3,D2,D1,D0}; + + initial begin + for (i=0; i<32; i=i+1) begin + mem[i] = 4'b0000; + end + end + + always @ (posedge CLK) begin : P_write + if (W_en == 1'b1) begin + mem[W_ADR] <= D ; + end + end + + assign AD = mem[A_ADR]; + assign BD = mem[B_ADR]; + + always @ (posedge UserCLK) begin + AD_reg <= AD; + BD_reg <= BD; + end + + assign AD0 = ConfigBits[0] ? AD_reg[0] : AD[0]; + assign AD1 = ConfigBits[0] ? AD_reg[1] : AD[1]; + assign AD2 = ConfigBits[0] ? AD_reg[2] : AD[2]; + assign AD3 = ConfigBits[0] ? AD_reg[3] : AD[3]; + + assign BD0 = ConfigBits[1] ? BD_reg[0] : BD[0]; + assign BD1 = ConfigBits[1] ? BD_reg[1] : BD[1]; + assign BD2 = ConfigBits[1] ? BD_reg[2] : BD[2]; + assign BD3 = ConfigBits[1] ? BD_reg[3] : BD[3]; + +endmodule + +module LUTFF_E ( + output reg O, + input CLK, E, D +); + initial O = 1'b0; + always @(posedge CLK) + if (E) + O <= D; +endmodule + +module LUTFF_SR ( + output reg O, + input CLK, R, D +); + initial O = 1'b0; + always @(posedge CLK) + if (R) + O <= 0; + else + O <= D; +endmodule + +module LUTFF_SS ( + output reg O, + input CLK, S, D +); + initial O = 1'b0; + always @(posedge CLK) + if (S) + O <= 1; + else + O <= D; +endmodule + +module LUTFF_ESR ( + output reg O, + input CLK, E, R, D +); + initial O = 1'b0; + always @(posedge CLK) + if (E) begin + if (R) + O <= 0; + else + O <= D; + end +endmodule + +module LUTFF_ESS ( + output reg O, + input CLK, E, S, D +); + initial O = 1'b0; + always @(posedge CLK) + if (E) begin + if (S) + O <= 1; + else + O <= D; + end +endmodule + +/* module LUTFF_R ( + output Q, + input C, R, D +); + always @(posedge CLK, posedge R) + if (R) + Q <= 0; + else + Q <= D; +endmodule */ + + + +/* module LUTFF_S ( + output Q, + input C, S, D +); + always @(posedge CLK, posedge S) + if (S) + Q <= 1; + else + Q <= D; +endmodule */ + + + +/* module LUTFF_ER ( + output Q, + input C, E, R, D +); + always @(posedge CLK, posedge R) + if (R) + Q <= 0; + else if (E) + Q <= D; +endmodule */ + + + +/* module LUTFF_ES ( + output Q, + input C, E, S, D +); + always @(posedge CLK, posedge S) + if (S) + Q <= 1; + else if (E) + Q <= D; +endmodule */ + +/* module LUTFFN ( + output Q, + input C, D +); + always @(negedge C) + Q <= D; +endmodule + +module LUTFFNE ( + output Q, + input C, E, D +); + always @(negedge C) + if (E) + Q <= D; +endmodule + +module LUTFFNSR ( + output Q, + input C, R, D +); + always @(negedge C) + if (R) + Q <= 0; + else + Q <= D; +endmodule + +module LUTFFNR ( + output Q, + input C, R, D +); + always @(negedge C, posedge R) + if (R) + Q <= 0; + else + Q <= D; +endmodule + +module LUTFFNSS ( + output Q, + input C, S, D +); + always @(negedge C) + if (S) + Q <= 1; + else + Q <= D; +endmodule + +module LUTFFNS ( + output Q, + input C, S, D +); + always @(negedge C, posedge S) + if (S) + Q <= 1; + else + Q <= D; +endmodule + +module LUTFFNESR ( + output Q, + input C, E, R, D +); + always @(negedge C) + if (E) begin + if (R) + Q <= 0; + else + Q <= D; + end +endmodule + +module LUTFFNER ( + output Q, + input C, E, R, D +); + always @(negedge C, posedge R) + if (R) + Q <= 0; + else if (E) + Q <= D; +endmodule + +module LUTFFNESS ( + output Q, + input C, E, S, D +); + always @(negedge C) + if (E) begin + if (S) + Q <= 1; + else + Q <= D; + end +endmodule + +module LUTFFNES ( + output Q, + input C, E, S, D +); + always @(negedge C, posedge S) + if (S) + Q <= 1; + else if (E) + Q <= D; +endmodule */
\ No newline at end of file diff --git a/techlibs/fabulous/synth_fabulous.cc b/techlibs/fabulous/synth_fabulous.cc new file mode 100644 index 000000000..da1245527 --- /dev/null +++ b/techlibs/fabulous/synth_fabulous.cc @@ -0,0 +1,242 @@ +/* + * yosys -- Yosys Open SYnthesis Suite + * + * Copyright (C) 2012 Claire Xenia Wolf <claire@yosyshq.com> + * + * Permission to use, copy, modify, and/or distribute this software for any + * purpose with or without fee is hereby granted, provided that the above + * copyright notice and this permission notice appear in all copies. + * + * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES + * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF + * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR + * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES + * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN + * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF + * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. + * + */ + +#include "kernel/register.h" +#include "kernel/celltypes.h" +#include "kernel/rtlil.h" +#include "kernel/log.h" + +USING_YOSYS_NAMESPACE +PRIVATE_NAMESPACE_BEGIN + +struct SynthPass : public ScriptPass +{ + SynthPass() : ScriptPass("synth_fabulous", "FABulous synthesis script") { } + + void help() override + { + // |---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---|---v---| + log("\n"); + log(" synth_fabulous [options]\n"); + log("\n"); + log("This command runs synthesis for FPGA fabrics generated with FABulous. This command does not operate\n"); + log("on partly selected designs.\n"); + log("\n"); + log(" -top <module>\n"); + log(" use the specified module as top module (default='top')\n"); + log("\n"); + log(" -auto-top\n"); + log(" automatically determine the top of the design hierarchy\n"); + log("\n"); + log(" -flatten\n"); + log(" flatten the design before synthesis. this will pass '-auto-top' to\n"); + log(" 'hierarchy' if no top module is specified.\n"); + log("\n"); + log(" -encfile <file>\n"); + log(" passed to 'fsm_recode' via 'fsm'\n"); + log("\n"); + log(" -lut <k>\n"); + log(" perform synthesis for a k-LUT architecture (default 4).\n"); + log("\n"); + log(" -nofsm\n"); + log(" do not run FSM optimization\n"); + log("\n"); + log(" -noabc\n"); + log(" do not run abc (as if yosys was compiled without ABC support)\n"); + log("\n"); + log(" -noalumacc\n"); + log(" do not run 'alumacc' pass. i.e. keep arithmetic operators in\n"); + log(" their direct form ($add, $sub, etc.).\n"); + log("\n"); + log(" -nordff\n"); + log(" passed to 'memory'. prohibits merging of FFs into memory read ports\n"); + log("\n"); + log(" -noshare\n"); + log(" do not run SAT-based resource sharing\n"); + log("\n"); + log(" -run <from_label>[:<to_label>]\n"); + log(" only run the commands between the labels (see below). an empty\n"); + log(" from label is synonymous to 'begin', and empty to label is\n"); + log(" synonymous to the end of the command list.\n"); + log("\n"); + log(" -abc9\n"); + log(" use new ABC9 flow (EXPERIMENTAL)\n"); + log("\n"); + log(" -flowmap\n"); + log(" use FlowMap LUT techmapping instead of ABC\n"); + log("\n"); + log(" -no-rw-check\n"); + log(" marks all recognized read ports as \"return don't-care value on\n"); + log(" read/write collision\" (same result as setting the no_rw_check\n"); + log(" attribute on all memories).\n"); + log("\n"); + log("\n"); + log("The following commands are executed by this synthesis command:\n"); + help_script(); + log("\n"); + } + + string top_module, fsm_opts, memory_opts, abc; + bool autotop, flatten, noalumacc, nofsm, noabc, noshare, flowmap, forvpr; + int lut; + + void clear_flags() override + { + top_module.clear(); + fsm_opts.clear(); + memory_opts.clear(); + + autotop = false; + flatten = false; + lut = 4; + noalumacc = false; + nofsm = false; + noabc = false; + noshare = false; + flowmap = false; + forvpr = false; + abc = "abc"; + } + + void execute(std::vector<std::string> args, RTLIL::Design *design) override + { + string run_from, run_to; + clear_flags(); + + size_t argidx; + for (argidx = 1; argidx < args.size(); argidx++) + { + if (args[argidx] == "-top" && argidx+1 < args.size()) { + top_module = args[++argidx]; + continue; + } + if (args[argidx] == "-encfile" && argidx+1 < args.size()) { + fsm_opts = " -encfile " + args[++argidx]; + continue; + } + if (args[argidx] == "-run" && argidx+1 < args.size()) { + size_t pos = args[argidx+1].find(':'); + if (pos == std::string::npos) { + run_from = args[++argidx]; + run_to = args[argidx]; + } else { + run_from = args[++argidx].substr(0, pos); + run_to = args[argidx].substr(pos+1); + } + continue; + } + if (args[argidx] == "-vpr") { + forvpr = true; + continue; + } + if (args[argidx] == "-auto-top") { + autotop = true; + continue; + } + if (args[argidx] == "-flatten") { + flatten = true; + continue; + } + if (args[argidx] == "-lut") { + lut = atoi(args[++argidx].c_str()); + continue; + } + if (args[argidx] == "-nofsm") { + nofsm = true; + continue; + } + if (args[argidx] == "-noabc") { + noabc = true; + continue; + } + if (args[argidx] == "-noalumacc") { + noalumacc = true; + continue; + } + if (args[argidx] == "-nordff") { + memory_opts += " -nordff"; + continue; + } + if (args[argidx] == "-noshare") { + noshare = true; + continue; + } + if (args[argidx] == "-abc9") { + abc = "abc9"; + continue; + } + if (args[argidx] == "-flowmap") { + flowmap = true; + continue; + } + if (args[argidx] == "-no-rw-check") { + memory_opts += " -no-rw-check"; + continue; + } + break; + } + extra_args(args, argidx, design); + + if (!design->full_selection()) + log_cmd_error("This command only operates on fully selected designs!\n"); + + if (abc == "abc9" && !lut) + log_cmd_error("ABC9 flow only supported for FPGA synthesis (using '-lut' option)\n"); + if (flowmap && !lut) + log_cmd_error("FlowMap is only supported for FPGA synthesis (using '-lut' option)\n"); + + log_header(design, "Executing SYNTH pass.\n"); + log_push(); + + run_script(design, run_from, run_to); + + log_pop(); + } + + void script() override + { + if (top_module.empty()) { + if (flatten || autotop) + run("hierarchy -check -auto-top"); + else + run("hierarchy -check"); + } else + run(stringf("hierarchy -check -top %s", top_module.c_str())); + + run("proc"); + run("tribuf -logic"); + run("deminout"); + run("synth -run coarse"); + run("memory_map"); + run("opt -full"); + run("techmap -map +/techmap.v"); + run("opt -fast"); + run("dfflegalize -cell $_DFF_P_ 0 -cell $_DLATCH_?_ x"); + run("techmap -map +/fabulous/latches_map.v"); + run("abc -lut $LUT_K -dress"); + run("clean"); + if (forvpr) + run("yosys techmap -D LUT_K=$LUT_K -map +/fabulous/cells_map.v"); + run("clean"); + run("hierarchy -check"); + run("stat"); + } +} SynthPass; + +PRIVATE_NAMESPACE_END |