Add parameter to disable input buffer fall through

rfiorani · rfiorani · commit 8e2eff774d9d · 2025-11-12T14:44:37.000+01:00
diff --git a/README.md b/README.md
@@ -5,47 +5,48 @@ The implementation is taylored to cv32e40p (formerly known as RI5CY). This means
 The coprocessors main module is named `fpu_ss` and can be found in [fpu_ss.sv](src/fpu_ss.sv "fpu_ss.sv"). Below, the instantiation template is given and the parameters are described.
 ### Integration Template
 	fpu_ss #(
-	    .PULP_ZFINX           ( 0 ),
-	    .INPUT_BUFFER_DEPTH   ( 0 ),
-	    .OUT_OF_ORDER         ( 1 ),
-	    .FORWARDING           ( 1 ),
-	    .FPU_FEATURES         (   ),
-	    .FPU_IMPLEMENTATION   (   )
+	    .PULP_ZFINX          		 ( 0 ),
+	    .INPUT_BUFFER_DEPTH  		 ( 0 ),
+	    .INPUT_BUFFER_FALL_THROUGH   ( 1 ),
+	    .OUT_OF_ORDER        		 ( 1 ),
+	    .FORWARDING          		 ( 1 ),
+	    .FPU_FEATURES         		 (   ),
+	    .FPU_IMPLEMENTATION          (   )
 	) fpu_ss_i (
 	    // clock and reset
-	    .clk_i                (),
-	    .rst_ni               (),
+	    .clk_i               		 (),
+	    .rst_ni               	     (),
 
 	    // Compressed Interface
-	    .x_compressed_valid_i (),
-	    .x_compressed_ready_o (),
-	    .x_compressed_req_i   (),
-	    .x_compressed_resp_o  (),
+	    .x_compressed_valid_i 		 (),
+	    .x_compressed_ready_o 		 (),
+	    .x_compressed_req_i   		 (),
+	    .x_compressed_resp_o  		 (),
 
 	    // Issue Interface
-	    .x_issue_valid_i      (),
-	    .x_issue_ready_o      (),
-	    .x_issue_req_i        (),
-	    .x_issue_resp_o       (),
+	    .x_issue_valid_i      		 (),
+	    .x_issue_ready_o      		 (),
+	    .x_issue_req_i        		 (),
+	    .x_issue_resp_o       		 (),
 
 	    // Commit Interface
-	    .x_commit_valid_i     (),
-	    .x_commit_i           (),
+	    .x_commit_valid_i     		 (),
+	    .x_commit_i           		 (),
 
 	    // Memory Request/Response Interface
-	    .x_mem_valid_o        (),
-	    .x_mem_ready_i        (),
-	    .x_mem_req_o          (),
-	    .x_mem_resp_i         (),
+	    .x_mem_valid_o        		 (),
+	    .x_mem_ready_i        		 (),
+	    .x_mem_req_o          		 (),
+	    .x_mem_resp_i         		 (),
 
 	    // Memory Result Interface
-	    .x_mem_result_valid_i (),
-	    .x_mem_result_i       (),
+	    .x_mem_result_valid_i 		 (),
+	    .x_mem_result_i       		 (),
 
 	    // Result Interface
-	    .x_result_valid_o     (),
-	    .x_result_ready_i     (),
-	    .x_result_o           ()
+	    .x_result_valid_o     		 (),
+	    .x_result_ready_i     		 (),
+	    .x_result_o           		 ()
 	);
 
 ### Dependencies
@@ -58,14 +59,15 @@ to load the FPnew or use
 to clone the repository with the Fpnew.
 ### Parameters
 
-| Parameter Name       | Values                                                                                          | Description                                  | Default |
-| -------------------- | ----------------------------------------------------------------------------------------------- | -------------------------------------------- | ------- |
-| `PULP_ZFINX`         | {0,1}                                                                                           | Use F or zfinx extension                     | 0       |
-| `INPUT_BUFFER_DEPTH` | {0, ... , 2^32-1}                                                                               | Input buffer depth                           | 0       |
-| `OUT_OF_ORDER`       | {0, 1}                                                                                          | Enabling out-of-order execution              | 1       |
-| `FORWARDING`         | {0, 1}                                                                                          | Enabling forwarding inside the fpu subsystem | 1       |
-| `FPU_FEATURES`       | see [FPnew](https://github.com/pulp-platform/fpnew/tree/develop/docs/README.md#parameters) docs | -                                            | -       |
-| `FPU_IMPLEMENTATION` | see [FPnew](https://github.com/pulp-platform/fpnew/tree/develop/docs/README.md#parameters) docs | -                                            | -       |
+| Parameter Name              | Values                                                                                          | Description                                  | Default |
+| --------------------------- | ----------------------------------------------------------------------------------------------- | -------------------------------------------- | ------- |
+| `PULP_ZFINX`                | {0,1}                                                                                           | Use F or zfinx extension                     | 0       |
+| `INPUT_BUFFER_DEPTH`        | {0, ... , 2^32-1}                                                                               | Input buffer depth                           | 0       |
+| `INPUT_BUFFER_FALL_THROUGH` | {0,1}                                                                                           | Input buffer fall through enable             | 1       |
+| `OUT_OF_ORDER`              | {0, 1}                                                                                          | Enabling out-of-order execution              | 1       |
+| `FORWARDING`                | {0, 1}                                                                                          | Enabling forwarding inside the fpu subsystem | 1       |
+| `FPU_FEATURES`              | see [FPnew](https://github.com/pulp-platform/fpnew/tree/develop/docs/README.md#parameters) docs | -                                            | -       |
+| `FPU_IMPLEMENTATION`        | see [FPnew](https://github.com/pulp-platform/fpnew/tree/develop/docs/README.md#parameters) docs | -                                            | -       |
 
 
 #### Extended parameter descriptions
diff --git a/src/fpu_ss.sv b/src/fpu_ss.sv
@@ -10,53 +10,57 @@
 //
 // Description: Top level Module of the FPU subsystem
 //
-// Parameters:  PULP_ZFINX:         Enable support for "Zfinx" standard extension (and thereby removing support for
-//                                  "F" standard extension)
+// Parameters:  PULP_ZFINX:               Enable support for "Zfinx" standard extension (and thereby removing support for
+//                                        "F" standard extension)
 //
-//              INPUT_BUFFER_DEPTH: Set depth of the FIFO input buffer. If parameter is set to 0, no buffer will be
-//                                  instantiated
+//              INPUT_BUFFER_DEPTH:       Set depth of the FIFO input buffer. If parameter is set to 0, no buffer will be
+//                                        instantiated
 //
-//              OUT_OF_ORDER:       Enable out-of-order execution for instructions that go through
-//                                  the FPnew.
-//                                  For example with OUT_OF_ORDER = 1
-//                                      fdiv.s fa1, fa2, fa3 // suppose takes 3 cycles
-//                                      fmul.s fa4, fa5, fa6 // suppose takes 1 cycles
-//                                      fmul.s fa2, fa5, fa6 // suppose takes 1 cycles
-//                                      fmul.s fa3, fa5, fa6 // suppose takes 1 cycles
-//                                  --> This sequence takes 4 clock cycles
-//                                  With OUT_OF_ORDER this instruction sequence would take 5 clock cycles
-//                                  Possible values for this parameter are 0 and 1
+//              OUT_OF_ORDER:             Enable out-of-order execution for instructions that go through
+//                                        the FPnew.
+//                                        For example with OUT_OF_ORDER = 1
+//                                            fdiv.s fa1, fa2, fa3 // suppose takes 3 cycles
+//                                            fmul.s fa4, fa5, fa6 // suppose takes 1 cycles
+//                                            fmul.s fa2, fa5, fa6 // suppose takes 1 cycles
+//                                            fmul.s fa3, fa5, fa6 // suppose takes 1 cycles
+//                                        --> This sequence takes 4 clock cycles
+//                                        With OUT_OF_ORDER = 0 this instruction sequence would take 5 clock cycles
+//                                        Possible values for this parameter are 0 and 1
 //
-//             FORWARDING:          Enable forwarding of floating-point results in the subsystem.
-//                                  For examle take this sequence:
-//                                      fmul.s fa4, fa5, fa6 // suppose takes 1 cycles
-//                                      fmul.s fa1, fa4, fa6 // suppose takes 1 cycles
-//                                  There is a source register dependency for the second instruction on the
-//                                  first instructions result. With FORWARDING = 1 this sequence takes 2 clock cycles
-//                                  while with FORWARDING = 0 this sequence takes 3 clock cycles.
+//             FORWARDING:                Enable forwarding of floating-point results in the subsystem.
+//                                        For example, take this sequence:
+//                                            fmul.s fa4, fa5, fa6 // suppose takes 1 cycles
+//                                            fmul.s fa1, fa4, fa6 // suppose takes 1 cycles
+//                                        There is a source register dependency for the second instruction on the
+//                                        first instruction's result. With FORWARDING = 1 this sequence takes 2 clock cycles
+//                                        while with FORWARDING = 0 this sequence takes 3 clock cycles.
 //
-//             FPU_FEATURES:        Parameter to configure the FPnew. The subsystem was designed for the configuration found here:
-//                                  https://github.com/moimfeld/cv32e40p/blob/x-interface/example_tb/core/fpu_ss/fpu_ss_pkg.sv
-//                                  Other configurations might not work
+//             FPU_FEATURES:              Parameter to configure the FPnew. The subsystem was designed for the configuration found here:
+//                                        https://github.com/moimfeld/cv32e40p/blob/x-interface/example_tb/core/fpu_ss/fpu_ss_pkg.sv
+//                                        Other configurations might not work
 //
-//             FPU_IMPLEMENTATION:  Parameter to configure the FPnew. The subsystem was designed for the configuration found here:
-//                                  https://github.com/moimfeld/cv32e40p/blob/x-interface/example_tb/core/fpu_ss/fpu_ss_pkg.sv
-//                                  Other configurations might not work
+//             FPU_IMPLEMENTATION:        Parameter to configure the FPnew. The subsystem was designed for the configuration found here:
+//                                        https://github.com/moimfeld/cv32e40p/blob/x-interface/example_tb/core/fpu_ss/fpu_ss_pkg.sv
+//                                        Other configurations might not work
+//
+//             INPUT_BUFFER_FALL_THROUGH: Enable fall-through mode of the FIFO input buffer. If INPUT_BUFFER_DEPTH is set to 0, this
+//                                        parameter doesn't have any effect.
+//                                        Possible values for this parameter are 0 and 1
 //
 // Contributor: Moritz Imfeld <moimfeld@student.ethz.ch>
 //              Davide Schiavone <davide@openhwgroup.org>
 
 module fpu_ss
     import fpu_ss_pkg::*;
 #(
-    parameter                                 PULP_ZFINX         = 0,
-    parameter                                 INPUT_BUFFER_DEPTH = 0,
-    parameter                                 OUT_OF_ORDER       = 1,
-    parameter                                 FORWARDING         = 1,
+    parameter                                 PULP_ZFINX                = 0,
+    parameter                                 INPUT_BUFFER_DEPTH        = 0,
+    parameter bit                             INPUT_BUFFER_FALL_THROUGH = 1,
+    parameter                                 OUT_OF_ORDER              = 1,
+    parameter                                 FORWARDING                = 1,
     // PulpDivSqrt = 0 enables T-head-based DivSqrt unit. Supported only for FP32-only instances of Fpnew
-    parameter logic                           PulpDivsqrt        = 1'b0,
-    parameter fpnew_pkg::fpu_features_t       FPU_FEATURES       = fpu_ss_pkg::FPU_FEATURES,
-    parameter fpnew_pkg::fpu_implementation_t FPU_IMPLEMENTATION = fpu_ss_pkg::FPU_IMPLEMENTATION
+    parameter logic                           PulpDivsqrt               = 1'b0,
+    parameter fpnew_pkg::fpu_features_t       FPU_FEATURES              = fpu_ss_pkg::FPU_FEATURES,
+    parameter fpnew_pkg::fpu_implementation_t FPU_IMPLEMENTATION        = fpu_ss_pkg::FPU_IMPLEMENTATION
 ) (
     // Clock and Reset
     input logic clk_i,
@@ -287,7 +291,7 @@ module fpu_ss
   generate
     if (INPUT_BUFFER_DEPTH > 0) begin : gen_input_stream_fifo
       stream_fifo #(
-          .FALL_THROUGH(1),
+          .FALL_THROUGH(INPUT_BUFFER_FALL_THROUGH),
           .DATA_WIDTH  (32),
           .DEPTH       (INPUT_BUFFER_DEPTH),
           .T           (offloaded_data_t)