1 | // ========== Copyright Header Begin ========================================== |
---|
2 | // |
---|
3 | // OpenSPARC T1 Processor File: sparc_exu_eclccr.v |
---|
4 | // Copyright (c) 2006 Sun Microsystems, Inc. All Rights Reserved. |
---|
5 | // DO NOT ALTER OR REMOVE COPYRIGHT NOTICES. |
---|
6 | // |
---|
7 | // The above named program is free software; you can redistribute it and/or |
---|
8 | // modify it under the terms of the GNU General Public |
---|
9 | // License version 2 as published by the Free Software Foundation. |
---|
10 | // |
---|
11 | // The above named program is distributed in the hope that it will be |
---|
12 | // useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
13 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
---|
14 | // General Public License for more details. |
---|
15 | // |
---|
16 | // You should have received a copy of the GNU General Public |
---|
17 | // License along with this work; if not, write to the Free Software |
---|
18 | // Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. |
---|
19 | // |
---|
20 | // ========== Copyright Header End ============================================ |
---|
21 | //////////////////////////////////////////////////////////////////////// |
---|
22 | /* |
---|
23 | // Module Name: sparc_exu_eclccr |
---|
24 | // Description: 4 bit condition code registers with forwarding. Takes |
---|
25 | // the e_stage result and writes on the w stage. |
---|
26 | */ |
---|
27 | |
---|
28 | module sparc_exu_eclccr (/*AUTOARG*/ |
---|
29 | // Outputs |
---|
30 | exu_ifu_cc_d, exu_tlu_ccr0_w, exu_tlu_ccr1_w, exu_tlu_ccr2_w, |
---|
31 | exu_tlu_ccr3_w, |
---|
32 | // Inputs |
---|
33 | clk, se, alu_xcc_e, alu_icc_e, tid_d, thrdec_d, thr_match_dm, |
---|
34 | thr_match_de, tid_w, thr_w, ifu_exu_kill_e, ifu_exu_setcc_d, |
---|
35 | byp_ecl_wrccr_data_w, wb_ccr_wrccr_w, wb_ccr_setcc_g, |
---|
36 | divcntl_ccr_cc_w2, wb_ccr_thr_g, tlu_exu_cwpccr_update_m, |
---|
37 | tlu_exu_ccr_m, ifu_exu_inst_vld_w, ifu_tlu_flush_w, early_flush_w |
---|
38 | ) ; |
---|
39 | input clk; |
---|
40 | input se; |
---|
41 | input [3:0] alu_xcc_e; // condition codes from the alu |
---|
42 | input [3:0] alu_icc_e; |
---|
43 | input [1:0] tid_d; // thread for each stage |
---|
44 | input [3:0] thrdec_d; // decoded tid_d for mux select |
---|
45 | input thr_match_dm; |
---|
46 | input thr_match_de; |
---|
47 | input [1:0] tid_w; |
---|
48 | input [3:0] thr_w; // decoded tid_w |
---|
49 | input ifu_exu_kill_e; |
---|
50 | input ifu_exu_setcc_d; |
---|
51 | input [7:0] byp_ecl_wrccr_data_w;// for the WRCCR operation (LSBs of |
---|
52 | input wb_ccr_wrccr_w; // ALU result) + wen signal |
---|
53 | input wb_ccr_setcc_g; |
---|
54 | input [7:0] divcntl_ccr_cc_w2; |
---|
55 | input [1:0] wb_ccr_thr_g; |
---|
56 | input tlu_exu_cwpccr_update_m; |
---|
57 | input [7:0] tlu_exu_ccr_m; |
---|
58 | input ifu_exu_inst_vld_w; |
---|
59 | input ifu_tlu_flush_w; |
---|
60 | input early_flush_w; |
---|
61 | |
---|
62 | output [7:0] exu_ifu_cc_d; // condition codes for current thread |
---|
63 | output [7:0] exu_tlu_ccr0_w; |
---|
64 | output [7:0] exu_tlu_ccr1_w; |
---|
65 | output [7:0] exu_tlu_ccr2_w; |
---|
66 | output [7:0] exu_tlu_ccr3_w; |
---|
67 | |
---|
68 | wire [7:0] partial_cc_d; // partial bypassed ccr |
---|
69 | wire [7:0] alu_cc_e; // alu combined condition codes |
---|
70 | wire [7:0] alu_cc_m; // m stage alu ccs |
---|
71 | wire [7:0] alu_cc_w; |
---|
72 | wire [7:0] exu_ifu_cc_w; // writeback data |
---|
73 | wire setcc_e; // from previous stage |
---|
74 | wire setcc_m; |
---|
75 | wire setcc_w; |
---|
76 | wire valid_setcc_e; // after comparing with kill |
---|
77 | wire valid_setcc_m; |
---|
78 | wire valid_setcc_w; |
---|
79 | wire setcc_w2; |
---|
80 | wire [7:0] ccrin_thr0; |
---|
81 | wire [7:0] ccrin_thr1; |
---|
82 | wire [7:0] ccrin_thr2; |
---|
83 | wire [7:0] ccrin_thr3; |
---|
84 | wire [7:0] ccr_d; |
---|
85 | wire [7:0] ccr_thr0; |
---|
86 | wire [7:0] ccr_thr1; |
---|
87 | wire [7:0] ccr_thr2; |
---|
88 | wire [7:0] ccr_thr3; |
---|
89 | wire use_alu_cc; |
---|
90 | wire use_ccr; |
---|
91 | wire use_cc_e; |
---|
92 | wire use_cc_m; |
---|
93 | wire use_cc_w; |
---|
94 | wire [1:0] tid_dxorw; |
---|
95 | wire thr_match_de; |
---|
96 | wire thrmatch_w; |
---|
97 | wire [1:0] thr_w2; |
---|
98 | wire thr0_w2; |
---|
99 | wire thr1_w2; |
---|
100 | wire thr2_w2; |
---|
101 | wire thr3_w2; |
---|
102 | wire wen_thr0_w; // write enable for each input/thread |
---|
103 | wire wen_thr0_w2; |
---|
104 | wire wen_thr1_w; |
---|
105 | wire wen_thr1_w2; |
---|
106 | wire wen_thr2_w; |
---|
107 | wire wen_thr2_w2; |
---|
108 | wire wen_thr3_w; |
---|
109 | wire wen_thr3_w2; |
---|
110 | wire wen_thr0_l; // overall write enable for each thread |
---|
111 | wire wen_thr1_l; |
---|
112 | wire wen_thr2_l; |
---|
113 | wire wen_thr3_l; |
---|
114 | wire bypass_cc_w; |
---|
115 | |
---|
116 | wire [7:0] ccr_m; |
---|
117 | |
---|
118 | |
---|
119 | // D2E flops |
---|
120 | dff_s dff_setcc_d2e(.din(ifu_exu_setcc_d), .clk(clk), .q(setcc_e), |
---|
121 | .se(se), .si(), .so()); |
---|
122 | |
---|
123 | // E stage |
---|
124 | assign alu_cc_e = {alu_xcc_e, alu_icc_e}; |
---|
125 | assign valid_setcc_e = setcc_e & ~ifu_exu_kill_e; |
---|
126 | |
---|
127 | dff_s #(8) dff_cc_e2m(.din(alu_cc_e[7:0]), .clk(clk), .q(alu_cc_m[7:0]), |
---|
128 | .se(se), .si(), .so()); |
---|
129 | dff_s dff_setcc_e2m(.din(valid_setcc_e), .clk(clk), .q(setcc_m), |
---|
130 | .se(se), .si(), .so()); |
---|
131 | |
---|
132 | // M stage |
---|
133 | assign valid_setcc_m = setcc_m | tlu_exu_cwpccr_update_m; |
---|
134 | mux2ds #(8) mux_ccr_m(.dout(ccr_m[7:0]), |
---|
135 | .in0(alu_cc_m[7:0]), |
---|
136 | .in1(tlu_exu_ccr_m[7:0]), |
---|
137 | .sel0(~tlu_exu_cwpccr_update_m), |
---|
138 | .sel1(tlu_exu_cwpccr_update_m)); |
---|
139 | |
---|
140 | dff_s #(8) dff_cc_m2w(.din(ccr_m[7:0]), .clk(clk), .q(alu_cc_w[7:0]), |
---|
141 | .se(se), .si(), .so()); |
---|
142 | dff_s dff_setcc_m2w(.din(valid_setcc_m), .clk(clk), .q(setcc_w), |
---|
143 | .se(se), .si(), .so()); |
---|
144 | |
---|
145 | // W stage |
---|
146 | assign bypass_cc_w = ifu_exu_inst_vld_w & setcc_w; |
---|
147 | assign valid_setcc_w = ~ifu_tlu_flush_w & ~early_flush_w & ifu_exu_inst_vld_w & (setcc_w | wb_ccr_wrccr_w); |
---|
148 | |
---|
149 | // mux with wrccr |
---|
150 | assign use_alu_cc = ~(wb_ccr_wrccr_w); |
---|
151 | mux2ds #(8) mux_ccrin_cc(.dout(exu_ifu_cc_w[7:0]), .sel0(wb_ccr_wrccr_w), |
---|
152 | .sel1(use_alu_cc), |
---|
153 | .in0(byp_ecl_wrccr_data_w[7:0]), |
---|
154 | .in1(alu_cc_w[7:0])); |
---|
155 | |
---|
156 | dff_s #(3) setcc_g2w2 (.din({wb_ccr_setcc_g, wb_ccr_thr_g[1:0]}), .clk(clk), |
---|
157 | .q({setcc_w2, thr_w2[1:0]}), |
---|
158 | .se(se), .si(), .so()); |
---|
159 | |
---|
160 | |
---|
161 | ///////////////////////// |
---|
162 | // Storage of ccr |
---|
163 | ///////////////////////// |
---|
164 | `ifdef FPGA_SYN_1THREAD |
---|
165 | |
---|
166 | assign thr0_w2 = ~thr_w2[1] & ~thr_w2[0]; |
---|
167 | assign wen_thr0_w = (thr_w[0] & valid_setcc_w & ~wen_thr0_w2); |
---|
168 | assign wen_thr0_w2 = thr0_w2 & setcc_w2; |
---|
169 | assign wen_thr0_l = ~(wen_thr0_w | wen_thr0_w2); |
---|
170 | // mux between cc_w, cc_w2, old value, tlu value |
---|
171 | mux3ds #(8) mux_ccrin0(.dout(ccrin_thr0[7:0]), .sel0(wen_thr0_w), |
---|
172 | .sel1(wen_thr0_w2), .sel2(wen_thr0_l), |
---|
173 | .in0(exu_ifu_cc_w[7:0]), |
---|
174 | .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr0[7:0])); |
---|
175 | // store new value |
---|
176 | dff_s #(8) dff_ccr_thr0(.din(ccrin_thr0[7:0]), .clk(clk), .q(ccr_thr0[7:0]), |
---|
177 | .se(se), .si(), .so()); |
---|
178 | assign ccr_d[7:0] = ccr_thr0[7:0]; |
---|
179 | |
---|
180 | `else // !`ifdef FPGA_SYN_1THREAD |
---|
181 | |
---|
182 | // decode thr_w2 for mux select |
---|
183 | assign thr0_w2 = ~thr_w2[1] & ~thr_w2[0]; |
---|
184 | assign thr1_w2 = ~thr_w2[1] & thr_w2[0]; |
---|
185 | assign thr2_w2 = thr_w2[1] & ~thr_w2[0]; |
---|
186 | assign thr3_w2 = thr_w2[1] & thr_w2[0]; |
---|
187 | // enable input for each thread |
---|
188 | assign wen_thr0_w = (thr_w[0] & valid_setcc_w & ~wen_thr0_w2); |
---|
189 | assign wen_thr0_w2 = thr0_w2 & setcc_w2; |
---|
190 | assign wen_thr0_l = ~(wen_thr0_w | wen_thr0_w2); |
---|
191 | assign wen_thr1_w = (thr_w[1] & valid_setcc_w & ~wen_thr1_w2); |
---|
192 | assign wen_thr1_w2 = (thr1_w2 & setcc_w2); |
---|
193 | assign wen_thr1_l = ~(wen_thr1_w | wen_thr1_w2); |
---|
194 | assign wen_thr2_w = (thr_w[2] & valid_setcc_w & ~wen_thr2_w2); |
---|
195 | assign wen_thr2_w2 = (thr2_w2 & setcc_w2); |
---|
196 | assign wen_thr2_l = ~(wen_thr2_w | wen_thr2_w2); |
---|
197 | assign wen_thr3_w = (thr_w[3] & valid_setcc_w & ~wen_thr3_w2); |
---|
198 | assign wen_thr3_w2 = (thr3_w2 & setcc_w2); |
---|
199 | assign wen_thr3_l = ~(wen_thr3_w | wen_thr3_w2); |
---|
200 | |
---|
201 | // mux between cc_w, cc_w2, old value, tlu value |
---|
202 | mux3ds #(8) mux_ccrin0(.dout(ccrin_thr0[7:0]), .sel0(wen_thr0_w), |
---|
203 | .sel1(wen_thr0_w2), .sel2(wen_thr0_l), |
---|
204 | .in0(exu_ifu_cc_w[7:0]), |
---|
205 | .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr0[7:0])); |
---|
206 | mux3ds #(8) mux_ccrin1(.dout(ccrin_thr1[7:0]), .sel0(wen_thr1_w), |
---|
207 | .sel1(wen_thr1_w2), .sel2(wen_thr1_l), |
---|
208 | .in0(exu_ifu_cc_w[7:0]), |
---|
209 | .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr1[7:0])); |
---|
210 | mux3ds #(8) mux_ccrin2(.dout(ccrin_thr2[7:0]), .sel0(wen_thr2_w), |
---|
211 | .sel1(wen_thr2_w2), .sel2(wen_thr2_l), |
---|
212 | .in0(exu_ifu_cc_w[7:0]), |
---|
213 | .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr2[7:0])); |
---|
214 | mux3ds #(8) mux_ccrin3(.dout(ccrin_thr3[7:0]), .sel0(wen_thr3_w), |
---|
215 | .sel1(wen_thr3_w2), .sel2(wen_thr3_l), |
---|
216 | .in0(exu_ifu_cc_w[7:0]), |
---|
217 | .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr3[7:0])); |
---|
218 | |
---|
219 | // store new value |
---|
220 | dff_s #(8) dff_ccr_thr0(.din(ccrin_thr0[7:0]), .clk(clk), .q(ccr_thr0[7:0]), |
---|
221 | .se(se), .si(), .so()); |
---|
222 | dff_s #(8) dff_ccr_thr1(.din(ccrin_thr1[7:0]), .clk(clk), .q(ccr_thr1[7:0]), |
---|
223 | .se(se), .si(), .so()); |
---|
224 | dff_s #(8) dff_ccr_thr2(.din(ccrin_thr2[7:0]), .clk(clk), .q(ccr_thr2[7:0]), |
---|
225 | .se(se), .si(), .so()); |
---|
226 | dff_s #(8) dff_ccr_thr3(.din(ccrin_thr3[7:0]), .clk(clk), .q(ccr_thr3[7:0]), |
---|
227 | .se(se), .si(), .so()); |
---|
228 | |
---|
229 | |
---|
230 | // mux between the 4 sets of ccrs |
---|
231 | mux4ds #(8) mux_ccr_out(.dout(ccr_d[7:0]), .sel0(thrdec_d[0]), |
---|
232 | .sel1(thrdec_d[1]), .sel2(thrdec_d[2]), |
---|
233 | .sel3(thrdec_d[3]), .in0(ccr_thr0[7:0]), |
---|
234 | .in1(ccr_thr1[7:0]), .in2(ccr_thr2[7:0]), |
---|
235 | .in3(ccr_thr3[7:0])); |
---|
236 | `endif // !`ifdef FPGA_SYN_1THREAD |
---|
237 | |
---|
238 | // bypass the ccs to the output. Only alu result needs to be bypassed |
---|
239 | assign exu_ifu_cc_d[7:0] = (use_cc_e)? alu_cc_e[7:0]: partial_cc_d[7:0]; |
---|
240 | mux3ds #(8) mux_ccr_bypass1(.dout(partial_cc_d[7:0]), |
---|
241 | .sel0(use_ccr), |
---|
242 | .sel1(use_cc_m), |
---|
243 | .sel2(use_cc_w), |
---|
244 | .in0(ccr_d[7:0]), |
---|
245 | .in1(alu_cc_m[7:0]), |
---|
246 | .in2(alu_cc_w[7:0])); |
---|
247 | |
---|
248 | assign use_cc_e = valid_setcc_e & thr_match_de; |
---|
249 | assign use_cc_m = setcc_m & thr_match_dm; |
---|
250 | assign use_cc_w = bypass_cc_w & thrmatch_w & ~use_cc_m; |
---|
251 | assign use_ccr = ~(use_cc_m | use_cc_w); |
---|
252 | |
---|
253 | assign tid_dxorw = tid_w ^ tid_d; |
---|
254 | |
---|
255 | assign thrmatch_w = ~(tid_dxorw[1] | tid_dxorw[0]); |
---|
256 | |
---|
257 | // generate ccr_w for the tlu |
---|
258 | assign exu_tlu_ccr0_w[7:0] = ccr_thr0[7:0]; |
---|
259 | assign exu_tlu_ccr1_w[7:0] = ccr_thr1[7:0]; |
---|
260 | assign exu_tlu_ccr2_w[7:0] = ccr_thr2[7:0]; |
---|
261 | assign exu_tlu_ccr3_w[7:0] = ccr_thr3[7:0]; |
---|
262 | |
---|
263 | |
---|
264 | endmodule // sparc_exu_eclccr |
---|