[6] | 1 | // ========== Copyright Header Begin ========================================== |
---|
| 2 | // |
---|
| 3 | // OpenSPARC T1 Processor File: sparc_ifu_dcl.v |
---|
| 4 | // Copyright (c) 2006 Sun Microsystems, Inc. All Rights Reserved. |
---|
| 5 | // DO NOT ALTER OR REMOVE COPYRIGHT NOTICES. |
---|
| 6 | // |
---|
| 7 | // The above named program is free software; you can redistribute it and/or |
---|
| 8 | // modify it under the terms of the GNU General Public |
---|
| 9 | // License version 2 as published by the Free Software Foundation. |
---|
| 10 | // |
---|
| 11 | // The above named program is distributed in the hope that it will be |
---|
| 12 | // useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
| 13 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
---|
| 14 | // General Public License for more details. |
---|
| 15 | // |
---|
| 16 | // You should have received a copy of the GNU General Public |
---|
| 17 | // License along with this work; if not, write to the Free Software |
---|
| 18 | // Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. |
---|
| 19 | // |
---|
| 20 | // ========== Copyright Header End ============================================ |
---|
| 21 | //////////////////////////////////////////////////////////////////////// |
---|
| 22 | /* |
---|
| 23 | // Module Name: sparc_ifu_dcl |
---|
| 24 | // Description: |
---|
| 25 | // The decode control logic block does branch condition evaluation, |
---|
| 26 | // delay slot management, and appropriate condition code |
---|
| 27 | // selection. It also executes the tcc instruction and kills the E |
---|
| 28 | // stage instruction if a move did not succeed. The DCL block is |
---|
| 29 | // also responsible for generating the correct select signals to |
---|
| 30 | // choose the branch offset and immediate operand. |
---|
| 31 | // |
---|
| 32 | */ |
---|
| 33 | //////////////////////////////////////////////////////////////////////// |
---|
| 34 | |
---|
| 35 | `define CC_N 3 |
---|
| 36 | `define CC_Z 2 |
---|
| 37 | `define CC_V 1 |
---|
| 38 | `define CC_C 0 |
---|
| 39 | |
---|
| 40 | `define FP_U 3 |
---|
| 41 | `define FP_G 2 |
---|
| 42 | `define FP_L 1 |
---|
| 43 | `define FP_E 0 |
---|
| 44 | |
---|
| 45 | `define FSR_FCC0_HI 11 |
---|
| 46 | `define FSR_FCC0_LO 10 |
---|
| 47 | `define FSR_FCC1_HI 33 |
---|
| 48 | `define FSR_FCC1_LO 32 |
---|
| 49 | `define FSR_FCC2_HI 35 |
---|
| 50 | `define FSR_FCC2_LO 34 |
---|
| 51 | `define FSR_FCC3_HI 37 |
---|
| 52 | `define FSR_FCC3_LO 36 |
---|
| 53 | |
---|
| 54 | |
---|
| 55 | module sparc_ifu_dcl(/*AUTOARG*/ |
---|
| 56 | // Outputs |
---|
| 57 | ifu_exu_kill_e, ifu_exu_dontmv_regz0_e, ifu_exu_dontmv_regz1_e, |
---|
| 58 | ifu_exu_tcc_e, ifu_exu_dbrinst_d, ifu_ffu_mvcnd_m, |
---|
| 59 | dcl_fcl_bcregz0_e, dcl_fcl_bcregz1_e, dtu_inst_anull_e, |
---|
| 60 | dcl_swl_tcc_done_m, dcl_imd_immdata_sel_simm13_d_l, |
---|
| 61 | dcl_imd_immdata_sel_movcc_d_l, dcl_imd_immdata_sel_sethi_d_l, |
---|
| 62 | dcl_imd_immdata_sel_movr_d_l, dcl_imd_broff_sel_call_d_l, |
---|
| 63 | dcl_imd_broff_sel_br_d_l, dcl_imd_broff_sel_bcc_d_l, |
---|
| 64 | dcl_imd_broff_sel_bpcc_d_l, dcl_imd_immbr_sel_br_d, so, |
---|
| 65 | // Inputs |
---|
| 66 | rclk, se, si, dtu_reset, exu_ifu_cc_d, fcl_dcl_regz_e, |
---|
| 67 | exu_ifu_regn_e, ffu_ifu_cc_w2, ffu_ifu_cc_vld_w2, |
---|
| 68 | tlu_ifu_flush_pipe_w, swl_dcl_thr_d, swl_dcl_thr_w2, |
---|
| 69 | imd_dcl_brcond_d, imd_dcl_mvcond_d, fdp_dcl_op_s, fdp_dcl_op3_s, |
---|
| 70 | imd_dcl_abit_d, dec_dcl_cctype_d, dtu_dcl_opf2_d, |
---|
| 71 | fcl_dtu_inst_vld_e, fcl_dtu_intr_vld_e, ifu_tlu_flush_w |
---|
| 72 | ); |
---|
| 73 | |
---|
| 74 | input rclk, |
---|
| 75 | se, |
---|
| 76 | si, |
---|
| 77 | dtu_reset; |
---|
| 78 | |
---|
| 79 | input [7:0] exu_ifu_cc_d; // latest CCs from EXU |
---|
| 80 | |
---|
| 81 | input fcl_dcl_regz_e, // rs1=0 |
---|
| 82 | exu_ifu_regn_e; // rs1<0 |
---|
| 83 | |
---|
| 84 | input [7:0] ffu_ifu_cc_w2; |
---|
| 85 | input [3:0] ffu_ifu_cc_vld_w2; |
---|
| 86 | |
---|
| 87 | input tlu_ifu_flush_pipe_w; |
---|
| 88 | |
---|
| 89 | input [3:0] swl_dcl_thr_d, |
---|
| 90 | swl_dcl_thr_w2; |
---|
| 91 | |
---|
| 92 | input [3:0] imd_dcl_brcond_d; // branch condition type |
---|
| 93 | input [7:0] imd_dcl_mvcond_d; // mov condition type |
---|
| 94 | |
---|
| 95 | input [1:0] fdp_dcl_op_s; |
---|
| 96 | input [5:0] fdp_dcl_op3_s; |
---|
| 97 | input imd_dcl_abit_d; // anull bit for cond branch |
---|
| 98 | input [2:0] dec_dcl_cctype_d; // which cond codes to use |
---|
| 99 | input dtu_dcl_opf2_d; |
---|
| 100 | |
---|
| 101 | input fcl_dtu_inst_vld_e; |
---|
| 102 | input fcl_dtu_intr_vld_e; |
---|
| 103 | input ifu_tlu_flush_w; |
---|
| 104 | |
---|
| 105 | output ifu_exu_kill_e, |
---|
| 106 | ifu_exu_dontmv_regz0_e, |
---|
| 107 | ifu_exu_dontmv_regz1_e, |
---|
| 108 | ifu_exu_tcc_e; |
---|
| 109 | output ifu_exu_dbrinst_d; |
---|
| 110 | |
---|
| 111 | output ifu_ffu_mvcnd_m; |
---|
| 112 | |
---|
| 113 | output dcl_fcl_bcregz0_e, |
---|
| 114 | dcl_fcl_bcregz1_e; |
---|
| 115 | |
---|
| 116 | output dtu_inst_anull_e; |
---|
| 117 | output dcl_swl_tcc_done_m; |
---|
| 118 | |
---|
| 119 | output dcl_imd_immdata_sel_simm13_d_l, // imm data select |
---|
| 120 | dcl_imd_immdata_sel_movcc_d_l, |
---|
| 121 | dcl_imd_immdata_sel_sethi_d_l, |
---|
| 122 | dcl_imd_immdata_sel_movr_d_l; |
---|
| 123 | |
---|
| 124 | output dcl_imd_broff_sel_call_d_l, // dir branch offset select |
---|
| 125 | dcl_imd_broff_sel_br_d_l, |
---|
| 126 | dcl_imd_broff_sel_bcc_d_l, |
---|
| 127 | dcl_imd_broff_sel_bpcc_d_l; |
---|
| 128 | |
---|
| 129 | output dcl_imd_immbr_sel_br_d; |
---|
| 130 | |
---|
| 131 | output so; |
---|
| 132 | |
---|
| 133 | //---------------------------------------------------------------------- |
---|
| 134 | // Declarations |
---|
| 135 | //---------------------------------------------------------------------- |
---|
| 136 | |
---|
| 137 | wire [7:0] cc_breval_e, |
---|
| 138 | fp_breval_d; |
---|
| 139 | |
---|
| 140 | wire abit_e; |
---|
| 141 | |
---|
| 142 | wire cond_brtaken_e, |
---|
| 143 | anull_all, |
---|
| 144 | anull_ubr, |
---|
| 145 | anull_cbr; |
---|
| 146 | |
---|
| 147 | wire [3:0] anull_next_e, |
---|
| 148 | anull_e, |
---|
| 149 | thr_anull_d; |
---|
| 150 | |
---|
| 151 | wire inst_anull_d, |
---|
| 152 | inst_anull_e; |
---|
| 153 | |
---|
| 154 | wire [3:0] flush_abit; |
---|
| 155 | wire all_flush_w, |
---|
| 156 | all_flush_w2; |
---|
| 157 | |
---|
| 158 | wire br_always_e; |
---|
| 159 | |
---|
| 160 | wire sel_movcc, |
---|
| 161 | sel_movr; |
---|
| 162 | |
---|
| 163 | wire [3:0] br_cond_e, |
---|
| 164 | br_cond_d; |
---|
| 165 | wire [3:0] thr_vld_e; |
---|
| 166 | |
---|
| 167 | wire [3:0] ls_brcond_d, |
---|
| 168 | ls_brcond_e; |
---|
| 169 | wire [1:0] ccfp_sel; |
---|
| 170 | |
---|
| 171 | wire [3:0] cc_e; |
---|
| 172 | |
---|
| 173 | wire [1:0] curr_fcc_d; |
---|
| 174 | |
---|
| 175 | wire [7:0] fcc_d; |
---|
| 176 | |
---|
| 177 | wire [7:0] t0_fcc_d, |
---|
| 178 | t1_fcc_d, |
---|
| 179 | t2_fcc_d, |
---|
| 180 | t3_fcc_d, |
---|
| 181 | t0_fcc_nxt, |
---|
| 182 | t1_fcc_nxt, |
---|
| 183 | t2_fcc_nxt, |
---|
| 184 | t3_fcc_nxt; |
---|
| 185 | |
---|
| 186 | wire use_fcc0_d, |
---|
| 187 | use_fcc1_d, |
---|
| 188 | use_fcc2_d, |
---|
| 189 | use_fcc3_d; |
---|
| 190 | |
---|
| 191 | wire [3:0] thr_e, |
---|
| 192 | thr_dec_d; |
---|
| 193 | // fcc_dec_d, |
---|
| 194 | // fcc_dec_e; |
---|
| 195 | |
---|
| 196 | wire [1:0] op_d; |
---|
| 197 | wire [5:0] op3_d; |
---|
| 198 | |
---|
| 199 | wire use_xcc_d, |
---|
| 200 | ltz_e, |
---|
| 201 | cc_eval0, |
---|
| 202 | cc_eval1, |
---|
| 203 | fp_eval0_d, |
---|
| 204 | fp_eval1_d, |
---|
| 205 | fp_eval_d, |
---|
| 206 | fp_eval_e, |
---|
| 207 | r_eval1, |
---|
| 208 | r_eval0, |
---|
| 209 | ccfp_eval, |
---|
| 210 | ccbr_taken_e, |
---|
| 211 | mvbr_sel_br_d, |
---|
| 212 | cc_mvbr_d, |
---|
| 213 | cc_mvbr_e, |
---|
| 214 | fpcond_mvbr_d, |
---|
| 215 | fpcond_mvbr_e; |
---|
| 216 | |
---|
| 217 | wire call_inst_e, |
---|
| 218 | call_inst_d, |
---|
| 219 | dbr_inst_d, |
---|
| 220 | dbr_inst_e, |
---|
| 221 | ibr_inst_d, |
---|
| 222 | ibr_inst_e, |
---|
| 223 | mov_inst_d, |
---|
| 224 | mov_inst_e, |
---|
| 225 | tcc_done_e, |
---|
| 226 | tcc_inst_d, |
---|
| 227 | tcc_inst_e; |
---|
| 228 | |
---|
| 229 | wire clk; |
---|
| 230 | |
---|
| 231 | |
---|
| 232 | |
---|
| 233 | //---------------------------------------------------------------------- |
---|
| 234 | // Code start here |
---|
| 235 | //---------------------------------------------------------------------- |
---|
| 236 | assign clk = rclk; |
---|
| 237 | |
---|
| 238 | |
---|
| 239 | // S Stage Operands |
---|
| 240 | dff_s #(2) opreg(.din (fdp_dcl_op_s), |
---|
| 241 | .clk (clk), |
---|
| 242 | .q (op_d), |
---|
| 243 | .se (se), .si(), .so()); |
---|
| 244 | |
---|
| 245 | dff_s #(6) op3_reg(.din (fdp_dcl_op3_s), |
---|
| 246 | .clk (clk), |
---|
| 247 | .q (op3_d), |
---|
| 248 | .se (se), .si(), .so()); |
---|
| 249 | |
---|
| 250 | dff_s abite_reg(.din (imd_dcl_abit_d), |
---|
| 251 | .clk (clk), |
---|
| 252 | .q (abit_e), |
---|
| 253 | .se (se), .si(), .so()); |
---|
| 254 | |
---|
| 255 | // need to protect from scan contention |
---|
| 256 | dff_s #(4) thre_reg(.din (swl_dcl_thr_d), |
---|
| 257 | .q (thr_e), |
---|
| 258 | .clk (clk), .se(se), .si(), .so()); |
---|
| 259 | |
---|
| 260 | //------------------------------ |
---|
| 261 | // Choose correct immediate data |
---|
| 262 | //------------------------------ |
---|
| 263 | // movcc if op3 = 101100 |
---|
| 264 | assign dcl_imd_immdata_sel_movcc_d_l = ~(op_d[1] & |
---|
| 265 | op3_d[5] & ~op3_d[4] & |
---|
| 266 | op3_d[3] & ~op3_d[0]); |
---|
| 267 | |
---|
| 268 | // movr if op3 = 101111 |
---|
| 269 | //+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
---|
| 270 | // Reduced the number of terms in the eqn to help with timing |
---|
| 271 | // path, the result of which is that the immediate data sent to the |
---|
| 272 | // exu for a FLUSH instruction is INCORRECT! (It is decoded as a |
---|
| 273 | // MOVR). However, since our architecture completely ignores the |
---|
| 274 | // address of the flush, this should be ok. Confirmed with Sanjay |
---|
| 275 | // 03/31/03. (v1.29 -> 1.30) |
---|
| 276 | // ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ |
---|
| 277 | assign dcl_imd_immdata_sel_movr_d_l = ~(op_d[1] & |
---|
| 278 | op3_d[5] & op3_d[3] & |
---|
| 279 | op3_d[1] & op3_d[0]); |
---|
| 280 | |
---|
| 281 | // sethi if op3 = 100xx |
---|
| 282 | assign dcl_imd_immdata_sel_sethi_d_l = ~(~op_d[1]); |
---|
| 283 | |
---|
| 284 | // everything else |
---|
| 285 | assign dcl_imd_immdata_sel_simm13_d_l = |
---|
| 286 | ~(dcl_imd_immdata_sel_movcc_d_l & |
---|
| 287 | dcl_imd_immdata_sel_movr_d_l & |
---|
| 288 | dcl_imd_immdata_sel_sethi_d_l); |
---|
| 289 | |
---|
| 290 | //------------------------------ |
---|
| 291 | // Choose correct branch offset |
---|
| 292 | //------------------------------ |
---|
| 293 | // call or ld/store |
---|
| 294 | assign dcl_imd_broff_sel_call_d_l = ~(op_d[0]); |
---|
| 295 | |
---|
| 296 | // branch on register |
---|
| 297 | assign dcl_imd_broff_sel_br_d_l = ~(~op_d[0] & |
---|
| 298 | op3_d[4] & op3_d[3]); |
---|
| 299 | // branch w/o prediction |
---|
| 300 | assign dcl_imd_broff_sel_bcc_d_l = ~(~op_d[0] & |
---|
| 301 | op3_d[4] & ~op3_d[3]); |
---|
| 302 | // everything else |
---|
| 303 | assign dcl_imd_broff_sel_bpcc_d_l = ~(~op_d[0] & |
---|
| 304 | ~op3_d[4]); |
---|
| 305 | |
---|
| 306 | //------------------------------------ |
---|
| 307 | // mark branch/conditional instrctions |
---|
| 308 | //------------------------------------ |
---|
| 309 | // call |
---|
| 310 | assign call_inst_d = ~op_d[1] & op_d[0]; |
---|
| 311 | dff_s #(1) call_inste_reg(.din (call_inst_d), |
---|
| 312 | .clk (clk), |
---|
| 313 | .q (call_inst_e), |
---|
| 314 | .se (se), .si(), .so()); |
---|
| 315 | |
---|
| 316 | // call or branch but not nop/sethi |
---|
| 317 | assign dbr_inst_d = ~op_d[1] & (op_d[0] | op3_d[4] | op3_d[3]); |
---|
| 318 | |
---|
| 319 | // Choose between branch offset and immediate operand |
---|
| 320 | assign dcl_imd_immbr_sel_br_d = dbr_inst_d; |
---|
| 321 | |
---|
| 322 | // tell exu to use pc instead of rs1 |
---|
| 323 | assign ifu_exu_dbrinst_d = ~op_d[1]; |
---|
| 324 | |
---|
| 325 | dff_s #(1) dbr_inste_reg(.din (dbr_inst_d), |
---|
| 326 | .clk (clk), |
---|
| 327 | .q (dbr_inst_e), |
---|
| 328 | .se (se), .si(), .so()); |
---|
| 329 | |
---|
| 330 | // jmpl + return |
---|
| 331 | assign ibr_inst_d = op_d[1] & ~op_d[0] & |
---|
| 332 | op3_d[5] & op3_d[4] & op3_d[3] & |
---|
| 333 | ~op3_d[2] & ~op3_d[1]; |
---|
| 334 | dff_s #(1) ibr_inste_reg(.din (ibr_inst_d), |
---|
| 335 | .clk (clk), |
---|
| 336 | .q (ibr_inst_e), |
---|
| 337 | .se (se), .si(), .so()); |
---|
| 338 | // mov |
---|
| 339 | assign mov_inst_d = (op_d[1] & ~op_d[0] & |
---|
| 340 | op3_d[5] & ~op3_d[4] & op3_d[3] & op3_d[2] & |
---|
| 341 | (~op3_d[1] & ~op3_d[0] | op3_d[1] & op3_d[0])); |
---|
| 342 | |
---|
| 343 | dff_s #(1) mov_inste_reg(.din (mov_inst_d), |
---|
| 344 | .clk (clk), |
---|
| 345 | .q (mov_inst_e), |
---|
| 346 | .se (se), .si(), .so()); |
---|
| 347 | // tcc |
---|
| 348 | assign tcc_inst_d = op_d[1] & ~op_d[0] & |
---|
| 349 | op3_d[5] & op3_d[4] & op3_d[3] & |
---|
| 350 | ~op3_d[2] & op3_d[1] & ~op3_d[0]; |
---|
| 351 | dff_s #(1) tcc_inste_reg(.din (tcc_inst_d), |
---|
| 352 | .clk (clk), |
---|
| 353 | .q (tcc_inst_e), |
---|
| 354 | .se (se), .si(), .so()); |
---|
| 355 | |
---|
| 356 | assign mvbr_sel_br_d = ~op_d[1] & ~op_d[0] | // br |
---|
| 357 | op3_d[3] & ~op3_d[2] & op3_d[1] & ~op3_d[0]; // tcc |
---|
| 358 | |
---|
| 359 | assign cc_mvbr_d = ~(~op_d[1] & ~op_d[0] & op3_d[4] & op3_d[3] | // bpr |
---|
| 360 | op_d[1] & ~op_d[0] & op3_d[5] & ~op3_d[4] & |
---|
| 361 | op3_d[3] & op3_d[2] & op3_d[1] & op3_d[0] | // movr |
---|
| 362 | op_d[1] & ~op_d[0] & op3_d[5] & op3_d[4] & |
---|
| 363 | ~op3_d[3] & op3_d[2] & ~op3_d[1] & op3_d[0] & |
---|
| 364 | dtu_dcl_opf2_d); // fmovr |
---|
| 365 | |
---|
| 366 | |
---|
| 367 | //--------------------------- |
---|
| 368 | // FCC Logic |
---|
| 369 | //-------------------------- |
---|
| 370 | // choose current fcc |
---|
| 371 | assign use_fcc0_d = ~dec_dcl_cctype_d[1] & ~dec_dcl_cctype_d[0]; |
---|
| 372 | assign use_fcc1_d = ~dec_dcl_cctype_d[1] & dec_dcl_cctype_d[0]; |
---|
| 373 | assign use_fcc2_d = dec_dcl_cctype_d[1] & ~dec_dcl_cctype_d[0]; |
---|
| 374 | assign use_fcc3_d = dec_dcl_cctype_d[1] & dec_dcl_cctype_d[0]; |
---|
| 375 | |
---|
| 376 | mux4ds #(2) fcc_mux(.dout (curr_fcc_d[1:0]), |
---|
| 377 | .in0 (fcc_d[1:0]), |
---|
| 378 | .in1 (fcc_d[3:2]), |
---|
| 379 | .in2 (fcc_d[5:4]), |
---|
| 380 | .in3 (fcc_d[7:6]), |
---|
| 381 | .sel0 (use_fcc0_d), |
---|
| 382 | .sel1 (use_fcc1_d), |
---|
| 383 | .sel2 (use_fcc2_d), |
---|
| 384 | .sel3 (use_fcc3_d)); |
---|
| 385 | |
---|
| 386 | // decode to make next step easier |
---|
| 387 | // assign fcc_dec_d[0] = ~curr_fcc_d[1] & ~curr_fcc_d[0]; |
---|
| 388 | // assign fcc_dec_d[1] = ~curr_fcc_d[1] & curr_fcc_d[0]; |
---|
| 389 | // assign fcc_dec_d[2] = curr_fcc_d[1] & ~curr_fcc_d[0]; |
---|
| 390 | // assign fcc_dec_d[3] = curr_fcc_d[1] & curr_fcc_d[0]; |
---|
| 391 | |
---|
| 392 | // dff #(4) fcce_reg(.din (fcc_dec_d), |
---|
| 393 | // .q (fcc_dec_e), |
---|
| 394 | // .clk (clk), |
---|
| 395 | // .se (se), .si(), .so()); |
---|
| 396 | |
---|
| 397 | |
---|
| 398 | //------------------ |
---|
| 399 | // CC Logic for BCC |
---|
| 400 | //------------------ |
---|
| 401 | // Choose appropriate CCs |
---|
| 402 | // |
---|
| 403 | // dec_cctype is 3 bits |
---|
| 404 | // 10X icc |
---|
| 405 | // 11X xcc |
---|
| 406 | // 000 fcc0 |
---|
| 407 | // 001 fcc1 |
---|
| 408 | // 010 fcc2 |
---|
| 409 | // 011 fcc3 |
---|
| 410 | // assign use_xcc_d = (dec_dcl_cctype_d[2] | op3_d[3]) & dec_dcl_cctype_d[1]; |
---|
| 411 | assign use_xcc_d = dec_dcl_cctype_d[1]; |
---|
| 412 | assign fpcond_mvbr_d = ~dec_dcl_cctype_d[2] & ~tcc_inst_d; |
---|
| 413 | |
---|
| 414 | dff_s fpbr_reg(.din (fpcond_mvbr_d), |
---|
| 415 | .clk (clk), |
---|
| 416 | .q (fpcond_mvbr_e), |
---|
| 417 | .se (se), .si(), .so()); |
---|
| 418 | |
---|
| 419 | // mux between xcc and icc |
---|
| 420 | // assign cc_d = use_xcc_d ? exu_ifu_cc_d[7:4] : // xcc |
---|
| 421 | // exu_ifu_cc_d[3:0]; // icc |
---|
| 422 | // dff #(4) ccreg_e(.din (cc_d), |
---|
| 423 | // .clk (clk), |
---|
| 424 | // .q (cc_e), |
---|
| 425 | // .se (se), .si(), .so()); |
---|
| 426 | |
---|
| 427 | bw_u1_soffm2_4x UZsize_ccreg0_e(.d0 (exu_ifu_cc_d[0]), |
---|
| 428 | .d1 (exu_ifu_cc_d[4]), |
---|
| 429 | .s (use_xcc_d), |
---|
| 430 | .q (cc_e[0]), |
---|
| 431 | .ck (clk), .se(se), .sd(), .so()); |
---|
| 432 | bw_u1_soffm2_4x UZsize_ccreg1_e(.d0 (exu_ifu_cc_d[1]), |
---|
| 433 | .d1 (exu_ifu_cc_d[5]), |
---|
| 434 | .s (use_xcc_d), |
---|
| 435 | .q (cc_e[1]), |
---|
| 436 | .ck (clk), .se(se), .sd(), .so()); |
---|
| 437 | bw_u1_soffm2_4x UZsize_ccreg2_e(.d0 (exu_ifu_cc_d[2]), |
---|
| 438 | .d1 (exu_ifu_cc_d[6]), |
---|
| 439 | .s (use_xcc_d), |
---|
| 440 | .q (cc_e[2]), |
---|
| 441 | .ck (clk), .se(se), .sd(), .so()); |
---|
| 442 | bw_u1_soffm2_4x UZsize_ccreg3_e(.d0 (exu_ifu_cc_d[3]), |
---|
| 443 | .d1 (exu_ifu_cc_d[7]), |
---|
| 444 | .s (use_xcc_d), |
---|
| 445 | .q (cc_e[3]), |
---|
| 446 | .ck (clk), .se(se), .sd(), .so()); |
---|
| 447 | |
---|
| 448 | |
---|
| 449 | //------------------------------ |
---|
| 450 | // Evaluate Branch |
---|
| 451 | //------------------------------ |
---|
| 452 | // Select correct branch condition |
---|
| 453 | assign sel_movcc = ~mvbr_sel_br_d & cc_mvbr_d; |
---|
| 454 | assign sel_movr = ~mvbr_sel_br_d & ~cc_mvbr_d; |
---|
| 455 | |
---|
| 456 | // br_cond is the same as the "cond" field = inst[28:25] for bcc |
---|
| 457 | mux3ds #(4) brcond_mux(.dout (br_cond_d), |
---|
| 458 | .in0 (imd_dcl_brcond_d), // br or tcc |
---|
| 459 | .in1 (imd_dcl_mvcond_d[7:4]), // movcc |
---|
| 460 | .in2 (imd_dcl_mvcond_d[3:0]), // movr |
---|
| 461 | .sel0 (mvbr_sel_br_d), |
---|
| 462 | .sel1 (sel_movcc), |
---|
| 463 | .sel2 (sel_movr)); |
---|
| 464 | |
---|
| 465 | dff_s #(4) brcond_e_reg(.din (br_cond_d), |
---|
| 466 | .clk (clk), |
---|
| 467 | .q (br_cond_e), |
---|
| 468 | .se (se), .si(), .so()); |
---|
| 469 | |
---|
| 470 | // Branch Type Decode |
---|
| 471 | assign ls_brcond_d[0] = ~br_cond_d[1] & ~br_cond_d[0]; |
---|
| 472 | assign ls_brcond_d[1] = ~br_cond_d[1] & br_cond_d[0]; |
---|
| 473 | assign ls_brcond_d[2] = br_cond_d[1] & ~br_cond_d[0]; |
---|
| 474 | assign ls_brcond_d[3] = br_cond_d[1] & br_cond_d[0]; |
---|
| 475 | |
---|
| 476 | dff_s #(4) lsbrc_e_reg(.din (ls_brcond_d), |
---|
| 477 | .clk (clk), |
---|
| 478 | .q (ls_brcond_e), |
---|
| 479 | .se (se), .si(), .so()); |
---|
| 480 | |
---|
| 481 | // Evaluate potential integer CC branches |
---|
| 482 | assign ltz_e = (cc_e[`CC_N] ^ cc_e[`CC_V]); |
---|
| 483 | |
---|
| 484 | assign cc_breval_e[0] = 1'b0; // BPN |
---|
| 485 | assign cc_breval_e[1] = cc_e[`CC_Z]; // BPE |
---|
| 486 | assign cc_breval_e[2] = cc_e[`CC_Z] | ltz_e; // BPLE |
---|
| 487 | assign cc_breval_e[3] = ltz_e; // BPL |
---|
| 488 | assign cc_breval_e[4] = cc_e[`CC_Z] | cc_e[`CC_C]; // BPLEU |
---|
| 489 | assign cc_breval_e[5] = cc_e[`CC_C]; // BPCS |
---|
| 490 | assign cc_breval_e[6] = cc_e[`CC_N]; // BPNEG |
---|
| 491 | assign cc_breval_e[7] = cc_e[`CC_V]; // BPVS |
---|
| 492 | |
---|
| 493 | // mux to choose right condition |
---|
| 494 | assign cc_eval0 = cc_breval_e[0] & ls_brcond_e[0] | |
---|
| 495 | cc_breval_e[1] & ls_brcond_e[1] | |
---|
| 496 | cc_breval_e[2] & ls_brcond_e[2] | |
---|
| 497 | cc_breval_e[3] & ls_brcond_e[3]; |
---|
| 498 | |
---|
| 499 | assign cc_eval1 = cc_breval_e[4] & ls_brcond_e[0] | |
---|
| 500 | cc_breval_e[5] & ls_brcond_e[1] | |
---|
| 501 | cc_breval_e[6] & ls_brcond_e[2] | |
---|
| 502 | cc_breval_e[7] & ls_brcond_e[3]; |
---|
| 503 | |
---|
| 504 | // Evaluate FP CC branches in D stage |
---|
| 505 | assign fp_breval_d[0] = 1'b0; // FBN / A |
---|
| 506 | assign fp_breval_d[1] = (curr_fcc_d[1] | curr_fcc_d[0]); // FBNE / E |
---|
| 507 | assign fp_breval_d[2] = curr_fcc_d[1] ^ curr_fcc_d[0]; // FBLG / UE |
---|
| 508 | assign fp_breval_d[3] = curr_fcc_d[0]; // FBUL / GE |
---|
| 509 | assign fp_breval_d[4] = ~curr_fcc_d[1] & curr_fcc_d[0]; // FBL / UGE |
---|
| 510 | assign fp_breval_d[5] = curr_fcc_d[1]; // FBUG / LE |
---|
| 511 | assign fp_breval_d[6] = curr_fcc_d[1] & ~curr_fcc_d[0]; // FBG / ULE |
---|
| 512 | assign fp_breval_d[7] = curr_fcc_d[1] & curr_fcc_d[0]; // FBU / O |
---|
| 513 | |
---|
| 514 | assign fp_eval0_d = fp_breval_d[0] & ls_brcond_d[0] | |
---|
| 515 | fp_breval_d[1] & ls_brcond_d[1] | |
---|
| 516 | fp_breval_d[2] & ls_brcond_d[2] | |
---|
| 517 | fp_breval_d[3] & ls_brcond_d[3]; |
---|
| 518 | |
---|
| 519 | assign fp_eval1_d = fp_breval_d[4] & ls_brcond_d[0] | |
---|
| 520 | fp_breval_d[5] & ls_brcond_d[1] | |
---|
| 521 | fp_breval_d[6] & ls_brcond_d[2] | |
---|
| 522 | fp_breval_d[7] & ls_brcond_d[3]; |
---|
| 523 | |
---|
| 524 | assign fp_eval_d = br_cond_d[2] ? fp_eval1_d : |
---|
| 525 | fp_eval0_d; |
---|
| 526 | |
---|
| 527 | dff_s #(1) fpev_ff(.din (fp_eval_d), |
---|
| 528 | .q (fp_eval_e), |
---|
| 529 | .clk (clk), |
---|
| 530 | .se (se), .si(), .so()); |
---|
| 531 | |
---|
| 532 | // merge eval0, eval1 and fp condition codes |
---|
| 533 | assign ccfp_sel[0] = ~fpcond_mvbr_e & ~br_cond_e[2]; |
---|
| 534 | assign ccfp_sel[1] = ~fpcond_mvbr_e & br_cond_e[2]; |
---|
| 535 | // assign ccfp_sel[2] = fpcond_mvbr_e & ~br_cond_e[2]; |
---|
| 536 | // assign ccfp_sel[3] = fpcond_mvbr_e & br_cond_e[2]; |
---|
| 537 | |
---|
| 538 | assign ccfp_eval = ccfp_sel[0] & cc_eval0 | |
---|
| 539 | ccfp_sel[1] & cc_eval1 | |
---|
| 540 | fpcond_mvbr_e & fp_eval_e; |
---|
| 541 | |
---|
| 542 | // invert branch condition if this is an inverted br type |
---|
| 543 | // assign ccbr_taken_e = (ccfp_eval ^ br_cond_e[3]) & cc_mvbr_e; |
---|
| 544 | assign ccbr_taken_e = ccfp_eval ? (cc_mvbr_e & ~br_cond_e[3]) : |
---|
| 545 | (cc_mvbr_e & br_cond_e[3]); |
---|
| 546 | |
---|
| 547 | assign br_always_e = (~br_cond_e[0] & ~br_cond_e[1] & ~br_cond_e[2] & |
---|
| 548 | br_cond_e[3] & cc_mvbr_e); |
---|
| 549 | |
---|
| 550 | //-------------- |
---|
| 551 | // For BRZ |
---|
| 552 | // ------------- |
---|
| 553 | // Calculate Cond Assuming Z=1 And Z=0. Then Mux |
---|
| 554 | // assign r_eval1 = ((exu_ifu_regn_e | ~br_cond_e[1] | ~br_cond_e[0]) ^ |
---|
| 555 | // br_cond_e[2]) & ~cc_mvbr_e; |
---|
| 556 | assign r_eval1 = exu_ifu_regn_e ? (~br_cond_e[2] & ~cc_mvbr_e) : |
---|
| 557 | (((br_cond_e[1] & br_cond_e[0]) ^ |
---|
| 558 | ~br_cond_e[2]) & ~cc_mvbr_e); |
---|
| 559 | |
---|
| 560 | // assign r_eval0 = ((exu_ifu_regn_e & br_cond_e[1]) ^ |
---|
| 561 | // br_cond_e[2]) & ~cc_mvbr_e; |
---|
| 562 | assign r_eval0 = exu_ifu_regn_e ? ((br_cond_e[1] ^ br_cond_e[2]) & |
---|
| 563 | ~cc_mvbr_e) : |
---|
| 564 | (br_cond_e[2] & ~cc_mvbr_e); |
---|
| 565 | |
---|
| 566 | dff_s #(1) regcc_ff(.din (cc_mvbr_d), |
---|
| 567 | .clk (clk), |
---|
| 568 | .q (cc_mvbr_e), |
---|
| 569 | .se (se), .si(), .so()); |
---|
| 570 | |
---|
| 571 | // Evaluate Final Branch condition |
---|
| 572 | // 3:1 mux |
---|
| 573 | // assign cond_brtaken_e = cc_mvbr_e ? ccbr_taken_e : |
---|
| 574 | // exu_ifu_regz_e ? r_eval1 : |
---|
| 575 | // r_eval0; |
---|
| 576 | // 2:1 mux |
---|
| 577 | // assign cond_brtaken_e = exu_ifu_regz_e ? (r_eval1 | ccbr_taken_e) : |
---|
| 578 | // (r_eval0 | ccbr_taken_e); |
---|
| 579 | |
---|
| 580 | //////// Chandra //////// |
---|
| 581 | |
---|
| 582 | wire temp0, temp1, cond_brtaken_e_l; |
---|
| 583 | |
---|
| 584 | // limit loading on this signal |
---|
| 585 | // wire regz_buf_e; |
---|
| 586 | // bw_u1_buf_5x UZfix_regz_bf(.a (exu_ifu_regz_e), |
---|
| 587 | // .z (regz_buf_e)); |
---|
| 588 | |
---|
| 589 | assign temp0 = (r_eval0 | ccbr_taken_e); |
---|
| 590 | assign temp1 = (r_eval1 | ccbr_taken_e); |
---|
| 591 | |
---|
| 592 | bw_u1_muxi21_6x UZsize_cbtmux(.z(cond_brtaken_e_l), |
---|
| 593 | .d0(temp0), |
---|
| 594 | .d1(temp1), |
---|
| 595 | .s(fcl_dcl_regz_e)); |
---|
| 596 | |
---|
| 597 | bw_u1_inv_20x UZsize_cbtinv(.z(cond_brtaken_e), |
---|
| 598 | .a(cond_brtaken_e_l)); |
---|
| 599 | |
---|
| 600 | //////////////////////// |
---|
| 601 | |
---|
| 602 | assign dcl_fcl_bcregz0_e = (temp0 & dbr_inst_e | ibr_inst_e | |
---|
| 603 | call_inst_e) & ~dtu_inst_anull_e; |
---|
| 604 | assign dcl_fcl_bcregz1_e = (temp1 & dbr_inst_e | ibr_inst_e | |
---|
| 605 | call_inst_e) & ~dtu_inst_anull_e; |
---|
| 606 | |
---|
| 607 | // assign ifu_exu_dontmove_e = mov_inst_e & ~cond_brtaken_e; |
---|
| 608 | assign ifu_exu_dontmv_regz0_e = ~temp0 & mov_inst_e; |
---|
| 609 | assign ifu_exu_dontmv_regz1_e = ~temp1 & mov_inst_e; |
---|
| 610 | |
---|
| 611 | // branch condition to FPU |
---|
| 612 | dff_s #(1) fpcond_ff(.din (cond_brtaken_e), |
---|
| 613 | .q (ifu_ffu_mvcnd_m), |
---|
| 614 | .clk (clk), |
---|
| 615 | .se (se), .si(), .so()); |
---|
| 616 | |
---|
| 617 | // branch / move completion and anull signals |
---|
| 618 | // assign dtu_fcl_brtaken_e = ~dtu_inst_anull_e & |
---|
| 619 | // (ibr_inst_e | call_inst_e | |
---|
| 620 | // dbr_inst_e & cond_brtaken_e); |
---|
| 621 | |
---|
| 622 | // if mov didn't succeed kill write back and bypass |
---|
| 623 | // need to check thread as well |
---|
| 624 | // assign ifu_exu_kill_e = dtu_inst_anull_e | |
---|
| 625 | // ~fcl_dtu_inst_vld_e; // don't need this anymore |
---|
| 626 | assign ifu_exu_kill_e = dtu_inst_anull_e; |
---|
| 627 | |
---|
| 628 | |
---|
| 629 | // signal trap if tcc succeeds |
---|
| 630 | assign ifu_exu_tcc_e = ~dtu_inst_anull_e & tcc_inst_e & ccbr_taken_e & |
---|
| 631 | fcl_dtu_inst_vld_e; |
---|
| 632 | |
---|
| 633 | assign tcc_done_e = ~dtu_inst_anull_e & tcc_inst_e & ~ccbr_taken_e & |
---|
| 634 | fcl_dtu_inst_vld_e; |
---|
| 635 | |
---|
| 636 | dff_s #(1) tccm_ff(.din (tcc_done_e), |
---|
| 637 | .q (dcl_swl_tcc_done_m), |
---|
| 638 | .clk (clk), |
---|
| 639 | .se (se), .si(), .so()); |
---|
| 640 | |
---|
| 641 | // logic to anull delay slot, if this branch itsel is not anulled |
---|
| 642 | assign anull_cbr = abit_e & dbr_inst_e & ~br_always_e & ~call_inst_e; |
---|
| 643 | assign anull_ubr = abit_e & dbr_inst_e & br_always_e & ~call_inst_e; |
---|
| 644 | |
---|
| 645 | assign anull_all = anull_ubr | anull_cbr & ~cond_brtaken_e; |
---|
| 646 | |
---|
| 647 | // check which thread to anull |
---|
| 648 | assign thr_vld_e = thr_e & {4{fcl_dtu_inst_vld_e}}; |
---|
| 649 | |
---|
| 650 | assign all_flush_w = tlu_ifu_flush_pipe_w | ifu_tlu_flush_w; |
---|
| 651 | dff_s #(1) flshw2_ff(.din (all_flush_w), |
---|
| 652 | .q (all_flush_w2), |
---|
| 653 | .clk (clk), .se(se), .si(), .so()); |
---|
| 654 | |
---|
| 655 | assign flush_abit = swl_dcl_thr_w2 & {4{all_flush_w2}}; |
---|
| 656 | |
---|
| 657 | assign anull_next_e = ((~anull_e & {4{anull_all}} & thr_vld_e) | |
---|
| 658 | (anull_e & ~(thr_e & {4{fcl_dtu_inst_vld_e | |
---|
| 659 | fcl_dtu_intr_vld_e}}))) & |
---|
| 660 | ~flush_abit; |
---|
| 661 | |
---|
| 662 | // anull_e needs to be per thread |
---|
| 663 | dffr_s #(4) anull_ff(.din (anull_next_e), |
---|
| 664 | .clk (clk), |
---|
| 665 | .rst (dtu_reset), |
---|
| 666 | .q (anull_e), |
---|
| 667 | .se (se), .si(), .so()); |
---|
| 668 | |
---|
| 669 | // |
---|
| 670 | // assign thr_dec_e[0] = swl_dcl_thr_e[0] | rst_tri_enable; |
---|
| 671 | // assign thr_dec_e[3:1] = swl_dcl_thr_e[3:1] & {3{~rst_tri_enable}}; |
---|
| 672 | |
---|
| 673 | assign thr_anull_d = swl_dcl_thr_d & anull_next_e; |
---|
| 674 | assign inst_anull_d = (|thr_anull_d[3:0]); |
---|
| 675 | dff_s #(1) ina_ff(.din (inst_anull_d), |
---|
| 676 | .q (inst_anull_e), |
---|
| 677 | .clk (clk), .se (se), .si(), .so()); |
---|
| 678 | |
---|
| 679 | assign dtu_inst_anull_e = inst_anull_e; |
---|
| 680 | |
---|
| 681 | // mux4ds dcla_mux(.dout (this_inst_anull_e), |
---|
| 682 | // .in0 (anull_e[0]), |
---|
| 683 | // .in1 (anull_e[1]), |
---|
| 684 | // .in2 (anull_e[2]), |
---|
| 685 | // .in3 (anull_e[3]), |
---|
| 686 | // .sel0 (thr_dec_e[0]), |
---|
| 687 | // .sel1 (thr_dec_e[1]), |
---|
| 688 | // .sel2 (thr_dec_e[2]), |
---|
| 689 | // .sel3 (thr_dec_e[3])); |
---|
| 690 | // assign dtu_inst_anull_e = this_inst_anull_e & fcl_dtu_inst_vld_e; |
---|
| 691 | |
---|
| 692 | |
---|
| 693 | //-------------------- |
---|
| 694 | // Copy of FCC |
---|
| 695 | //-------------------- |
---|
| 696 | // FCC's are maintained in the ffu. A copy is kept here to run the |
---|
| 697 | // FP branch instructions. |
---|
| 698 | |
---|
| 699 | // load FCC from FFU |
---|
| 700 | mux2ds #(8) t0_fcc_mux(.dout (t0_fcc_nxt[7:0]), |
---|
| 701 | .in0 (t0_fcc_d[7:0]), |
---|
| 702 | .in1 (ffu_ifu_cc_w2[7:0]), |
---|
| 703 | .sel0 (~ffu_ifu_cc_vld_w2[0]), |
---|
| 704 | .sel1 (ffu_ifu_cc_vld_w2[0])); |
---|
| 705 | |
---|
| 706 | dffr_s #(8) t0_fcc_reg(.din (t0_fcc_nxt[7:0]), |
---|
| 707 | .q (t0_fcc_d[7:0]), |
---|
| 708 | .rst (dtu_reset), |
---|
| 709 | .clk (clk), .se (se), .si(), .so()); |
---|
| 710 | `ifdef FPGA_SYN_1THREAD |
---|
| 711 | assign fcc_d[7:0] = t0_fcc_d[7:0]; |
---|
| 712 | `else |
---|
| 713 | |
---|
| 714 | mux2ds #(8) t1_fcc_mux(.dout (t1_fcc_nxt[7:0]), |
---|
| 715 | .in0 (t1_fcc_d[7:0]), |
---|
| 716 | .in1 (ffu_ifu_cc_w2[7:0]), |
---|
| 717 | .sel0 (~ffu_ifu_cc_vld_w2[1]), |
---|
| 718 | .sel1 (ffu_ifu_cc_vld_w2[1])); |
---|
| 719 | |
---|
| 720 | mux2ds #(8) t2_fcc_mux(.dout (t2_fcc_nxt[7:0]), |
---|
| 721 | .in0 (t2_fcc_d[7:0]), |
---|
| 722 | .in1 (ffu_ifu_cc_w2[7:0]), |
---|
| 723 | .sel0 (~ffu_ifu_cc_vld_w2[2]), |
---|
| 724 | .sel1 (ffu_ifu_cc_vld_w2[2])); |
---|
| 725 | |
---|
| 726 | mux2ds #(8) t3_fcc_mux(.dout (t3_fcc_nxt[7:0]), |
---|
| 727 | .in0 (t3_fcc_d[7:0]), |
---|
| 728 | .in1 (ffu_ifu_cc_w2[7:0]), |
---|
| 729 | .sel0 (~ffu_ifu_cc_vld_w2[3]), |
---|
| 730 | .sel1 (ffu_ifu_cc_vld_w2[3])); |
---|
| 731 | |
---|
| 732 | // thread0 fcc registers |
---|
| 733 | |
---|
| 734 | dffr_s #(8) t1_fcc_reg(.din (t1_fcc_nxt[7:0]), |
---|
| 735 | .q (t1_fcc_d[7:0]), |
---|
| 736 | .rst (dtu_reset), |
---|
| 737 | .clk (clk), .se (se), .si(), .so()); |
---|
| 738 | dffr_s #(8) t2_fcc_reg(.din (t2_fcc_nxt[7:0]), |
---|
| 739 | .q (t2_fcc_d[7:0]), |
---|
| 740 | .rst (dtu_reset), |
---|
| 741 | .clk (clk), .se (se), .si(), .so()); |
---|
| 742 | dffr_s #(8) t3_fcc_reg(.din (t3_fcc_nxt[7:0]), |
---|
| 743 | .q (t3_fcc_d[7:0]), |
---|
| 744 | .rst (dtu_reset), |
---|
| 745 | .clk (clk), .se (se), .si(), .so()); |
---|
| 746 | |
---|
| 747 | // choose thread |
---|
| 748 | assign thr_dec_d[0] = swl_dcl_thr_d[0]; |
---|
| 749 | assign thr_dec_d[3:1] = swl_dcl_thr_d[3:1]; |
---|
| 750 | |
---|
| 751 | mux4ds #(8) fcc0d_mx(.dout (fcc_d[7:0]), |
---|
| 752 | .in0 (t0_fcc_d[7:0]), |
---|
| 753 | .in1 (t1_fcc_d[7:0]), |
---|
| 754 | .in2 (t2_fcc_d[7:0]), |
---|
| 755 | .in3 (t3_fcc_d[7:0]), |
---|
| 756 | .sel0 (thr_dec_d[0]), |
---|
| 757 | .sel1 (thr_dec_d[1]), |
---|
| 758 | .sel2 (thr_dec_d[2]), |
---|
| 759 | .sel3 (thr_dec_d[3])); |
---|
| 760 | |
---|
| 761 | `endif // !`ifdef FPGA_SYN_1THREAD |
---|
| 762 | |
---|
| 763 | endmodule // sparc_ifu_dcl |
---|
| 764 | |
---|