/*************************************************************************************** * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences * Copyright (c) 2020-2021 Peng Cheng Laboratory * * XiangShan is licensed under Mulan PSL v2. * You can use this software according to the terms and conditions of the Mulan PSL v2. * You may obtain a copy of Mulan PSL v2 at: * http://license.coscl.org.cn/MulanPSL2 * * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * * See the Mulan PSL v2 for more details. * * * Acknowledgement * * This implementation is inspired by several key papers: * [1] Andrew D. Booth. "[A signed binary multiplication technique.](https://doi.org/10.1093/qjmam/4.2.236)" The * Quarterly Journal of Mechanics and Applied Mathematics 4.2: 236-240. 1951. * [2] Christopher. S. Wallace. "[A suggestion for a fast multiplier.](https://doi.org/10.1109/PGEC.1964.263830)" IEEE * Transactions on Electronic Computers 1: 14-17. 1964. ***************************************************************************************/ package xiangshan.backend.fu import org.chipsalliance.cde.config.Parameters import chisel3._ import chisel3.util._ import utility._ import utils._ import xiangshan._ import xiangshan.backend.fu.util.{C22, C32, C53} class MulDivCtrl extends Bundle{ val sign = Bool() val isW = Bool() val isHi = Bool() // return hi bits of result ? } class ArrayMulDataModule(len: Int) extends Module { val io = IO(new Bundle() { val a, b = Input(UInt(len.W)) val regEnables = Input(Vec(2, Bool())) val result = Output(UInt((2 * len).W)) }) val (a, b) = (io.a, io.b) val b_sext, bx2, neg_b, neg_bx2 = Wire(UInt((len+1).W)) b_sext := SignExt(b, len+1) bx2 := b_sext << 1 neg_b := (~b_sext).asUInt neg_bx2 := neg_b << 1 val columns: Array[Seq[Bool]] = Array.fill(2*len)(Seq()) var last_x = WireInit(0.U(3.W)) for(i <- Range(0, len, 2)){ val x = if(i==0) Cat(a(1,0), 0.U(1.W)) else if(i+1==len) SignExt(a(i, i-1), 3) else a(i+1, i-1) val pp_temp = MuxLookup(x, 0.U)(Seq( 1.U -> b_sext, 2.U -> b_sext, 3.U -> bx2, 4.U -> neg_bx2, 5.U -> neg_b, 6.U -> neg_b )) val s = pp_temp(len) val t = MuxLookup(last_x, 0.U(2.W))(Seq( 4.U -> 2.U(2.W), 5.U -> 1.U(2.W), 6.U -> 1.U(2.W) )) last_x = x val (pp, weight) = i match { case 0 => (Cat(~s, s, s, pp_temp), 0) case n if (n==len-1) || (n==len-2) => (Cat(~s, pp_temp, t), i-2) case _ => (Cat(1.U(1.W), ~s, pp_temp, t), i-2) } for(j <- columns.indices){ if(j >= weight && j < (weight + pp.getWidth)){ columns(j) = columns(j) :+ pp(j-weight) } } } def addOneColumn(col: Seq[Bool], cin: Seq[Bool]): (Seq[Bool], Seq[Bool], Seq[Bool]) = { var sum = Seq[Bool]() var cout1 = Seq[Bool]() var cout2 = Seq[Bool]() col.size match { case 1 => // do nothing sum = col ++ cin case 2 => val c22 = Module(new C22) c22.io.in := col sum = c22.io.out(0).asBool +: cin cout2 = Seq(c22.io.out(1).asBool) case 3 => val c32 = Module(new C32) c32.io.in := col sum = c32.io.out(0).asBool +: cin cout2 = Seq(c32.io.out(1).asBool) case 4 => val c53 = Module(new C53) for((x, y) <- c53.io.in.take(4) zip col){ x := y } c53.io.in.last := (if(cin.nonEmpty) cin.head else 0.U) sum = Seq(c53.io.out(0).asBool) ++ (if(cin.nonEmpty) cin.drop(1) else Nil) cout1 = Seq(c53.io.out(1).asBool) cout2 = Seq(c53.io.out(2).asBool) case n => val cin_1 = if(cin.nonEmpty) Seq(cin.head) else Nil val cin_2 = if(cin.nonEmpty) cin.drop(1) else Nil val (s_1, c_1_1, c_1_2) = addOneColumn(col take 4, cin_1) val (s_2, c_2_1, c_2_2) = addOneColumn(col drop 4, cin_2) sum = s_1 ++ s_2 cout1 = c_1_1 ++ c_2_1 cout2 = c_1_2 ++ c_2_2 } (sum, cout1, cout2) } def max(in: Iterable[Int]): Int = in.reduce((a, b) => if(a>b) a else b) def addAll(cols: Seq[Seq[Bool]], depth: Int): (UInt, UInt) = { if(max(cols.map(_.size)) <= 2){ val sum = Cat(cols.map(_(0)).reverse) var k = 0 while(cols(k).size == 1) k = k+1 val carry = Cat(cols.drop(k).map(_(1)).reverse) (sum, Cat(carry, 0.U(k.W))) } else { val columns_next = Array.fill(2*len)(Seq[Bool]()) var cout1, cout2 = Seq[Bool]() for( i <- cols.indices){ val (s, c1, c2) = addOneColumn(cols(i), cout1) columns_next(i) = s ++ cout2 cout1 = c1 cout2 = c2 } val needReg = depth == 4 val toNextLayer = if(needReg) columns_next.map(_.map(x => RegEnable(x, io.regEnables(1)))) else columns_next addAll(toNextLayer.toSeq, depth+1) } } val columns_reg = columns.map(col => col.map(b => RegEnable(b, io.regEnables(0)))) val (sum, carry) = addAll(cols = columns_reg.toSeq, depth = 0) io.result := sum + carry }