rtl/gfx/gfx_fixed_muladd.sv


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77

/* Pipelined fixed-point multiply-add: q = a * b + c.
 *
 * Ports:
 *   clk   - clock for the pipeline registers.
 *   a, b  - multiplicands (gfx::fixed).
 *   c     - addend (gfx::fixed), added at the same scale as the rescaled
 *           product.
 *   stall - when high, the pipeline is held (clock enable deasserted on
 *           the lpm_mult path; forwarded to gfx_pipes on the model path).
 *   q     - result, truncated to $bits(fixed).
 *
 * The pipeline depth is FIXED_MULADD_DEPTH in both implementations.
 * Two implementations are selected by the VERILATOR macro: an lpm_mult
 * instance when it is not defined, and a behavioural model when it is.
 */
module gfx_fixed_muladd
(
	input  logic      clk,

	input  gfx::fixed a,
	                  b,
	                  c,
	input  logic      stall,

	output gfx::fixed q
);

	import gfx::*;

`ifndef VERILATOR
	// Product with the fractional bits of one operand already dropped
	// (see the note on lpm_widthp below).
	logic[2 * $bits(fixed) - $bits(fixed_frac) - 1:0] q_ext;

	// Keep only the low $bits(fixed) bits of the rescaled result.
	assign q = q_ext[$bits(fixed) - 1:0];

	// Parameters are passed with an inline named override rather than
	// defparam, which IEEE 1800 lists as deprecated.
	lpm_mult
	#(
		.lpm_widtha($bits(fixed)),
		.lpm_widthb($bits(fixed)),
		.lpm_widths($bits(fixed) + $bits(fixed_frac)),
		/* This is crucial. It is not documented anywhere (apart from a
		 * comment on r/fpga). If lpm_widthp < lpm_widtha + lpm_widthb,
		 * then result contains the lpm_widthp most significant bits of
		 * the product, not the least significant ones as one would
		 * expect.
		 */
		.lpm_widthp($bits(fixed) * 2 - $bits(fixed_frac)),
		.lpm_representation("SIGNED"),
		.lpm_pipeline(FIXED_MULADD_DEPTH)
	) mult
	(
		.aclr(1'b0),
		.clock(clk),
		.clken(!stall),

		// c is shifted left by the fractional width so that it lines up
		// with the full-precision product before the result is truncated.
		.sum({c, {`FIXED_FRAC{1'b0}}}),
		.dataa(a),
		.datab(b),
		.result(q_ext)
	);
`else
	// Behavioural model: the operands are delayed through gfx_pipes
	// (DEPTH = FIXED_MULADD_DEPTH) and the arithmetic is done
	// combinationally on the delayed values.
	logic[$bits(fixed) + $bits(fixed_frac) - 1:0] q_ext;

	fixed a_hold, b_hold, c_hold;

	// Drop the low fractional bits of the product, then add c.
	assign q = q_ext[$bits(fixed) + $bits(fixed_frac) - 1:$bits(fixed_frac)] + c_hold;

	// Force a signed multiply so the model matches the "SIGNED"
	// lpm_representation used above regardless of how gfx::fixed is
	// declared; the operands are sign-extended to the width of q_ext.
	// This is a no-op if gfx::fixed is already a signed type.
	assign q_ext = $signed(a_hold) * $signed(b_hold);

	gfx_pipes #(.WIDTH($bits(a)), .DEPTH(FIXED_MULADD_DEPTH)) a_pipes
	(
		.clk,
		.in(a),
		.out(a_hold),
		.stall
	);

	gfx_pipes #(.WIDTH($bits(b)), .DEPTH(FIXED_MULADD_DEPTH)) b_pipes
	(
		.clk,
		.in(b),
		.out(b_hold),
		.stall
	);

	gfx_pipes #(.WIDTH($bits(c)), .DEPTH(FIXED_MULADD_DEPTH)) c_pipes
	(
		.clk,
		.in(c),
		.out(c_hold),
		.stall
	);
`endif

endmodule