1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
|
`include "core/uarch.sv"
module core_psr
(
input logic clk,
write,
saved,
update_flags,
alu_v_valid,
input psr_flags alu_flags,
input word psr_wr,
output psr_flags flags,
output psr_intmask mask,
output psr_mode mode,
output word psr_rd
);
typedef struct packed
{
psr_flags flags;
psr_intmask mask;
psr_mode mode;
} psr_state;
typedef struct packed
{
psr_flags nzcv;
logic q;
logic[1:0] reserved0;
logic j;
logic[3:0] reserved1,
ge;
logic[5:0] reserved2;
logic e;
psr_intmask aif;
logic t;
psr_mode m;
} psr_word;
/* Este diseño de doble búfer es importante por rendimiento. Reducirlo
* a uno más "sencillo" tiene una pérdida de casi 40MHz en Fmax.
* Esto se debe a que el CPSR es el mayor mercado del core, se encuentra
* conectado a cycles, regs, alu y decode. La dependencia con decode en
* particular es crítica debido a que el condition code se especifica en
* términos de banderas de CPSR. Una ruta combinacional que atraviese flags
* iniciaría en cycles, tomaría valores de regs, llegaría a ALU, caería
* en flags y, debido al operand forwarding que se necesita por hazards de
* pipeline, esa misma señal seguiría combinacionalmente hacia decode para
* finalmente registrar en cycles nuevamente. Tal cosa es impermisible.
*/
logic pending_update;
psr_word rd_word, wr_word;
psr_flags next_flags, wr_flags;
psr_state cpsr, spsr, spsr_svc, spsr_abt, spsr_und, spsr_irq, spsr_fiq,
wr_state, wr_clean;
assign mode = cpsr.mode;
assign mask = cpsr.mask;
assign flags = pending_update ? wr_flags : cpsr.flags;
assign psr_rd = rd_word;
assign wr_word = psr_wr;
assign {wr_state.flags, wr_state.mask, wr_state.mode} = {wr_word.nzcv, wr_word.aif, wr_word.m};
`ifdef VERILATOR
psr_word cpsr_word /*verilator public*/,
spsr_svc_word /*verilator public*/,
spsr_abt_word /*verilator public*/,
spsr_und_word /*verilator public*/,
spsr_fiq_word /*verilator public*/,
spsr_irq_word /*verilator public*/;
assign {cpsr_word.nzcv, cpsr_word.aif, cpsr_word.m} = {cpsr.flags, cpsr.mask, cpsr.mode};
assign {spsr_svc_word.nzcv, spsr_svc_word.aif, spsr_svc_word.m}
= {spsr_svc.flags, spsr_svc.mask, spsr_svc.mode};
assign {spsr_abt_word.nzcv, spsr_abt_word.aif, spsr_abt_word.m}
= {spsr_abt.flags, spsr_abt.mask, spsr_abt.mode};
assign {spsr_und_word.nzcv, spsr_und_word.aif, spsr_und_word.m}
= {spsr_und.flags, spsr_und.mask, spsr_und.mode};
assign {spsr_irq_word.nzcv, spsr_irq_word.aif, spsr_irq_word.m}
= {spsr_irq.flags, spsr_irq.mask, spsr_irq.mode};
assign {spsr_fiq_word.nzcv, spsr_fiq_word.aif, spsr_fiq_word.m}
= {spsr_fiq.flags, spsr_fiq.mask, spsr_fiq.mode};
`endif
always_comb begin
next_flags = flags;
if(update_flags) begin
next_flags = alu_flags;
if(~alu_v_valid)
next_flags.v = flags.v;
end
rd_word = {$bits(rd_word){1'b0}};
if(saved)
{rd_word.nzcv, rd_word.aif, rd_word.m} = {spsr.flags, spsr.mask, spsr.mode};
else
{rd_word.nzcv, rd_word.aif, rd_word.m} = {flags, mask, mode};
wr_clean = wr_state;
unique case(wr_state.mode)
`MODE_USR, `MODE_FIQ, `MODE_IRQ, `MODE_SVC,
`MODE_ABT, `MODE_UND, `MODE_SYS: ;
default:
wr_clean.mode = mode;
endcase
if(mode == `MODE_USR) begin
wr_clean.mask = mask;
wr_clean.mode = `MODE_USR;
end
end
always_ff @(posedge clk) begin
wr_flags <= next_flags;
pending_update <= !write && update_flags;
if(!write) begin
if(pending_update)
cpsr.flags <= wr_flags;
end else if(!saved)
cpsr <= wr_clean;
else
unique0 case(mode)
`MODE_SVC: spsr_svc <= wr_clean;
`MODE_ABT: spsr_abt <= wr_clean;
`MODE_UND: spsr_und <= wr_clean;
`MODE_IRQ: spsr_irq <= wr_clean;
`MODE_FIQ: spsr_fiq <= wr_clean;
default: ;
endcase
end
initial begin
wr_flags = 4'b0000;
pending_update = 0;
cpsr.mode = `MODE_SVC;
cpsr.flags = 4'b0000;
cpsr.mask.a = 1;
cpsr.mask.i = 1;
cpsr.mask.f = 1;
spsr_svc = {$bits(spsr_svc){1'b0}};
spsr_abt = {$bits(spsr_svc){1'b0}};
spsr_und = {$bits(spsr_svc){1'b0}};
spsr_irq = {$bits(spsr_svc){1'b0}};
spsr_fiq = {$bits(spsr_svc){1'b0}};
end
endmodule
|