-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdassign3_1.v
433 lines (335 loc) · 14.7 KB
/
dassign3_1.v
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
// EEM16 - Logic Design
// Design Assignment #3.1
// dassign3_1.v
// Verilog template
// You may define any additional modules as necessary
// Do not delete or modify any of the modules provided
// ****************
// Blocks to design
// ****************
module bitFlipAdd1(a,b);
parameter width=16;
input [width-1:0] a;
output [width-1:0] b;
assign b=~a+1;
endmodule
// Right-shifter
// more wires
// 3.1a) Rectified linear unit
// out = max(0, in/4)
// 16 bit signed input
// 8 bit unsigned output truncated
module relu(in, out);
input [15:0] in;
output [7:0] out;
// your code here
//it can't be a input that is worth 15 bits if its output bit is only 8 bits, how can we do stuff w/ a 15 bit input and turn int o an 8 bit output unsigned?
//check if sign bit is a 1, and gives out a 0. if unsigned (sign bit is a 0), then we gotta return the unsigned value/4 which is shift right by 2?
//need unsigned version of in
wire [15:0] uin,uins,uins2;
// bitFlipAdd1 bfa(in,uin); dont actually bitflipadd1 b/c if its sign bit is a0, we just shiftright it twice and its what we want?
//shr #(16) rsh1(uin,uins);
//shr #(16) rsh2(uin,uins2);
//wire [7:0] uins22;
//assign uins22=uins2[7:0];
mux2 #(8)ra(in/4, 8'b0, in[15], out); //select is msb
endmodule
// 3.1b) Pipelined 5 input ripple-carry adder
// 16 bit signed inputs
// 1 bit input: valid (when the other inputs are useful numbers)
// 16 bit signed output (truncated)
// 1 bit output: ready (when the output is the sum of valid inputs)
/*Create a five-input 16-bit pipelined ripple carry adder using the five-input 4-bit ripple carry adders from lab
1 and any necessary d-registers.
*/
module piped_adder(clk, a, b, c, d, e, valid, sum, ready);
input clk, valid;
input [15:0] a, b, c, d, e;
output [15:0] sum;
output ready;
wire [3:0] rca1sumt,rca2sumt,rca3sumt,rca4sumt;
//wire [3:0] rca1sumbot4,rca2sumbot4,rca3sumbot4,rca4sumbot4,rca5sumbot4,rca6sumbot4,rca7sumbot4,rca8sumbot4;
//wire [2:0] rca1sumtop3,rca2sumtop3,rca3sumtop3,rca4sumtop3,rca5sumtop3,rca6sumtop3,rca7sumtop3;
//and now its time to pipeline this shit with a shitload of dregs wtf
// your code here
// module adder5 (a,b,c,d,e, sum); //sum is 7 bit output, top 3 go to nxt
//module adder5carry (a,b,c,d,e, ci1, ci0a, ci0b, co1, co0a, co0b, sum);
wire corca1a,corca1b,corca1c;
wire corca1ap,corca1bp,corca1cp;
wire corca2a,corca2b,corca2c;
wire corca2ap,corca2bp,corca2cp;
wire corca3a,corca3b,corca3c;
wire corca3ap,corca3bp,corca3cp;
wire corca4a,corca4b,corca4c;
// wire corca4ap,corca4bp,corca4cp;
//do i need to wire valid to ready in some way or like, dont start until valid?
adder5carry rca1(a[3:0],b[3:0],c[3:0],d[3:0],e[3:0],0,0,0,corca1a,corca1b,corca1c,rca1sumt);
//gotta pipe it
dreg pipedp1a(clk,corca1a,corca1ap);
dreg pipedp1b(clk,corca1b,corca1bp);
dreg pipedp1c(clk,corca1c,corca1cp);
//do i also got to pipe in the inputs to the next rcas? seems like it...
//1 dreg to piped inputs
wire [3:0] a1p,b1p,c1p,d1p,e1p,a2p,b2p,c2p,d2p,e2p,a2pp,b2pp,c2pp,d2pp,e2pp,a3p,b3p,c3p,d3p,e3p,a3pp,b3pp,c3pp,d3pp,e3pp,a3ppp,b3ppp,c3ppp,d3ppp,e3ppp;
dreg #(4) pipeinputs1a(clk,a[7:4],a1p);
dreg #(4) pipeinputs1b(clk,b[7:4],b1p);
dreg #(4) pipeinputs1c(clk,c[7:4],c1p);
dreg #(4) pipeinputs1d(clk,d[7:4],d1p);
dreg #(4) pipeinputs1e(clk,e[7:4],e1p);
adder5carry rca2(a1p,b1p,c1p,d1p,e1p,corca1ap,corca1bp,corca1cp,corca2a,corca2b,corca2c,rca2sumt);
dreg pipedp2a(clk,corca2a,corca2ap);
dreg pipedp2b(clk,corca2b,corca2bp);
dreg pipedp2c(clk,corca2c,corca2cp);
//2 dreg to piped inputs
dreg #(4) pipeinputs2a(clk,a[11:8],a2p);
dreg #(4) pipeinputs2b(clk,b[11:8],b2p);
dreg #(4) pipeinputs2c(clk,c[11:8],c2p);
dreg #(4) pipeinputs2d(clk,d[11:8],d2p);
dreg #(4) pipeinputs2e(clk,e[11:8],e2p);
dreg #(4) pipeinputs2aa(clk,a2p,a2pp);
dreg #(4) pipeinputs2bb(clk,b2p,b2pp);
dreg #(4) pipeinputs2cc(clk,c2p,c2pp);
dreg #(4) pipeinputs2dd(clk,d2p,d2pp);
dreg #(4) pipeinputs2ee(clk,e2p,e2pp);
adder5carry rca3(a2pp,b2pp,c2pp,d2pp,e2pp,corca2ap,corca2bp,corca2cp,corca3a,corca3b,corca3c,rca3sumt);
dreg pipedp3a(clk,corca3a,corca3ap);
dreg pipedp3b(clk,corca3b,corca3bp);
dreg pipedp3c(clk,corca3c,corca3cp);
//3 //1 dreg to piped inputs
dreg #(4) pipeinputs3a(clk,a[15:12],a3p);
dreg #(4) pipeinputs3b(clk,b[15:12],b3p);
dreg #(4) pipeinputs3c(clk,c[15:12],c3p);
dreg #(4) pipeinputs3d(clk,d[15:12],d3p);
dreg #(4) pipeinputs3e(clk,e[15:12],e3p);
dreg #(4) pipeinputs3aa(clk,a3p,a3pp);
dreg #(4) pipeinputs3bb(clk,b3p,b3pp);
dreg #(4) pipeinputs3cc(clk,c3p,c3pp);
dreg #(4) pipeinputs3dd(clk,d3p,d3pp);
dreg #(4) pipeinputs3ee(clk,e3p,e3pp);
dreg #(4) pipeinputs3aaa(clk,a3pp,a3ppp);
dreg #(4) pipeinputs3bbb(clk,b3pp,b3ppp);
dreg #(4) pipeinputs3ccc(clk,c3pp,c3ppp);
dreg #(4) pipeinputs3ddd(clk,d3pp,d3ppp);
dreg #(4) pipeinputs3eee(clk,e3pp,e3ppp);
adder5carry rca4(a3ppp,b3ppp,c3ppp,d3ppp,e3ppp,corca3ap,corca3bp,corca3cp,corca4a,corca4b,corca4c,rca4sumt);
//the continued rca5s are just going to be having a lot of empty void in them in the case of drawing
//{8'b00000000,ain}
// assign sum[3:0]=rca1sumbot4; das end goal
/*
assign rca1sumtop3=rca1sumt[6:4];
assign rca1sumbot4=rca1sumt[3:0];
assign rca2sumbot4=rca2sumt[3:0];
assign rca2sumtop3=rca2sumt[6:4];
assign rca1sumtop3=rca1sumt[6:4];
assign rca1sumbot4=rca1sumt[3:0];
assign rca2sumbot4=rca2sumt[3:0];
assign rca2sumtop3=rca2sumt[6:4];
*/
//also need that padding syntax...
// adder5 rca5({1'b0,rca1sumtop3},rca2sumbot4,0,0,0,rca5sumt);
// assign sum[7:4]=rca5sumbot4;
//wire [3:0] rca2sumtop3p;
//fuck i need to pipe the top guys tooo LOL
//only the top 3 of rca2
// adder5 rca6({1'b0,rca2sumtop3p}, {1'b0,rca5sumtop3},rca3sumbot4,0,0,rca6sumt);
//ass//ign rca6sumtop3=rca6sumt[6:4];
//assign rca6sumbot4=rca6sumt[3:0];
// assign sum[11:8]=rca6sumbot4;
//adder5 rca7({1'b0,rca6sumtop3},{1'b0,rca3sumtop3pp},rca4sumbot4,0,0,rca7sumt);
//assign sum[15:12]=rca7sumbot4;
//adder5 rca8({1'b0,rca4sumtop3ppp},{1'b0,rca7sumtop3},0,0,0,rca8sumt);
//but arent all these guys trucnated lol
//
//now its time to dreg this shit
wire [3:0] d2,d3,d4,d52,d53,d662,d72;
// wire [6:0] d61,d62,d63,d64,d65,d66,d67;
//dreg #(4) dreg1a(clk,rca1sumt ,d61 ); //output for s[3:0] //actually does this guy get pipelined as a 7 first?
//dreg #(4) dreg1b(clk,rca2sumt,d62);
//dreg #(4) dreg1c(clk,rca3sumt,d63);
//dreg #(4) dreg1d(clk,rca4sumt,d64);
// dreg #(7) dreg5d(clk,rca5sumt,d65);
// dreg #(7) dreg6d(clk,rca6sumt,d66);
// dreg #(7) dreg7d(clk,rca7sumt,d67);
/*
assign rca1sumtop3=d61[6:4]; //after piped first instance rca1sumt
assign rca1sumbot4=d61[3:0];
assign rca2sumbot4=d62[3:0];
assign rca2sumtop3=d62[6:4];
assign rca3sumtop3=d63[6:4];
assign rca3sumbot4=d63[3:0];
assign rca4sumbot4=d64[3:0];
assign rca4sumtop3=d64[6:4];
assign rca5sumtop3=d65[6:4];
assign rca5sumbot4=d65[3:0];
assign rca6sumtop3=d66[6:4];
assign rca6sumbot4=d66[3:0];
assign rca7sumtop3=d67[6:4];
assign rca7sumbot4=d67[3:0];
*/
dreg #(4) dreg2(clk,rca1sumt ,d2 ); //output for s[3:0]
dreg #(4) dreg3(clk,d2 ,d3 ); //output for s[3:0]
dreg #(4) dreg4(clk,d3 ,d4 ); //output for s[3:0]
dreg #(4) dreg5(clk,d4 ,sum[3:0] ); //output for s[3:0]
dreg #(4) dreg52(clk,rca2sumt ,d52 ); //output for s[7:4]
dreg #(4) dreg53(clk,d52 ,d53 ); //output for s[3:0]
dreg #(4) dreg54(clk,d53 ,sum[7:4] ); //output for s[3:0]
dreg #(4) dreg62(clk,rca3sumt ,d662 ); //output for s[11:8]
dreg #(4) dreg63(clk,d662 ,sum[11:8]); //output for s[11:8]
dreg #(4) dreg73(clk,rca4sumt ,sum[15:12]); //output for s[11:8]
//gotta pipe my ready also by 4 stages
wire r2,r3,r4;
dreg dready1(clk,valid,r2);
dreg dready2(clk,r2,r3);
dreg dready3(clk,r3,r4);
dreg dready4(clk,r4,ready);
/*dreg #(4) dregtop2(clk,rca2sumtop3,rca2sumtop3p);
dreg #(4) dregtop3(clk,rca3sumtop3,rca3sumtop3p);
dreg #(4) dregtop3b(clk,rca3sumtop3p,rca3sumtop3pp);
dreg #(4) dregtop4a(clk,rca4sumtop3,rca4sumtop3p);
dreg #(4) dregtop4b(clk,rca4sumtop3p,rca4sumtop3pp);
dreg #(4) dregtop4c(clk,rca4sumtop3pp,rca4sumtop3ppp);
wire [3:0] rca3sumtop3p, rca3sumtop3pp, rca4sumtop3pp, rca4sumtop3ppp;
dreg #(4) dreg730(clk,rca8sumbot4 ,rdy); //output for s[11:8]
//actually takes 4 adder, 5 dreg delays. how do i time that
//dreg is 3x5=15
//4 adder5, which means 4 fa5+2+fa per, each fa5 has 4 fa, each fa=4tpd
//(4*4*4+8)*4=576
//so basically ready is just whether valid was true 5 clock cycles ago
*/
// assign #591 ready= 1;
endmodule
//That’s not me but k=4 Works with his adder5carry
// 3.1c) Pipelined neuron
// 8 bit signed weights, bias (constant)
// 8 bit unsigned inputs
// 1 bit input: new (when a set of inputs are available)
// 8 bit unsigned output
// 1 bit output: ready (when the output is valid)
module neuron(clk, w1, w2, w3, w4, b, x1, x2, x3, x4, new, y, ready);
input clk;
input [7:0] w1, w2, w3, w4, b; // signed 2s complement
input [7:0] x1, x2, x3, x4; // unsigned
input new;
output [7:0] y; // unsigned
output ready;
/* Using the sequential multiplier module from lab 2, the pipelined ripple-carry adder from above, and the
ReLU from above, implement the neuron module according to the rules for single-clock sequential logic.
Ensure that the outputs are directly generated by a d-register as specified by our pipelining rules.
y = max(0,1/4(w1x1 + w2x2 + w3x3 + w4x4 + b)
*/
//when new is high, ready is low.
//when ready is high, new is allowed to pulse high, else new waits.
//actually need to pipeline this bitch too
//But make sure u sign extend the B before u pipeline it
//module multiply (clk, ain, bin, reset, prod, ready);
wire [15:0]p1,p2,p3,p4,sumpipe,p1p,p2p,p3p,p4p,sumpipep;
wire [7:0]yp;
wire multiplier1rdy,multiplier2rdy,multiplier3rdy,multiplier4rdy;
multiply mer1(clk,w1,x1,new,p1,multiplier1rdy);
multiply mer2(clk,w2,x2,new,p2,multiplier2rdy);
multiply mer3(clk,w3,x3,new,p3,multiplier3rdy);
multiply mer4(clk,w4,x4,new,p4,multiplier4rdy);
/*dreg delayforadder(multiplier1rdy,m1);
dreg delayforadder(m1,m2);
dreg delayforadder(m2,m3);
dreg delayforadder(m3,m4);
*/
//dreg #(16) mul1(clk,p1,p1p);
//dreg #(16) mul2(clk,p2,p2p);
//dreg #(16) mul3(clk,p3,p3p);
//dreg #(16) mul4(clk,p4,p4p);
//then you can check when theyre all done
//and use that as reset for the pipeline add
//make sure the adder and multiplier are working together
//module piped_adder(clk, a, b, c, d, e, valid, sum, ready);
//if(multiplier1rdy,multiplier2rdy,multiplier3rdy,multiplier4rdy) then pa is ready to start.
/* wire out1,out2,out3,out4,donemult;
mux2 already1(0,1,multiplier1rdy,out1);
mux2 already2(0,1,multiplier2rdy,out2);
mux2 already3(0,1,multiplier3rdy,out3);
mux2 already4(0,1,multiplier4rdy,out4);
assign donemult=(out1&out2&out3&out4);
*/
// wire [2:0]counter;
// wire actualrdy;
//dreg dm1r(clk,counter,counter+1);
//make afucking counter using pulsewidth and dreg
//module pulse_width(clk, in, pwidth, long, type, new);
//wire [3:0] count;
// assign pwidth_d = new_d ? 1 : (pwidth + 1);
//wire [3:0]check,checkout;
// dreg #(3) couunter(clk,count,checkout);
// wire long,type,n;
//pulse_width pwd(clk,checkout,count,long,type,n); //cout is incremented value.
//adder actually,pwdith is going to update by adding 1.
/*thats where valid comes in, so when valid is set, thats when u wanna process stuff
*/
//assign actualrdy=(count==5)&&multiplier1rdy&&multiplier2rdy&&multiplier3rdy&&multiplier4rdy;
//assign n=(count==5);
//wire rdy,pipeaddready,pipev;
//what is the reset for piped_adder?
wire pipeready;
//apparently, also, need to pipeline the b and sign extend the b bias.
wire valid,validall;
assign validall=multiplier1rdy&&multiplier2rdy&&multiplier3rdy&&multiplier4rdy;
/*
module signextender(
input [7:0] unextended,//the msb bit is the sign bit
input clk,
output reg [7:0] extended
);*/
wire [7:0] bp,bpp;
wire valid2,validprev;
wire [2:0] counter;
dreg asdfasdfasdf(clk,counter[2],counter[0]);
mux2 otsready(counter[0],1,validall,counter[1]);
mux2 notttt(counter[1],0,new,counter[2]);
mux2 asdvalid(0,1,validall&!counter[0],validprev);
dreg asdfasdfasdfasdfasdfasdf(clk, validprev,valid);
/////signextender sxb(bp,clk,bpp);
//dreg #(8) processb(clk,b,bp);
//{{8{b[7]}},b}
piped_adder pa(clk,p1,p2,p3,p4,{{8{b[7]}},b},valid,sumpipe,valid2);
//dreg #(16) pa1(clk,sumpipe,sumpipep);
//module relu(in, out);
relu r(sumpipe,yp);
dreg #(8) relur(clk,yp,y);
/*then you feed those outputs directly into the pipedAdder with the and of all the ready bits from each multiplier
*/
//so the ready stuff is gucci, but everything else isnt.
//wire d1,d2,d3,d4;
dreg dead1(clk,valid2,ready);
//dreg dead4(clk,d3,ready);
/*
wire [2:0] counter;
//dreg #(8) dreg1(ready1,in1,out1);
//dreg #(8) dreg2(ready2,in2,out2);
//dreg #(8) dreg3(ready3,in3,out3);
//dreg #(8) dreg4(ready4,in4,out4);
//fuckin eda playground bmed me soooooo tilted rn but fkit gota push thru, already getting alotta help :/ mans not smart
wire allv,readyp;
dreg counterupdate1(clk,counter[2],counter[0]);
mux2 lookatnew(counter[0],0,new,counter[1]);
mux2 lookatnextc(counter[1],1, valid2,counter[2]);
//assign allv=ready1
// mux2 asdf(a,b,sel,y);
///assign allv=ready1&&ready2&&ready3&&ready4;
dreg prevupdates(clk,readyp,ready);
mux2 lookatprev(0,1,d3&&valid2&!counter[0],readyp);
*/
/*We know the adder takes a fixed amount of time, say 5 cycles, and the multiply takes variable time. We can have a counter to keep track of how long since new inputs were put to the multiply. If the multiply is done, and it has been at least 5 cycles, we know the adder is ready to accept the output of the multiply.
done either procedurally or structurally.
*/
//you get errno 66 if you dont sign extend b
// your code here
endmodule
module signextender(
input [7:0] unextended,//the msb bit is the sign bit
input clk,
output reg [7:0] extended
);
always@(posedge clk)
begin
extended <= $signed(unextended);
end
endmodule