aboutsummaryrefslogtreecommitdiffstats
path: root/fpga/usrp3/lib/rfnoc/dds_timed.v
diff options
context:
space:
mode:
Diffstat (limited to 'fpga/usrp3/lib/rfnoc/dds_timed.v')
-rw-r--r--fpga/usrp3/lib/rfnoc/dds_timed.v290
1 files changed, 290 insertions, 0 deletions
diff --git a/fpga/usrp3/lib/rfnoc/dds_timed.v b/fpga/usrp3/lib/rfnoc/dds_timed.v
new file mode 100644
index 000000000..fd03f6a23
--- /dev/null
+++ b/fpga/usrp3/lib/rfnoc/dds_timed.v
@@ -0,0 +1,290 @@
+//
+// Copyright 2016 Ettus Research, a National Instruments Company
+//
+// SPDX-License-Identifier: LGPL-3.0-or-later
+//
+// DDS that supports timed commands via the settings bus
+
+module dds_timed #(
+ parameter SR_FREQ_ADDR = 0,
+ parameter SR_SCALE_IQ_ADDR = 1,
+ parameter CMD_FIFO_SIZE = 5,
+ parameter WIDTH = 16,
+ parameter DDS_WIDTH = 24,
+ parameter PHASE_WIDTH = 24,
+ parameter PHASE_ACCUM_WIDTH = 32,
+ parameter SCALING_WIDTH = 18,
+ parameter HEADER_WIDTH = 128,
+ parameter HEADER_FIFO_SIZE = 5,
+ parameter SR_AWIDTH = 8,
+ parameter SR_DWIDTH = 32,
+ parameter SR_TWIDTH = 64
+)(
+ input clk, input reset, input clear,
+ output timed_cmd_fifo_full,
+ input set_stb, input [SR_AWIDTH-1:0] set_addr, input [SR_DWIDTH-1:0] set_data,
+ input [SR_TWIDTH-1:0] set_time, input set_has_time,
+ input [2*WIDTH-1:0] i_tdata, input i_tlast, input i_tvalid, output i_tready, input [HEADER_WIDTH-1:0] i_tuser,
+ output [2*WIDTH-1:0] o_tdata, output o_tlast, output o_tvalid, input o_tready, output [HEADER_WIDTH-1:0] o_tuser
+);
+
+ /**************************************************************************
+ * Track VITA time
+ *************************************************************************/
+ wire [2*WIDTH-1:0] int_tdata;
+ wire [HEADER_WIDTH-1:0] int_tuser;
+ wire int_tlast, int_tvalid, int_tready, int_tag;
+ wire [SR_AWIDTH-1:0] out_set_addr, timed_set_addr;
+ wire [SR_DWIDTH-1:0] out_set_data, timed_set_data;
+ wire out_set_stb, timed_set_stb;
+ wire eob;
+
+ axi_tag_time #(
+ .WIDTH(2*WIDTH),
+ .NUM_TAGS(1),
+ .SR_TAG_ADDRS(SR_FREQ_ADDR))
+ axi_tag_time (
+ .clk(clk),
+ .reset(reset),
+ .clear(clear),
+ .tick_rate(16'd1),
+ .timed_cmd_fifo_full(timed_cmd_fifo_full),
+ .s_axis_data_tdata(i_tdata), .s_axis_data_tlast(i_tlast),
+ .s_axis_data_tvalid(i_tvalid), .s_axis_data_tready(i_tready),
+ .s_axis_data_tuser(i_tuser),
+ .m_axis_data_tdata(int_tdata), .m_axis_data_tlast(int_tlast),
+ .m_axis_data_tvalid(int_tvalid), .m_axis_data_tready(int_tready),
+ .m_axis_data_tuser(int_tuser), .m_axis_data_tag(int_tag),
+ .in_set_stb(set_stb), .in_set_addr(set_addr), .in_set_data(set_data),
+ .in_set_time(set_time), .in_set_has_time(set_has_time),
+ .out_set_stb(out_set_stb), .out_set_addr(out_set_addr), .out_set_data(out_set_data),
+ .timed_set_stb(timed_set_stb), .timed_set_addr(timed_set_addr), .timed_set_data(timed_set_data));
+
+ wire [2*WIDTH-1:0] dds_in_tdata, unused_tdata;
+ wire [HEADER_WIDTH-1:0] header_in_tdata, header_out_tdata, unused_tuser;
+ wire dds_in_tlast, dds_in_tvalid, dds_in_tready, dds_in_tag;
+ wire header_in_tvalid, header_in_tready, header_in_tlast, unused_tag;
+ wire header_out_tvalid, header_out_tready;
+
+ split_stream #(
+ .WIDTH(2*WIDTH+HEADER_WIDTH+1), .ACTIVE_MASK(4'b0011))
+ split_head (
+ .clk(clk), .reset(reset), .clear(clear),
+ .i_tdata({int_tdata,int_tuser,int_tag}), .i_tlast(int_tlast),
+ .i_tvalid(int_tvalid), .i_tready(int_tready),
+ .o0_tdata({dds_in_tdata,unused_tuser,dds_in_tag}), .o0_tlast(dds_in_tlast),
+ .o0_tvalid(dds_in_tvalid), .o0_tready(dds_in_tready),
+ .o1_tdata({unused_tdata,header_in_tdata,unused_tag}), .o1_tlast(header_in_tlast),
+ .o1_tvalid(header_in_tvalid), .o1_tready(header_in_tready),
+ .o2_tready(1'b0), .o3_tready(1'b0));
+
+ axi_fifo #(
+ .WIDTH(HEADER_WIDTH), .SIZE(HEADER_FIFO_SIZE))
+ axi_fifo_header (
+ .clk(clk), .reset(reset), .clear(clear),
+ .i_tdata(header_in_tdata), .i_tvalid(header_in_tvalid & header_in_tlast), .i_tready(header_in_tready),
+ .o_tdata(header_out_tdata), .o_tvalid(header_out_tvalid),
+ .o_tready(header_out_tready), // Consume header on last output sample
+ .space(), .occupied());
+
+ assign eob = header_in_tdata[124];
+
+ /**************************************************************************
+ * Settings Regs
+ *************************************************************************/
+ wire [PHASE_ACCUM_WIDTH-1:0] phase_inc_tdata, phase_inc_timed_tdata;
+ wire phase_inc_tlast, phase_inc_tvalid, phase_inc_tready;
+ wire phase_inc_timed_tlast, phase_inc_timed_tready , phase_inc_timed_tvalid;
+
+ axi_setting_reg #(
+ .ADDR(SR_FREQ_ADDR), .AWIDTH(SR_AWIDTH), .WIDTH(PHASE_ACCUM_WIDTH), .STROBE_LAST(1))
+ set_freq (
+ .clk(clk), .reset(reset),
+ .set_stb(out_set_stb), .set_addr(out_set_addr), .set_data(out_set_data),
+ .o_tdata(phase_inc_tdata), .o_tlast(phase_inc_tlast), .o_tvalid(phase_inc_tvalid), .o_tready(phase_inc_tready));
+
+ axi_setting_reg #(
+ .ADDR(SR_FREQ_ADDR), .USE_FIFO(1), .FIFO_SIZE(CMD_FIFO_SIZE), .AWIDTH(SR_AWIDTH), .WIDTH(PHASE_ACCUM_WIDTH), .STROBE_LAST(1))
+ set_freq_timed (
+ .clk(clk), .reset(reset),
+ .set_stb(timed_set_stb), .set_addr(timed_set_addr), .set_data(timed_set_data),
+ .o_tdata(phase_inc_timed_tdata), .o_tlast(phase_inc_timed_tlast), .o_tvalid(phase_inc_timed_tvalid), .o_tready(phase_inc_timed_tready));
+
+ wire [SCALING_WIDTH-1:0] scaling_tdata;
+ wire scaling_tvalid, scaling_tready;
+
+ axi_setting_reg #(
+ .ADDR(SR_SCALE_IQ_ADDR), .AWIDTH(SR_AWIDTH), .WIDTH(SCALING_WIDTH), .REPEATS(1))
+ set_scale (
+ .clk(clk), .reset(reset),
+ .set_stb(out_set_stb), .set_addr(out_set_addr), .set_data(out_set_data),
+ .o_tdata(scaling_tdata), .o_tlast(), .o_tvalid(scaling_tvalid), .o_tready(scaling_tready));
+
+ /**************************************************************************
+ * DDS + Complex Mult + Phase Accumulator
+ *************************************************************************/
+ wire [PHASE_ACCUM_WIDTH-1:0] phase_inc_mux_tdata;
+ reg [PHASE_ACCUM_WIDTH-1:0] phase_inc;
+ wire phase_inc_mux_tlast, phase_inc_mux_tvalid, phase_inc_mux_tready;
+ reg [PHASE_ACCUM_WIDTH-1:0] phase;
+
+ wire [PHASE_WIDTH-1:0] phase_tdata = phase[PHASE_ACCUM_WIDTH-1:PHASE_ACCUM_WIDTH-PHASE_WIDTH];
+ wire phase_tvalid, phase_tready, phase_tlast;
+
+ wire [WIDTH*2-1:0] dds_in_fifo_tdata;
+ wire dds_in_fifo_tvalid, dds_in_fifo_tready, dds_in_fifo_tlast;
+ wire dds_out_tlast, dds_out_tvalid, dds_out_tready;
+
+ wire [DDS_WIDTH-1:0] dds_in_i_tdata, dds_in_q_tdata;
+ wire [DDS_WIDTH-1:0] dds_out_i_tdata, dds_out_q_tdata;
+ wire [15:0] dds_input_fifo_space, dds_input_fifo_occupied;
+
+ wire [WIDTH*2-1:0] dds_in_sync_tdata;
+ wire dds_in_sync_tvalid, dds_in_sync_tready, dds_in_sync_tlast;
+ wire [PHASE_WIDTH-1:0] phase_sync_tdata;
+ wire phase_sync_tvalid, phase_sync_tready, phase_sync_tlast;
+
+ assign phase_inc_mux_tdata = phase_inc_timed_tready ? phase_inc_timed_tdata : phase_inc_tdata;
+ assign phase_inc_mux_tlast = phase_inc_timed_tready ? phase_inc_timed_tlast : phase_inc_tlast;
+ assign phase_inc_mux_tvalid = phase_inc_timed_tready ? phase_inc_timed_tvalid : phase_inc_tvalid;
+ assign phase_inc_tready = phase_inc_mux_tready;
+ assign phase_inc_timed_tready = phase_inc_mux_tready & dds_in_tag;
+ assign phase_inc_mux_tready = phase_tready;
+
+ // phase is only valid when input i/q data stream is valid
+ assign phase_tvalid = dds_in_tvalid;
+ assign phase_tlast = dds_in_tlast;
+
+ always @(posedge clk) begin
+ if (reset | clear) begin
+ phase_inc <= 0;
+ end else if (phase_inc_mux_tvalid & phase_inc_mux_tready) begin
+ phase_inc <= phase_inc_mux_tdata;
+ end
+ end
+
+ // NCO, increment phase input to DDS SIN/COS LUT
+ always @(posedge clk) begin
+ if (reset | clear | (phase_inc_mux_tvalid & phase_inc_mux_tready) | eob) begin
+ phase <= 0;
+ end else if (dds_in_tvalid & dds_in_tready) begin //only increment phase when data into dds is valid and data fifo is ready
+ phase <= phase + phase_inc;
+ end
+ end
+
+
+ // Sync the two path's pipeline delay.
+ // This is needed to ensure that applying the phase update happens on the
+ // correct sample regardless of differing downstream path delays.
+ axi_sync #(
+ .SIZE(2),
+ .WIDTH_VEC({PHASE_WIDTH,2*WIDTH}), // Vector of widths, each width is defined by a 32-bit value
+ .FIFO_SIZE(0))
+ axi_sync (
+ .clk(clk), .reset(reset), .clear(clear),
+ .i_tdata({phase_tdata,dds_in_tdata}),
+ .i_tlast({phase_tlast,dds_in_tlast}),
+ .i_tvalid({phase_tvalid,dds_in_tvalid}),
+ .i_tready({phase_tready,dds_in_tready}),
+ .o_tdata({phase_sync_tdata,dds_in_sync_tdata}),
+ .o_tlast({phase_sync_tlast,dds_in_sync_tlast}),
+ .o_tvalid({phase_sync_tvalid,dds_in_sync_tvalid}),
+ .o_tready({phase_sync_tready,dds_in_sync_tready}));
+
+ // fifo to hold input data while pipeline catches up in dds
+ // this is blocked by the axi_sync following the dds
+ axi_fifo #(.WIDTH(2*WIDTH+1), .SIZE(5)) dds_input_fifo(
+ .clk(clk), .reset(reset), .clear(clear),
+ .i_tdata({dds_in_sync_tlast,dds_in_sync_tdata}), .i_tvalid(dds_in_sync_tvalid), .i_tready(dds_in_sync_tready),
+ .o_tdata({dds_in_fifo_tlast,dds_in_fifo_tdata}), .o_tvalid(dds_in_fifo_tvalid), .o_tready(dds_in_fifo_tready),
+ .space(dds_input_fifo_space), .occupied(dds_input_fifo_occupied)
+ );
+
+ // after fifo, do q quick sign extend op to get up to 24 bits. to match how the cordic deals with the data path.
+ sign_extend #(
+ .bits_in(WIDTH), .bits_out(DDS_WIDTH))
+ sign_extend_dds_i (
+ .in(dds_in_fifo_tdata[2*WIDTH-1:WIDTH]), .out(dds_in_i_tdata));
+
+ sign_extend #(
+ .bits_in(WIDTH), .bits_out(DDS_WIDTH))
+ sign_extend_dds_q (
+ .in(dds_in_fifo_tdata[WIDTH-1:0]), .out(dds_in_q_tdata));
+
+
+ // Wrapper for Xilinx IP AXI DDS + Complex Multiply
+ // NOTE: Seems Xilinx IP expects opposite I/Q combined complex data buses, so they are swapped here.
+ dds_freq_tune dds_freq_tune_inst (
+ .clk(clk),
+ .reset(reset | clear),
+ .eob(eob),
+ .rate_changed(1'b0),
+ .dds_input_fifo_occupied(dds_input_fifo_occupied),
+ /* IQ input */
+ .s_axis_din_tlast(dds_in_fifo_tlast),
+ .s_axis_din_tvalid(dds_in_fifo_tvalid),
+ .s_axis_din_tready(dds_in_fifo_tready),
+ .s_axis_din_tdata({dds_in_q_tdata, dds_in_i_tdata}),
+ /* Phase input from NCO */
+ .s_axis_phase_tlast(phase_sync_tlast),
+ .s_axis_phase_tvalid(phase_sync_tvalid),
+ .s_axis_phase_tready(phase_sync_tready),
+ .s_axis_phase_tdata(phase_sync_tdata), //24 bit
+ /* IQ output */
+ .m_axis_dout_tlast(dds_out_tlast),
+ .m_axis_dout_tvalid(dds_out_tvalid),
+ .m_axis_dout_tready(dds_out_tready),
+ .m_axis_dout_tdata({dds_out_q_tdata, dds_out_i_tdata})
+ //debug signals
+ );
+ /************************************************************************
+ * Perform scaling on the IQ output
+ ************************************************************************/
+ wire [DDS_WIDTH+SCALING_WIDTH-1:0] scaled_i_tdata, scaled_q_tdata;
+ wire scaled_tlast, scaled_tvalid, scaled_tready;
+
+ mult #(
+ .WIDTH_A(DDS_WIDTH),
+ .WIDTH_B(SCALING_WIDTH),
+ .WIDTH_P(DDS_WIDTH+SCALING_WIDTH),
+ .DROP_TOP_P(4),
+ .LATENCY(3),
+ .CASCADE_OUT(0))
+ i_mult (
+ .clk(clk), .reset(reset | clear),
+ .a_tdata(dds_out_i_tdata), .a_tlast(dds_out_tlast), .a_tvalid(dds_out_tvalid), .a_tready(dds_out_tready),
+ .b_tdata(scaling_tdata), .b_tlast(1'b0), .b_tvalid(dds_out_tvalid /* aligning scaling_tdata with dds_tdata */), .b_tready(scaling_tready),
+ .p_tdata(scaled_i_tdata), .p_tlast(scaled_tlast), .p_tvalid(scaled_tvalid), .p_tready(scaled_tready));
+
+ mult #(
+ .WIDTH_A(DDS_WIDTH),
+ .WIDTH_B(SCALING_WIDTH),
+ .WIDTH_P(DDS_WIDTH+SCALING_WIDTH),
+ .DROP_TOP_P(4),
+ .LATENCY(3),
+ .CASCADE_OUT(0))
+ q_mult (
+ .clk(clk), .reset(reset | clear),
+ .a_tdata(dds_out_q_tdata), .a_tlast(), .a_tvalid(dds_out_tvalid), .a_tready(),
+ .b_tdata(scaling_tdata), .b_tlast(1'b0), .b_tvalid(dds_out_tvalid /* aligning scaling_tdata with dds_tdata */), .b_tready(),
+ .p_tdata(scaled_q_tdata), .p_tlast(), .p_tvalid(), .p_tready(scaled_tready));
+
+ wire [2*WIDTH-1:0] sample_tdata;
+ wire sample_tlast, sample_tvalid, sample_tready;
+
+ axi_round_and_clip_complex #(
+ .WIDTH_IN(DDS_WIDTH+SCALING_WIDTH), .WIDTH_OUT(WIDTH), .CLIP_BITS(12))
+ axi_round_and_clip_complex (
+ .clk(clk), .reset(reset | clear),
+ .i_tdata({scaled_i_tdata, scaled_q_tdata}), .i_tlast(scaled_tlast), .i_tvalid(scaled_tvalid), .i_tready(scaled_tready),
+ .o_tdata(sample_tdata), .o_tlast(sample_tlast), .o_tvalid(sample_tvalid), .o_tready(sample_tready));
+
+ // Throttle output on last sample if header is not valid
+ assign header_out_tready = sample_tlast & sample_tvalid & o_tready;
+ assign sample_tready = (sample_tvalid & sample_tlast) ? (header_out_tvalid & o_tready) : o_tready;
+ assign o_tvalid = (sample_tvalid & sample_tlast) ? header_out_tvalid : sample_tvalid;
+ assign o_tlast = sample_tlast;
+ assign o_tdata = sample_tdata;
+ assign o_tuser = header_out_tdata;
+
+endmodule