/* OFDM modem decoder Copyright 2021 Ahmet Inan */ #include #include #include #include namespace DSP { using std::abs; using std::min; using std::cos; using std::sin; } #include "bip_buffer.hh" #include "theil_sen.hh" #include "xorshift.hh" #include "trigger.hh" #include "complex.hh" #include "decibel.hh" #include "blockdc.hh" #include "hilbert.hh" #include "phasor.hh" #include "bitman.hh" #include "delay.hh" #include "sma.hh" #include "wav.hh" #include "pcm.hh" #include "fft.hh" #include "mls.hh" #include "crc.hh" #include "osd.hh" #include "psk.hh" #include "polar_tables.hh" #include "polar_helper.hh" #include "polar_encoder.hh" #include "polar_list_decoder.hh" template struct SchmidlCox { typedef DSP::Const Const; static const int match_len = guard_len | 1; static const int match_del = (match_len - 1) / 2; DSP::FastFourierTransform fwd; DSP::FastFourierTransform bwd; DSP::SMA4 cor; DSP::SMA4 pwr; DSP::SMA4 match; DSP::Delay delay; DSP::SchmittTrigger threshold; DSP::FallingEdgeTrigger falling; cmplx tmp0[symbol_len], tmp1[symbol_len], tmp2[symbol_len]; cmplx seq[symbol_len], kern[symbol_len]; cmplx cmplx_shift = 0; value timing_max = 0; value phase_max = 0; int index_max = 0; static int bin(int carrier) { return (carrier + symbol_len) % symbol_len; } static cmplx demod_or_erase(cmplx curr, cmplx prev) { if (!(norm(prev) > 0)) return 0; cmplx cons = curr / prev; if (!(norm(cons) <= 4)) return 0; return cons; } public: int symbol_pos = 0; value cfo_rad = 0; value frac_cfo = 0; SchmidlCox(const cmplx *sequence) : threshold(value(0.17*match_len), value(0.19*match_len)) { for (int i = 0; i < symbol_len; ++i) seq[i] = sequence[i]; fwd(kern, sequence); for (int i = 0; i < symbol_len; ++i) kern[i] = conj(kern[i]) / value(symbol_len); } bool operator()(const cmplx *samples) { cmplx P = cor(samples[search_pos+symbol_len] * conj(samples[search_pos+2*symbol_len])); value R = value(0.5) * pwr(norm(samples[search_pos+2*symbol_len])); value min_R = 0.0001 * symbol_len; R = std::max(R, min_R); value timing = match(norm(P) / (R * R)); value phase = delay(arg(P)); bool collect = threshold(timing); bool process = falling(collect); if (!collect && !process) return false; if (timing_max < timing) { timing_max = timing; phase_max = phase; index_max = match_del; } else if (index_max < symbol_len + guard_len + match_del) { ++index_max; } if (!process) return false; frac_cfo = phase_max / value(symbol_len); DSP::Phasor osc; osc.omega(frac_cfo); symbol_pos = search_pos - index_max; index_max = 0; timing_max = 0; for (int i = 0; i < symbol_len; ++i) tmp1[i] = samples[i+symbol_pos+symbol_len] * osc(); fwd(tmp0, tmp1); for (int i = 0; i < symbol_len; ++i) tmp1[i] = demod_or_erase(tmp0[i], tmp0[bin(i-1)]); fwd(tmp0, tmp1); for (int i = 0; i < symbol_len; ++i) tmp0[i] *= kern[i]; bwd(tmp2, tmp0); int shift = 0; value peak = 0; value next = 0; for (int i = 0; i < symbol_len; ++i) { value power = norm(tmp2[i]); if (power > peak) { next = peak; peak = power; shift = i; } else if (power > next) { next = power; } } if (peak <= next * 4) return false; int pos_err = std::nearbyint(arg(tmp2[shift]) * symbol_len / Const::TwoPi()); if (abs(pos_err) > guard_len / 2) return false; symbol_pos -= pos_err; cfo_rad = shift * (Const::TwoPi() / symbol_len) - frac_cfo; if (cfo_rad >= Const::Pi()) cfo_rad -= Const::TwoPi(); return true; } }; void base37_decoder(char *str, long long int val, int len) { for (int i = len-1; i >= 0; --i, val /= 37) str[i] = " 0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ"[val%37]; } template struct Decoder { typedef float code_type; #ifdef __AVX2__ typedef SIMD mesg_type; #else typedef SIMD mesg_type; #endif typedef DSP::Const Const; static const int symbol_len = (1280 * rate) / 8000; static const int filter_len = (((21 * rate) / 8000) & ~3) | 1; static const int guard_len = symbol_len / 8; static const int data_bits = 43040; static const int crc_bits = data_bits + 32; static const int mod_min = 2; static const int mod_max = 3; static const int cons_max = 64800 / mod_min; static const int cols_min = 256; static const int rows_max = cons_max / cols_min; static const int mls0_len = 127; static const int mls0_off = - mls0_len + 1; static const int mls0_poly = 0b10001001; static const int mls1_len = 255; static const int mls1_off = - mls1_len / 2; static const int mls1_poly = 0b100101011; static const int buffer_len = (rows_max + 8) * (symbol_len + guard_len); static const int search_pos = buffer_len - 4 * (symbol_len + guard_len); DSP::ReadPCM *pcm; DSP::FastFourierTransform fwd; DSP::FastFourierTransform bwd; DSP::BlockDC blockdc; DSP::Hilbert hilbert; DSP::BipBuffer input_hist; DSP::TheilSenEstimator2 tse; SchmidlCox correlator; CODE::CRC crc0; CODE::CRC crc1; CODE::OrderedStatisticsDecoder<255, 71, 4> osddec; CODE::PolarEncoder polarenc; CODE::PolarListDecoder polardec; int8_t genmat[255*71]; mesg_type mesg[44096], mess[65536]; code_type code[65536]; cmplx head[symbol_len], tail[symbol_len], cons[cons_max]; cmplx fdom[symbol_len], tdom[buffer_len]; value index[cons_max], phase[cons_max]; value cfo_rad, sfo_rad; const uint32_t *frozen_bits; int code_order; int symbol_pos; int oper_mode; int mod_bits; int cons_cnt; int cons_bits; int mesg_bits; static int bin(int carrier) { return (carrier + symbol_len) % symbol_len; } static int nrz(bool bit) { return 1 - 2 * bit; } static cmplx demod_or_erase(cmplx curr, cmplx prev) { if (!(norm(prev) > 0)) return 0; cmplx cons = curr / prev; if (!(norm(cons) <= 4)) return 0; return cons; } const cmplx *mls0_seq() { CODE::MLS seq0(mls0_poly); for (int i = 0; i < symbol_len/2; ++i) fdom[i] = 0; for (int i = 0; i < mls0_len; ++i) fdom[(i+mls0_off/2+symbol_len/2)%(symbol_len/2)] = nrz(seq0()); return fdom; } void lengthen() { int code_bits = 1 << code_order; for (int i = code_bits-1, j = cons_bits-1, k = mesg_bits-1; i >= 0; --i) if ((frozen_bits[i/32] >> (i%32)) & 1 || k-- < crc_bits) code[i] = code[j--]; else code[i] = CODE::PolarHelper::quant(9000); } void systematic() { polarenc(mess, mesg, frozen_bits, code_order); int code_bits = 1 << code_order; for (int i = 0, j = 0; i < code_bits && j < mesg_bits; ++i) if (!((frozen_bits[i/32] >> (i%32)) & 1)) mesg[j++] = mess[i]; } cmplx mod_map(code_type *b) { switch (oper_mode) { case 6: case 7: case 10: case 11: return PhaseShiftKeying<8, cmplx, code_type>::map(b); case 8: case 9: case 12: case 13: return PhaseShiftKeying<4, cmplx, code_type>::map(b); } return 0; } void mod_hard(code_type *b, cmplx c) { switch (oper_mode) { case 6: case 7: case 10: case 11: PhaseShiftKeying<8, cmplx, code_type>::hard(b, c); break; case 8: case 9: case 12: case 13: PhaseShiftKeying<4, cmplx, code_type>::hard(b, c); break; } } void mod_soft(code_type *b, cmplx c, value precision) { switch (oper_mode) { case 6: case 7: case 10: case 11: PhaseShiftKeying<8, cmplx, code_type>::soft(b, c, precision); break; case 8: case 9: case 12: case 13: PhaseShiftKeying<4, cmplx, code_type>::soft(b, c, precision); break; } } Decoder(uint8_t *out, DSP::ReadPCM *pcm, int skip_count) : pcm(pcm), correlator(mls0_seq()), crc0(0xA8F4), crc1(0xD419CC15) { CODE::BoseChaudhuriHocquenghemGenerator<255, 71>::matrix(genmat, true, { 0b100011101, 0b101110111, 0b111110011, 0b101101001, 0b110111101, 0b111100111, 0b100101011, 0b111010111, 0b000010011, 0b101100101, 0b110001011, 0b101100011, 0b100011011, 0b100111111, 0b110001101, 0b100101101, 0b101011111, 0b111111001, 0b111000011, 0b100111001, 0b110101001, 0b000011111, 0b110000111, 0b110110001}); bool real = pcm->channels() == 1; blockdc.samples(2*(symbol_len+guard_len)); const cmplx *buf; do { do { if (!pcm->good()) return; cmplx tmp; pcm->read(reinterpret_cast(&tmp), 1); if (real) tmp = hilbert(blockdc(tmp.real())); buf = input_hist(tmp); } while (!correlator(buf)); } while (skip_count--); symbol_pos = correlator.symbol_pos; cfo_rad = correlator.cfo_rad; std::cerr << "symbol pos: " << symbol_pos << std::endl; std::cerr << "coarse cfo: " << cfo_rad * (rate / Const::TwoPi()) << " Hz " << std::endl; DSP::Phasor osc; osc.omega(-cfo_rad); for (int i = 0; i < symbol_len; ++i) tdom[i] = buf[i+symbol_pos+(symbol_len+guard_len)] * osc(); fwd(fdom, tdom); CODE::MLS seq1(mls1_poly); for (int i = 0; i < mls1_len; ++i) fdom[bin(i+mls1_off)] *= nrz(seq1()); int8_t soft[mls1_len]; uint8_t data[(mls1_len+7)/8]; for (int i = 0; i < mls1_len; ++i) soft[i] = std::min(std::max( std::nearbyint(127 * demod_or_erase( fdom[bin(i+mls1_off)], fdom[bin(i-1+mls1_off)]).real()), -128), 127); bool unique = osddec(data, soft, genmat); if (!unique) { std::cerr << "OSD error." << std::endl; return; } uint64_t md = 0; for (int i = 0; i < 55; ++i) md |= (uint64_t)CODE::get_be_bit(data, i) << i; uint16_t cs = 0; for (int i = 0; i < 16; ++i) cs |= (uint16_t)CODE::get_be_bit(data, i+55) << i; crc0.reset(); if (crc0(md<<9) != cs) { std::cerr << "header CRC error." << std::endl; return; } oper_mode = md & 255; int cons_cols; switch (oper_mode) { case 6: cons_cols = 432; mod_bits = 3; code_order = 16; cons_bits = 64800; mesg_bits = 43808; frozen_bits = frozen_64800_43072; break; case 7: cons_cols = 400; mod_bits = 3; code_order = 16; cons_bits = 64800; mesg_bits = 43808; frozen_bits = frozen_64800_43072; break; case 8: cons_cols = 400; mod_bits = 2; code_order = 16; cons_bits = 64800; mesg_bits = 43808; frozen_bits = frozen_64800_43072; break; case 9: cons_cols = 360; mod_bits = 2; code_order = 16; cons_bits = 64800; mesg_bits = 43808; frozen_bits = frozen_64800_43072; break; case 10: cons_cols = 512; mod_bits = 3; code_order = 16; cons_bits = 64512; mesg_bits = 44096; frozen_bits = frozen_64512_43072; break; case 11: cons_cols = 384; mod_bits = 3; code_order = 16; cons_bits = 64512; mesg_bits = 44096; frozen_bits = frozen_64512_43072; break; case 12: cons_cols = 384; mod_bits = 2; code_order = 16; cons_bits = 64512; mesg_bits = 44096; frozen_bits = frozen_64512_43072; break; case 13: cons_cols = 256; mod_bits = 2; code_order = 16; cons_bits = 64512; mesg_bits = 44096; frozen_bits = frozen_64512_43072; break; default: std::cerr << "operation mode " << oper_mode << " unsupported." << std::endl; return; } cons_cnt = cons_bits / mod_bits; std::cerr << "oper mode: " << oper_mode << std::endl; if ((md>>8) == 0 || (md>>8) >= 129961739795077L) { std::cerr << "call sign unsupported." << std::endl; return; } char call_sign[10]; base37_decoder(call_sign, md>>8, 9); call_sign[9] = 0; std::cerr << "call sign: " << call_sign << std::endl; int cons_rows = cons_cnt / cons_cols; int code_off = - cons_cols / 2; osc.omega(-cfo_rad); for (int i = 0; i < buffer_len; ++i) tdom[i] = buf[i] * osc(); cmplx *cur = tdom + symbol_pos - (cons_rows + 1) * (symbol_len + guard_len); fwd(fdom, cur); for (int j = 0; j < cons_rows; ++j) { for (int i = 0; i < cons_cols; ++i) head[bin(i+code_off)] = fdom[bin(i+code_off)]; fwd(fdom, cur += symbol_len+guard_len); for (int i = 0; i < cons_cols; ++i) cons[cons_cols*j+i] = demod_or_erase(fdom[bin(i+code_off)], head[bin(i+code_off)]); } if (1) { for (int i = 0; i < cons_cnt; ++i) { code_type tmp[mod_max]; mod_hard(tmp, cons[i]); index[i] = (i % cons_cols) + code_off; phase[i] = arg(cons[i] * conj(mod_map(tmp))); } tse.compute(index, phase, cons_cnt); //std::cerr << "Theil-Sen slope = " << tse.slope() << std::endl; //std::cerr << "Theil-Sen yint = " << tse.yint() << std::endl; sfo_rad -= tse.slope() * symbol_len / value(symbol_len+guard_len); cfo_rad += tse.yint() / (symbol_len+guard_len); std::cerr << "coarse sfo: " << 1000000 * sfo_rad / Const::TwoPi() << " ppm" << std::endl; std::cerr << "finer cfo: " << cfo_rad * (rate / Const::TwoPi()) << " Hz " << std::endl; for (int i = 0; i < cons_cnt; ++i) cons[i] *= DSP::polar(1, -tse((i % cons_cols) + code_off)); } value precision = 16; if (1) { value sp = 0, np = 0; for (int i = 0; i < cons_cnt; ++i) { code_type tmp[mod_max]; mod_hard(tmp, cons[i]); cmplx hard = mod_map(tmp); cmplx error = cons[i] - hard; sp += norm(hard); np += norm(error); } value snr = DSP::decibel(sp / np); std::cerr << "init Es/N0: " << snr << " dB" << std::endl; // $LLR=log(\frac{p(x=+1|y)}{p(x=-1|y)})$ // $p(x|\mu,\sigma)=\frac{1}{\sqrt{2\pi}\sigma}}e^{-\frac{(x-\mu)^2}{2\sigma^2}}$ value sigma = std::sqrt(np / (2 * sp)); precision = 1 / (sigma * sigma); } for (int i = 0; i < cons_cnt; ++i) mod_soft(code+mod_bits*i, cons[i], precision); lengthen(); CODE::PolarHelper::PATH metric[mesg_type::SIZE]; polardec(metric, mesg, code, frozen_bits, code_order); systematic(); int order[mesg_type::SIZE]; for (int k = 0; k < mesg_type::SIZE; ++k) order[k] = k; std::sort(order, order+mesg_type::SIZE, [metric](int a, int b){ return metric[a] < metric[b]; }); int best = -1; for (int k = 0; k < mesg_type::SIZE; ++k) { crc1.reset(); for (int i = 0; i < crc_bits; ++i) crc1(mesg[i].v[order[k]] < 0); if (crc1() == 0) { best = order[k]; break; } } if (best < 0) { std::cerr << "payload decoding error." << std::endl; return; } for (int i = 0; i < data_bits; ++i) CODE::set_le_bit(out, i, mesg[i].v[best] < 0); } }; int main(int argc, char **argv) { if (argc < 3 || argc > 4) { std::cerr << "usage: " << argv[0] << " OUTPUT INPUT [SKIP]" << std::endl; return 1; } typedef float value; typedef DSP::Complex cmplx; const char *output_name = argv[1]; const char *input_name = argv[2]; DSP::ReadWAV input_file(input_name); if (input_file.channels() < 1 || input_file.channels() > 2) { std::cerr << "Only real or analytic signal (one or two channels) supported." << std::endl; return 1; } int skip_count = 1; if (argc > 3) skip_count = std::atoi(argv[3]); const int data_len = 43040 / 8; uint8_t *output_data = new uint8_t[data_len]; switch (input_file.rate()) { case 8000: delete new Decoder(output_data, &input_file, skip_count); break; case 16000: delete new Decoder(output_data, &input_file, skip_count); break; case 44100: delete new Decoder(output_data, &input_file, skip_count); break; case 48000: delete new Decoder(output_data, &input_file, skip_count); break; default: std::cerr << "Unsupported sample rate." << std::endl; return 1; } std::ofstream output_file(output_name, std::ios::binary | std::ios::trunc); if (output_file.bad()) { std::cerr << "Couldn't open file \"" << output_name << "\" for writing." << std::endl; return 1; } CODE::Xorshift32 scrambler; for (int i = 0; i < data_len; ++i) output_data[i] ^= scrambler(); for (int i = 0; i < data_len; ++i) output_file.put(output_data[i]); delete []output_data; return 0; }