// path: root/src/atrac1denc.h
// blob: 841e3e5a46b6db635707b5f2085584b173c6590a
/*
 * This file is part of AtracDEnc.
 *
 * AtracDEnc is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * AtracDEnc is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with AtracDEnc; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#pragma once
#include "pcmengin.h"
#include "aea.h"
#include "transient_detector.h"
#include "atrac/atrac1.h"
#include "atrac/atrac1_qmf.h"
#include "atrac/atrac_scale.h"
#include "lib/mdct/mdct.h"

#include <assert.h>
#include <vector>

namespace NAtracDEnc {

// Operating-mode selectors. Each enumerator occupies its own bit
// (values 1, 2 and 4).
// NOTE(review): presumably meant to be OR-ed together as flags - confirm at the call sites.
enum EMode {
    E_ENCODE = 1 << 0,
    E_DECODE = 1 << 1,
    E_ATRAC3 = 1 << 2
};

// Holds the forward (NMDCT::TMDCT) and inverse (NMDCT::TMIDCT) transform
// objects of sizes 512, 256 and 64, and declares the Mdct()/IMdct() entry
// points whose definitions live outside this header.
class TAtrac1MDCT {
public:
    // Constructs every transform with its fixed argument:
    //   forward 512 -> 1, forward 256 -> 0.5, forward 64 -> 0.5,
    //   inverse N   -> N * 2 for N in {512, 256, 64}.
    // NOTE(review): these arguments look like scale factors - confirm
    // against the NMDCT constructors.
    TAtrac1MDCT()
        : Mdct512(1)
        , Mdct256(0.5)
        , Mdct64(0.5)
        , Midct512(512 * 2)
        , Midct256(256 * 2)
        , Midct64(64 * 2)
    {}

    // Forward transform entry point.
    // specs     - 512-element spectrum array.
    // low/mid/hi - per-band sample buffers.
    // blockSize - block-size selection for the transform.
    // NOTE(review): presumably reads the band buffers and fills specs -
    // confirm in the implementation file.
    void Mdct(TFloat specs[512], TFloat* low, TFloat* mid, TFloat* hi, const TBlockSize& blockSize);

    // Inverse transform entry point.
    // specs     - 512-element spectrum array.
    // mode      - block-size selection for the transform.
    // low/mid/hi - per-band sample buffers.
    // NOTE(review): presumably reads specs and fills the band buffers -
    // confirm in the implementation file.
    void IMdct(TFloat specs[512], const TBlockSize& mode, TFloat* low, TFloat* mid, TFloat* hi);

private:
    // Forward transforms, one per supported size.
    NMDCT::TMDCT<512> Mdct512;
    NMDCT::TMDCT<256> Mdct256;
    NMDCT::TMDCT<64> Mdct64;
    // Inverse transforms, one per supported size.
    NMDCT::TMIDCT<512> Midct512;
    NMDCT::TMIDCT<256> Midct256;
    NMDCT::TMIDCT<64> Midct64;
};

// ATRAC1 encoder processing stage: an IProcessor<TFloat> that also inherits
// the transform set from TAtrac1MDCT. Only declarations are given here; the
// constructor and GetLambda() are defined outside this header.
class TAtrac1Encoder : public IProcessor<TFloat>, public TAtrac1MDCT {
    // Compressed-output handle.
    // NOTE(review): presumably taken from the constructor's `aea` argument - confirm.
    TCompressedOutputPtr Aea;
    // Encode settings; const, so fixed once construction finishes.
    const NAtrac1::TAtrac1EncodeSettings Settings;

    // Per-band sample buffers with a leading dimension of 2 and 16 extra
    // entries beyond the 256/256/512 band length.
    // NOTE(review): the leading dimension presumably indexes the channel and
    // the extra 16 entries presumably hold overlap data - confirm in the .cpp.
    TFloat PcmBufLow[2][256 + 16];
    TFloat PcmBufMid[2][256 + 16];
    TFloat PcmBufHi[2][512 + 16];

    // Two analysis filter banks (presumably one per channel - confirm).
    Atrac1AnalysisFilterBank<TFloat> AnalysisFilterBank[2];

    // Loudness weighting table; const, so fixed once construction finishes.
    const std::vector<float> LoudnessCurve;

    // Groups the transient detectors: for each of the three bands
    // (low, mid, hi) there is a vector of two detectors indexed by channel.
    class TTransientDetectors {
        std::vector<TTransientDetector> transientDetectorLow;
        std::vector<TTransientDetector> transientDetectorMid;
        std::vector<TTransientDetector> transientDetectorHi;
    public:
        // Creates two detectors per band: (16, 128) for the low and mid
        // bands and (16, 256) for the hi band.
        TTransientDetectors()
            : transientDetectorLow(2, TTransientDetector(16, 128))
            , transientDetectorMid(2, TTransientDetector(16, 128))
            , transientDetectorHi(2, TTransientDetector(16, 256))
        {}

        // Returns the detector for `channel` in `band`
        // (0 = low, 1 = mid, 2 = hi).
        // `channel` must be smaller than the number of detectors per band (2).
        // An unknown band trips the assert; when asserts are compiled out the
        // low-band detector is returned so that every path yields a valid
        // reference.
        TTransientDetector& GetDetector(uint32_t channel, uint32_t band) {
            // vector::operator[] performs no bounds check, so catch an
            // out-of-range channel in debug builds. All three vectors have
            // the same size, so checking one of them is sufficient.
            assert(channel < transientDetectorLow.size());
            switch (band) {
                case 0:
                    return transientDetectorLow[channel];
                case 1:
                    return transientDetectorMid[channel];
                case 2:
                    return transientDetectorHi[channel];
                default:
                    assert(false);
                    return transientDetectorLow[channel];
            }
        }
    };
    TAtrac1Encoder::TTransientDetectors TransientDetectors;

    TScaler<NAtrac1::TAtrac1Data> Scaler;
    // Initial value of Loudness.
    static constexpr float LoudFactor = 0.006;
    // Loudness state, starting at LoudFactor.
    // NOTE(review): presumably updated while encoding - confirm in the .cpp.
    float Loudness = LoudFactor;

public:
    // Builds an encoder from a compressed-output handle and encode settings,
    // both passed as rvalue references. Defined outside this header.
    TAtrac1Encoder(TCompressedOutputPtr&& aea, NAtrac1::TAtrac1EncodeSettings&& settings);
    // IProcessor override returning the processing callable for the PCM engine.
    TPCMEngine<TFloat>::TProcessLambda GetLambda() override;
};

// ATRAC1 decoder processing stage: an IProcessor<TFloat> that also inherits
// the transform set from TAtrac1MDCT. Only declarations are given here; the
// constructor and GetLambda() are defined outside this header.
class TAtrac1Decoder : public IProcessor<TFloat>, public TAtrac1MDCT {
public:
    // Builds a decoder from a compressed-input handle passed as an rvalue
    // reference. Defined outside this header.
    TAtrac1Decoder(TCompressedInputPtr&& aea);

    // IProcessor override returning the processing callable for the PCM engine.
    TPCMEngine<TFloat>::TProcessLambda GetLambda() override;

private:
    // Compressed-input handle.
    // NOTE(review): presumably taken from the constructor's `aea` argument - confirm.
    TCompressedInputPtr Aea;
    // Settings object; const, so fixed once construction finishes.
    const NAtrac1::TAtrac1EncodeSettings Settings;

    // Per-band sample buffers with a leading dimension of 2 and 16 extra
    // entries beyond the 256/256/512 band length.
    // NOTE(review): the leading dimension presumably indexes the channel -
    // confirm in the .cpp.
    TFloat PcmBufLow[2][256 + 16];
    TFloat PcmBufMid[2][256 + 16];
    TFloat PcmBufHi[2][512 + 16];

    // Running extremes, starting at +1 / -1.
    // NOTE(review): presumably track the largest/smallest decoded PCM value -
    // confirm in the .cpp.
    int32_t PcmValueMax = 1;
    int32_t PcmValueMin = -1;

    // Two synthesis filter banks (presumably one per channel - confirm).
    Atrac1SynthesisFilterBank<TFloat> SynthesisFilterBank[2];
};

}