You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
600 lines
15 KiB
600 lines
15 KiB
/*
|
|
*
|
|
* $Id: k3baudiodecoder.cpp 619556 2007-01-03 17:38:12Z trueg $
|
|
* Copyright (C) 2003 Sebastian Trueg <trueg@k3b.org>
|
|
*
|
|
* This file is part of the K3b project.
|
|
* Copyright (C) 1998-2007 Sebastian Trueg <trueg@k3b.org>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
* See the file "COPYING" for the exact licensing terms.
|
|
*/
|
|
|
|
#include <config.h>
|
|
|
|
#include <k3bcore.h>
|
|
|
|
#include "k3baudiodecoder.h"
|
|
#include "k3bpluginmanager.h"
|
|
|
|
#include <kdebug.h>
|
|
#include <kfilemetainfo.h>
|
|
|
|
#include <tqmap.h>
|
|
|
|
#include <math.h>
|
|
|
|
#ifdef HAVE_LIBSAMPLERATE
|
|
#include <samplerate.h>
|
|
#else
|
|
#include "libsamplerate/samplerate.h"
|
|
#endif
|
|
|
|
#if !(HAVE_LRINT && HAVE_LRINTF)
|
|
#define lrint(dbl) ((int) (dbl))
|
|
#define lrintf(flt) ((int) (flt))
|
|
#endif
|
|
|
|
// use a one second buffer
|
|
static const int DECODING_BUFFER_SIZE = 75*2352;
|
|
|
|
class K3bAudioDecoder::Private
|
|
{
|
|
public:
|
|
Private()
|
|
: metaInfo(0),
|
|
resampleState(0),
|
|
resampleData(0),
|
|
inBuffer(0),
|
|
inBufferPos(0),
|
|
inBufferFill(0),
|
|
outBuffer(0),
|
|
monoBuffer(0),
|
|
decodingBufferPos(0),
|
|
decodingBufferFill(0),
|
|
valid(true) {
|
|
}
|
|
|
|
// the current position of the decoder
|
|
// This does NOT include the decodingBuffer
|
|
K3b::Msf currentPos;
|
|
|
|
// since the current position above is measured in frames
|
|
// there might be a little offset since the decoded data is not
|
|
// always a multiple of 2353 bytes
|
|
int currentPosOffset;
|
|
|
|
// already decoded bytes from last init or last seek
|
|
// TODO: replace alreadyDecoded with currentPos
|
|
unsigned long alreadyDecoded;
|
|
|
|
K3b::Msf decodingStartPos;
|
|
|
|
KFileMetaInfo* metaInfo;
|
|
|
|
// set to true once decodeInternal() returned 0
|
|
bool decoderFinished;
|
|
|
|
// resampling
|
|
SRC_STATE* resampleState;
|
|
SRC_DATA* resampleData;
|
|
|
|
float* inBuffer;
|
|
float* inBufferPos;
|
|
int inBufferFill;
|
|
|
|
float* outBuffer;
|
|
|
|
int samplerate;
|
|
int channels;
|
|
|
|
// mono -> stereo conversion
|
|
char* monoBuffer;
|
|
|
|
char decodingBuffer[DECODING_BUFFER_SIZE];
|
|
char* decodingBufferPos;
|
|
int decodingBufferFill;
|
|
|
|
TQMap<TQString, TQString> technicalInfoMap;
|
|
TQMap<MetaDataField, TQString> metaInfoMap;
|
|
|
|
bool valid;
|
|
};
|
|
|
|
|
|
|
|
K3bAudioDecoder::K3bAudioDecoder( TQObject* parent, const char* name )
|
|
: TQObject( parent, name )
|
|
{
|
|
d = new Private();
|
|
}
|
|
|
|
|
|
K3bAudioDecoder::~K3bAudioDecoder()
|
|
{
|
|
cleanup();
|
|
|
|
if( d->inBuffer ) delete [] d->inBuffer;
|
|
if( d->outBuffer ) delete [] d->outBuffer;
|
|
if( d->monoBuffer ) delete [] d->monoBuffer;
|
|
|
|
delete d->metaInfo;
|
|
delete d->resampleData;
|
|
if( d->resampleState )
|
|
src_delete( d->resampleState );
|
|
delete d;
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::setFilename( const TQString& filename )
|
|
{
|
|
m_fileName = filename;
|
|
delete d->metaInfo;
|
|
d->metaInfo = 0;
|
|
}
|
|
|
|
|
|
bool K3bAudioDecoder::isValid() const
|
|
{
|
|
return d->valid;
|
|
}
|
|
|
|
|
|
bool K3bAudioDecoder::analyseFile()
|
|
{
|
|
d->technicalInfoMap.clear();
|
|
d->metaInfoMap.clear();
|
|
delete d->metaInfo;
|
|
d->metaInfo = 0;
|
|
|
|
cleanup();
|
|
|
|
bool ret = analyseFileInternal( m_length, d->samplerate, d->channels );
|
|
if( ret && ( d->channels == 1 || d->channels == 2 ) && m_length > 0 ) {
|
|
d->valid = initDecoder();
|
|
return d->valid;
|
|
}
|
|
else {
|
|
d->valid = false;
|
|
return false;
|
|
}
|
|
}
|
|
|
|
|
|
bool K3bAudioDecoder::initDecoder( const K3b::Msf& startOffset )
|
|
{
|
|
if( initDecoder() ) {
|
|
if( startOffset > 0 )
|
|
return seek( startOffset );
|
|
else
|
|
return true;
|
|
}
|
|
else
|
|
return false;
|
|
}
|
|
|
|
|
|
bool K3bAudioDecoder::initDecoder()
|
|
{
|
|
cleanup();
|
|
|
|
if( d->resampleState )
|
|
src_reset( d->resampleState );
|
|
|
|
d->alreadyDecoded = 0;
|
|
d->currentPos = 0;
|
|
d->currentPosOffset = 0;
|
|
d->decodingBufferFill = 0;
|
|
d->decodingBufferPos = 0;
|
|
d->decodingStartPos = 0;
|
|
d->inBufferFill = 0;
|
|
|
|
d->decoderFinished = false;
|
|
|
|
return initDecoderInternal();
|
|
}
|
|
|
|
|
|
int K3bAudioDecoder::decode( char* _data, int maxLen )
|
|
{
|
|
unsigned long lengthToDecode = (m_length - d->decodingStartPos).audioBytes();
|
|
|
|
if( d->alreadyDecoded >= lengthToDecode )
|
|
return 0;
|
|
|
|
if( maxLen <= 0 )
|
|
return 0;
|
|
|
|
int read = 0;
|
|
|
|
if( d->decodingBufferFill == 0 ) {
|
|
//
|
|
// now we decode into the decoding buffer
|
|
// to ensure a minimum buffer size
|
|
//
|
|
d->decodingBufferFill = 0;
|
|
d->decodingBufferPos = d->decodingBuffer;
|
|
|
|
if( !d->decoderFinished ) {
|
|
if( d->samplerate != 44100 ) {
|
|
|
|
// check if we have data left from some previous conversion
|
|
if( d->inBufferFill > 0 ) {
|
|
read = resample( d->decodingBuffer, DECODING_BUFFER_SIZE );
|
|
}
|
|
else {
|
|
if( !d->inBuffer ) {
|
|
d->inBuffer = new float[DECODING_BUFFER_SIZE/2];
|
|
}
|
|
|
|
if( (read = decodeInternal( d->decodingBuffer, DECODING_BUFFER_SIZE )) == 0 )
|
|
d->decoderFinished = true;
|
|
|
|
d->inBufferFill = read/2;
|
|
d->inBufferPos = d->inBuffer;
|
|
from16bitBeSignedToFloat( d->decodingBuffer, d->inBuffer, d->inBufferFill );
|
|
|
|
read = resample( d->decodingBuffer, DECODING_BUFFER_SIZE );
|
|
}
|
|
}
|
|
else if( d->channels == 1 ) {
|
|
if( !d->monoBuffer ) {
|
|
d->monoBuffer = new char[DECODING_BUFFER_SIZE/2];
|
|
}
|
|
|
|
// we simply duplicate every frame
|
|
if( (read = decodeInternal( d->monoBuffer, DECODING_BUFFER_SIZE/2 )) == 0 )
|
|
d->decoderFinished = true;
|
|
|
|
for( int i = 0; i < read; i+=2 ) {
|
|
d->decodingBuffer[2*i] = d->decodingBuffer[2*i+2] = d->monoBuffer[i];
|
|
d->decodingBuffer[2*i+1] = d->decodingBuffer[2*i+3] = d->monoBuffer[i+1];
|
|
}
|
|
|
|
read *= 2;
|
|
}
|
|
else {
|
|
if( (read = decodeInternal( d->decodingBuffer, DECODING_BUFFER_SIZE )) == 0 )
|
|
d->decoderFinished = true;
|
|
}
|
|
}
|
|
|
|
if( read < 0 ) {
|
|
return -1;
|
|
}
|
|
else if( read == 0 ) {
|
|
// check if we need to pad
|
|
int bytesToPad = lengthToDecode - d->alreadyDecoded;
|
|
if( bytesToPad > 0 ) {
|
|
kdDebug() << "(K3bAudioDecoder) track length: " << lengthToDecode
|
|
<< "; decoded module data: " << d->alreadyDecoded
|
|
<< "; we need to pad " << bytesToPad << " bytes." << endl;
|
|
|
|
if( DECODING_BUFFER_SIZE < bytesToPad )
|
|
bytesToPad = DECODING_BUFFER_SIZE;
|
|
|
|
::memset( d->decodingBuffer, 0, bytesToPad );
|
|
|
|
kdDebug() << "(K3bAudioDecoder) padded " << bytesToPad << " bytes." << endl;
|
|
|
|
read = bytesToPad;
|
|
}
|
|
else {
|
|
kdDebug() << "(K3bAudioDecoder) decoded " << d->alreadyDecoded << " bytes." << endl;
|
|
return 0;
|
|
}
|
|
}
|
|
else {
|
|
|
|
// check if we decoded too much
|
|
if( d->alreadyDecoded + read > lengthToDecode ) {
|
|
kdDebug() << "(K3bAudioDecoder) we decoded too much. Cutting output by "
|
|
<< (read + d->alreadyDecoded - lengthToDecode) << endl;
|
|
read = lengthToDecode - d->alreadyDecoded;
|
|
}
|
|
}
|
|
|
|
d->decodingBufferFill = read;
|
|
}
|
|
|
|
|
|
// clear out the decoding buffer
|
|
read = TQMIN( maxLen, d->decodingBufferFill );
|
|
::memcpy( _data, d->decodingBufferPos, read );
|
|
d->decodingBufferPos += read;
|
|
d->decodingBufferFill -= read;
|
|
|
|
d->alreadyDecoded += read;
|
|
d->currentPos += (read+d->currentPosOffset)/2352;
|
|
d->currentPosOffset = (read+d->currentPosOffset)%2352;
|
|
|
|
return read;
|
|
}
|
|
|
|
|
|
// resample data in d->inBufferPos and save the result to data
|
|
//
|
|
//
|
|
int K3bAudioDecoder::resample( char* data, int maxLen )
|
|
{
|
|
if( !d->resampleState ) {
|
|
d->resampleState = src_new( SRC_SINC_MEDIUM_QUALITY, d->channels, 0 );
|
|
if( !d->resampleState ) {
|
|
kdDebug() << "(K3bAudioDecoder) unable to initialize resampler." << endl;
|
|
return -1;
|
|
}
|
|
d->resampleData = new SRC_DATA;
|
|
}
|
|
|
|
if( !d->outBuffer ) {
|
|
d->outBuffer = new float[DECODING_BUFFER_SIZE/2];
|
|
}
|
|
|
|
d->resampleData->data_in = d->inBufferPos;
|
|
d->resampleData->data_out = d->outBuffer;
|
|
d->resampleData->input_frames = d->inBufferFill/d->channels;
|
|
d->resampleData->output_frames = maxLen/2/2; // in case of mono files we need the space anyway
|
|
d->resampleData->src_ratio = 44100.0/(double)d->samplerate;
|
|
if( d->inBufferFill == 0 )
|
|
d->resampleData->end_of_input = 1; // this should force libsamplerate to output the last frames
|
|
else
|
|
d->resampleData->end_of_input = 0;
|
|
|
|
int len = 0;
|
|
if( (len = src_process( d->resampleState, d->resampleData ) ) ) {
|
|
kdDebug() << "(K3bAudioDecoder) error while resampling: " << src_strerror(len) << endl;
|
|
return -1;
|
|
}
|
|
|
|
if( d->channels == 2 )
|
|
fromFloatTo16BitBeSigned( d->outBuffer, data, d->resampleData->output_frames_gen*d->channels );
|
|
else {
|
|
for( int i = 0; i < d->resampleData->output_frames_gen; ++i ) {
|
|
fromFloatTo16BitBeSigned( &d->outBuffer[i], &data[4*i], 1 );
|
|
fromFloatTo16BitBeSigned( &d->outBuffer[i], &data[4*i+2], 1 );
|
|
}
|
|
}
|
|
|
|
d->inBufferPos += d->resampleData->input_frames_used*d->channels;
|
|
d->inBufferFill -= d->resampleData->input_frames_used*d->channels;
|
|
if( d->inBufferFill <= 0 ) {
|
|
d->inBufferPos = d->inBuffer;
|
|
d->inBufferFill = 0;
|
|
}
|
|
|
|
// 16 bit frames, so we need to multiply by 2
|
|
// and we always have two channels
|
|
return d->resampleData->output_frames_gen*2*2;
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::from16bitBeSignedToFloat( char* src, float* dest, int samples )
|
|
{
|
|
while( samples ) {
|
|
samples--;
|
|
dest[samples] = static_cast<float>( TQ_INT16(((src[2*samples]<<8)&0xff00)|(src[2*samples+1]&0x00ff)) / 32768.0 );
|
|
}
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::fromFloatTo16BitBeSigned( float* src, char* dest, int samples )
|
|
{
|
|
while( samples ) {
|
|
samples--;
|
|
|
|
float scaled = src[samples] * 32768.0;
|
|
TQ_INT16 val = 0;
|
|
|
|
// clipping
|
|
if( scaled >= ( 1.0 * 0x7FFF ) )
|
|
val = 32767;
|
|
else if( scaled <= ( -8.0 * 0x1000 ) )
|
|
val = -32768;
|
|
else
|
|
val = lrintf(scaled);
|
|
|
|
dest[2*samples] = val>>8;
|
|
dest[2*samples+1] = val;
|
|
}
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::from8BitTo16BitBeSigned( char* src, char* dest, int samples )
|
|
{
|
|
while( samples ) {
|
|
samples--;
|
|
|
|
float scaled = static_cast<float>(TQ_UINT8(src[samples])-128) / 128.0 * 32768.0;
|
|
TQ_INT16 val = 0;
|
|
|
|
// clipping
|
|
if( scaled >= ( 1.0 * 0x7FFF ) )
|
|
val = 32767;
|
|
else if( scaled <= ( -8.0 * 0x1000 ) )
|
|
val = -32768;
|
|
else
|
|
val = lrintf(scaled);
|
|
|
|
dest[2*samples] = val>>8;
|
|
dest[2*samples+1] = val;
|
|
}
|
|
}
|
|
|
|
|
|
bool K3bAudioDecoder::seek( const K3b::Msf& pos )
|
|
{
|
|
kdDebug() << "(K3bAudioDecoder) seek from " << d->currentPos.toString() << " (+" << d->currentPosOffset
|
|
<< ") to " << pos.toString() << endl;
|
|
|
|
if( pos > length() )
|
|
return false;
|
|
|
|
d->decoderFinished = false;
|
|
|
|
if( pos == d->currentPos && d->currentPosOffset == 0 )
|
|
return true;
|
|
|
|
if( pos == 0 )
|
|
return initDecoder();
|
|
|
|
bool success = false;
|
|
|
|
//
|
|
// First check if we may do a "perfect seek".
|
|
// We cannot rely on the decoding plugins to seek perfectly. Especially
|
|
// the mp3 decoder does not. But in case we want to split a live recording
|
|
// it is absolutely nesseccary to perform a perfect seek.
|
|
// So if we did not already decode past the seek position and the difference
|
|
// between the current position and the seek position is less than some fixed
|
|
// value we simply decode up to the seek position.
|
|
//
|
|
if( ( pos > d->currentPos ||
|
|
( pos == d->currentPos && d->currentPosOffset == 0 ) )
|
|
&&
|
|
( pos - d->currentPos < K3b::Msf(0,10,0) ) ) { // < 10 seconds is ok
|
|
kdDebug() << "(K3bAudioDecoder) performing perfect seek from " << d->currentPos.toString()
|
|
<< " to " << pos.toString() << ". :)" << endl;
|
|
|
|
unsigned long bytesToDecode = pos.audioBytes() - d->currentPos.audioBytes() - d->currentPosOffset;
|
|
kdDebug() << "(K3bAudioDecoder) seeking " << bytesToDecode << " bytes." << endl;
|
|
char buffi[10*2352];
|
|
while( bytesToDecode > 0 ) {
|
|
int read = decode( buffi, TQMIN(10*2352, bytesToDecode) );
|
|
if( read <= 0 )
|
|
return false;
|
|
|
|
bytesToDecode -= read;
|
|
}
|
|
|
|
kdDebug() << "(K3bAudioDecoder) perfect seek done." << endl;
|
|
|
|
success = true;
|
|
}
|
|
else {
|
|
//
|
|
// Here we have to reset the resampling stuff since we restart decoding at another position.
|
|
//
|
|
if( d->resampleState )
|
|
src_reset( d->resampleState );
|
|
d->inBufferFill = 0;
|
|
|
|
//
|
|
// And also reset the decoding buffer to not return any garbage from previous decoding.
|
|
//
|
|
d->decodingBufferFill = 0;
|
|
|
|
success = seekInternal( pos );
|
|
}
|
|
|
|
d->alreadyDecoded = 0;
|
|
d->currentPos = d->decodingStartPos = pos;
|
|
d->currentPosOffset = 0;
|
|
|
|
return success;
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::cleanup()
|
|
{
|
|
}
|
|
|
|
|
|
TQString K3bAudioDecoder::metaInfo( MetaDataField f )
|
|
{
|
|
if( d->metaInfoMap.contains( f ) )
|
|
return d->metaInfoMap[f];
|
|
|
|
// fall back to KFileMetaInfo
|
|
if( !d->metaInfo )
|
|
d->metaInfo = new KFileMetaInfo( filename() );
|
|
|
|
if( d->metaInfo->isValid() ) {
|
|
TQString tag;
|
|
switch( f ) {
|
|
case META_TITLE:
|
|
tag = "Title";
|
|
break;
|
|
case META_ARTIST:
|
|
tag = "Artist";
|
|
break;
|
|
case META_SONGWRITER:
|
|
tag = "Songwriter";
|
|
break;
|
|
case META_COMPOSER:
|
|
tag = "Composer";
|
|
break;
|
|
case META_COMMENT:
|
|
tag = "Comment";
|
|
break;
|
|
}
|
|
|
|
KFileMetaInfoItem item = d->metaInfo->item( tag );
|
|
if( item.isValid() )
|
|
return item.string();
|
|
}
|
|
|
|
return TQString();
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::addMetaInfo( MetaDataField f, const TQString& value )
|
|
{
|
|
if( !value.isEmpty() )
|
|
d->metaInfoMap[f] = value;
|
|
else
|
|
kdDebug() << "(K3bAudioDecoder) empty meta data field." << endl;
|
|
}
|
|
|
|
|
|
TQStringList K3bAudioDecoder::supportedTechnicalInfos() const
|
|
{
|
|
TQStringList l;
|
|
for( TQMap<TQString, TQString>::const_iterator it = d->technicalInfoMap.begin();
|
|
it != d->technicalInfoMap.end(); ++it )
|
|
l.append( it.key() );
|
|
return l;
|
|
}
|
|
|
|
|
|
TQString K3bAudioDecoder::technicalInfo( const TQString& key ) const
|
|
{
|
|
return d->technicalInfoMap[key];
|
|
}
|
|
|
|
|
|
void K3bAudioDecoder::addTechnicalInfo( const TQString& key, const TQString& value )
|
|
{
|
|
d->technicalInfoMap[key] = value;
|
|
}
|
|
|
|
|
|
K3bAudioDecoder* K3bAudioDecoderFactory::createDecoder( const KURL& url )
|
|
{
|
|
kdDebug() << "(K3bAudioDecoderFactory::createDecoder( " << url.path() << " )" << endl;
|
|
TQPtrList<K3bPlugin> fl = k3bcore->pluginManager()->plugins( "AudioDecoder" );
|
|
|
|
// first search for a single format decoder
|
|
for( TQPtrListIterator<K3bPlugin> it( fl ); it.current(); ++it ) {
|
|
K3bAudioDecoderFactory* f = dynamic_cast<K3bAudioDecoderFactory*>( it.current() );
|
|
if( f && !f->multiFormatDecoder() && f->canDecode( url ) ) {
|
|
kdDebug() << "1" << endl; return f->createDecoder();}
|
|
}
|
|
|
|
// no single format decoder. Search for a multi format decoder
|
|
for( TQPtrListIterator<K3bPlugin> it( fl ); it.current(); ++it ) {
|
|
K3bAudioDecoderFactory* f = dynamic_cast<K3bAudioDecoderFactory*>( it.current() );
|
|
if( f && f->multiFormatDecoder() && f->canDecode( url ) ) {
|
|
kdDebug() << "2" << endl; return f->createDecoder();}
|
|
}
|
|
|
|
kdDebug() << "(K3bAudioDecoderFactory::createDecoder( " << url.path() << " ) no success" << endl;
|
|
|
|
// nothing found
|
|
return 0;
|
|
}
|
|
|
|
#include "k3baudiodecoder.moc"
|