You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
74 lines
2.1 KiB
74 lines
2.1 KiB
/*************************************************************************** |
|
* Copyright (C) 2013 by Azat Khuzhin <a3at.mail@gmail.com> * |
|
* * |
|
* This program is free software; you can redistribute it and/or modify * |
|
* it under the terms of the GNU General Public License as published by * |
|
* the Free Software Foundation; either version 2 of the License, or * |
|
* (at your option) any later version. * |
|
***************************************************************************/ |
|
|
|
|
|
#include <QFile> |
|
#include <QDataStream> |
|
#include <QTextCodec> |
|
|
|
#include <kencodingprober.h> |
|
#include <QtCore/QDebug> |
|
|
|
#include "document.h" |
|
#include "debug_txt.h" |
|
|
|
using namespace Txt; |
|
|
|
Document::Document( const QString &fileName ) |
|
{ |
|
#ifdef TXT_DEBUG |
|
qCDebug(OkularTxtDebug) << "Opening file" << fileName; |
|
#endif |
|
|
|
QFile plainFile( fileName ); |
|
if ( !plainFile.open( QIODevice::ReadOnly | QIODevice::Text ) ) |
|
{ |
|
qCDebug(OkularTxtDebug) << "Can't open file" << plainFile.fileName(); |
|
return; |
|
} |
|
|
|
const QByteArray buffer = plainFile.readAll(); |
|
setPlainText( toUnicode(buffer) ); |
|
} |
|
|
|
Document::~Document() |
|
{ |
|
} |
|
|
|
QString Document::toUnicode( const QByteArray &array ) |
|
{ |
|
QByteArray encoding; |
|
KEncodingProber prober(KEncodingProber::Universal); |
|
int charsFeeded = 0; |
|
int chunkSize = 3000; // ~= number of symbols in page. |
|
|
|
// Try to detect encoding. |
|
while ( encoding.isEmpty() && charsFeeded < array.size() ) |
|
{ |
|
prober.feed( array.mid( charsFeeded, chunkSize ) ); |
|
charsFeeded += chunkSize; |
|
|
|
if (prober.confidence() >= 0.5) |
|
{ |
|
encoding = prober.encoding(); |
|
break; |
|
} |
|
} |
|
|
|
if ( encoding.isEmpty() ) |
|
{ |
|
return QString(); |
|
} |
|
|
|
qCDebug(OkularTxtDebug) << "Detected" << prober.encoding() << "encoding" |
|
<< "based on" << charsFeeded << "chars"; |
|
return QTextCodec::codecForName( encoding )->toUnicode( array ); |
|
} |
|
|
|
Q_LOGGING_CATEGORY(OkularTxtDebug, "org.kde.okular.generators.txt")
|
|
|