diff --git a/src/dict/dictionary.hh b/src/dict/dictionary.hh index 010429ffa..2fed491be 100644 --- a/src/dict/dictionary.hh +++ b/src/dict/dictionary.hh @@ -226,6 +226,8 @@ public: hasAnyData( false ) { } +signals: + void finishedArticle( QString articleText ); protected: bool hasAnyData; // With this being false, dataSize() always returns -1 @@ -235,6 +237,8 @@ protected: /// A helper class for synchronous word search implementations. class WordSearchRequestInstant: public WordSearchRequest { + Q_OBJECT + public: WordSearchRequestInstant() diff --git a/src/dict/dictserver.cc b/src/dict/dictserver.cc index e7d7ae555..0e3d1da13 100644 --- a/src/dict/dictserver.cc +++ b/src/dict/dictserver.cc @@ -7,7 +7,6 @@ #include #include #include -#include "gddebug.hh" #include "htmlescape.hh" #include @@ -23,155 +22,173 @@ enum { namespace { -#define MAX_MATCHES_COUNT 60 -bool readLine( QTcpSocket & socket, QString & line, QString & errorString, QAtomicInt & isCancelled ) -{ - line.clear(); - errorString.clear(); - if ( socket.state() != QTcpSocket::ConnectedState ) - return false; +enum class DictServerState { + START, + CONNECT, + DB, + DB_DATA, + DB_DATA_FINISHED, + CLIENT, + AUTH, + OPTION, + HANDSHAKE, + + MATCH, + MATCH_DATA, + FINISHED, + DEFINE, + DEFINE_DATA, +}; - for ( ;; ) { - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; +#define MAX_MATCHES_COUNT 60 - if ( socket.canReadLine() ) { - QByteArray reply = socket.readLine(); - line = QString::fromUtf8( reply.data(), reply.size() ); - return true; - } - if ( !socket.waitForReadyRead( 2000 ) ) { - errorString = - "Data reading error: socket error " + QString::number( socket.error() ) + ": \"" + socket.errorString() + "\""; - break; - } - } - return false; +void disconnectFromServer( QTcpSocket & socket ) +{ + if ( socket.state() == QTcpSocket::ConnectedState ) + socket.write( QByteArray( "QUIT\r\n" ) ); + + socket.disconnectFromHost(); } -bool connectToServer( QTcpSocket & socket, QString const & url, QString & errorString, QAtomicInt & isCancelled ) -{ - QUrl serverUrl( url ); - quint16 port = serverUrl.port( DefaultPort ); - QString reply; - for ( ;; ) { - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; +class DictServerImpl: public QObject +{ + Q_OBJECT - socket.connectToHost( serverUrl.host(), port ); - if ( socket.state() != QTcpSocket::ConnectedState ) { - if ( !socket.waitForConnected( 2000 ) ) - break; - } + QString url; + QString errorString; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; + QMutex mutex; - if ( !readLine( socket, reply, errorString, isCancelled ) ) - break; + QString msgId; - if ( !reply.isEmpty() && reply.left( 3 ) != "220" ) { - errorString = "Server refuse connection: " + reply; - return false; - } +public: + QTcpSocket socket; + DictServerState state; - QString msgId = reply.mid( reply.lastIndexOf( " " ) ).trimmed(); - socket.write( QByteArray( "CLIENT GoldenDict\r\n" ) ); - if ( !socket.waitForBytesWritten( 1000 ) ) - break; + DictServerImpl( QObject * parent, QString const & url_ ): + QObject( parent ), + url( url_ ) + { + } - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; + void run( std::function< void() > callback ) + { + int pos = url.indexOf( "://" ); + if ( pos < 0 ) + url = "dict://" + url; - if ( !readLine( socket, reply, errorString, isCancelled ) ) - break; + QUrl serverUrl( url ); + quint16 port = serverUrl.port( DefaultPort ); + QString reply; + socket.connectToHost( serverUrl.host(), port ); + connect( &socket, &QTcpSocket::connected, this, [ this ]() { + //initialize the description. + QString req = QString( "CLIENT GoldenDict\r\n" ); + socket.write( req.toUtf8() ); + state = DictServerState::CONNECT; + } ); - if ( !serverUrl.userInfo().isEmpty() ) { - QString authCommand = QString( "AUTH " ); - QString authString = msgId; + connect( &socket, &QTcpSocket::errorOccurred, this, []( QAbstractSocket::SocketError error ) { + qDebug() << "socket error message: " << error; + } ); + connect( &socket, &QTcpSocket::readyRead, this, [ this, callback ]() { + QMutexLocker const _( &mutex ); - int pos = serverUrl.userInfo().indexOf( QRegularExpression( "[:;]" ) ); - if ( pos > 0 ) { - authCommand += serverUrl.userInfo().left( pos ); - authString += serverUrl.userInfo().mid( pos + 1 ); - } - else - authCommand += serverUrl.userInfo(); + if ( state == DictServerState::CONNECT ) { + QByteArray reply = socket.readLine(); + qDebug() << "received:" << reply; - authCommand += " "; - authCommand += QCryptographicHash::hash( authString.toUtf8(), QCryptographicHash::Md5 ).toHex(); - authCommand += "\r\n"; + if ( !reply.isEmpty() && reply.left( 3 ) != "220" ) { + errorString = "Server refuse connection: " + reply; + return; + } - socket.write( authCommand.toUtf8() ); + msgId = reply.mid( reply.lastIndexOf( " " ) ).trimmed(); - if ( !socket.waitForBytesWritten( 1000 ) ) - break; + state = DictServerState::CLIENT; + socket.write( QByteArray( "CLIENT GoldenDict\r\n" ) ); + } - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; + else if ( state == DictServerState::CLIENT ) { + QByteArray reply = socket.readLine(); + qDebug() << "received:" << reply; - if ( !readLine( socket, reply, errorString, isCancelled ) ) - break; + QUrl serverUrl( url ); + if ( !serverUrl.userInfo().isEmpty() ) { + QString authCommand = QString( "AUTH " ); + QString authString = msgId; - if ( reply.left( 3 ) != "230" ) { - errorString = "Authentication error: " + reply; - return false; - } - } + int pos = serverUrl.userInfo().indexOf( QRegularExpression( "[:;]" ) ); + if ( pos > 0 ) { + authCommand += serverUrl.userInfo().left( pos ); + authString += serverUrl.userInfo().mid( pos + 1 ); + } + else + authCommand += serverUrl.userInfo(); - socket.write( QByteArray( "OPTION MIME\r\n" ) ); + authCommand += " "; + authCommand += QCryptographicHash::hash( authString.toUtf8(), QCryptographicHash::Md5 ).toHex(); + authCommand += "\r\n"; - if ( !socket.waitForBytesWritten( 1000 ) ) - break; + state = DictServerState::AUTH; + socket.write( authCommand.toUtf8() ); + } + else { + state = DictServerState::OPTION; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - return false; + socket.write( QByteArray( "OPTION MIME\r\n" ) ); + } + } + else if ( state == DictServerState::OPTION || state == DictServerState::AUTH ) { - if ( !readLine( socket, reply, errorString, isCancelled ) ) - break; + QByteArray reply = socket.readLine(); + qDebug() << "received:" << reply; - if ( reply.left( 3 ) != "250" ) { - // RFC 2229, 3.10.1.1: - // OPTION MIME is a REQUIRED server capability, - // all DICT servers MUST implement this command. - errorString = "Server doesn't support mime capability: " + reply; - return false; - } + if ( reply.left( 3 ) != "250" ) { + // RFC 2229, 3.10.1.1: + // OPTION MIME is a REQUIRED server capability, + // all DICT servers MUST implement this command. + errorString = "Server doesn't support mime capability: " + reply; + return; + } + state = DictServerState::HANDSHAKE; - return true; + if ( callback ) { + callback(); + } + } + } ); } - if ( !Utils::AtomicInt::loadAcquire( isCancelled ) ) - errorString = QString( "Server connection fault, socket error %1: \"%2\"" ) - .arg( QString::number( socket.error() ) ) - .arg( socket.errorString() ); - return false; -} - -void disconnectFromServer( QTcpSocket & socket ) -{ - if ( socket.state() == QTcpSocket::ConnectedState ) - socket.write( QByteArray( "QUIT\r\n" ) ); + ~DictServerImpl() override + { + disconnectFromServer( socket ); + } +}; - socket.disconnectFromHost(); -} class DictServerDictionary: public Dictionary::Class { + Q_OBJECT + string name; QString url, icon; quint32 langId; QString errorString; - QTcpSocket socket; QStringList databases; QStringList strategies; - QStringList serverDatabases; + // QStringList serverDatabases; + DictServerState state; + QMutex mutex; + + QString msgId; public: + QTcpSocket socket; DictServerDictionary( string const & id, string const & name_, @@ -202,14 +219,77 @@ class DictServerDictionary: public Dictionary::Class socket.connectToHost( serverUrl.host(), port ); connect( &socket, &QTcpSocket::connected, this, [ this ]() { //initialize the description. - getServerDatabasesAfterConnect(); + QString req = QString( "SHOW DB\r\n" ); + socket.write( req.toUtf8() ); + state = DictServerState::DB; } ); - connect( &socket, &QTcpSocket::stateChanged, this, []( QAbstractSocket::SocketState state ) { - qDebug() << "socket state change: " << state; + + connect( this, &DictServerDictionary::finishDatabase, this, [ this ]() { + socket.write( QByteArray( "CLIENT GoldenDict\r\n" ) ); } ); + connect( &socket, &QTcpSocket::errorOccurred, this, []( QAbstractSocket::SocketError error ) { qDebug() << "socket error message: " << error; } ); + connect( &socket, &QTcpSocket::readyRead, this, [ this ]() { + QMutexLocker const _( &mutex ); + QByteArray reply = socket.readLine(); + qDebug() << "received:" << reply; + if ( state == DictServerState::DB ) { + + if ( reply.left( 3 ) == "110" ) { + state = DictServerState::DB_DATA; + int countPos = reply.indexOf( ' ', 4 ); + // Get databases count + int count = reply.mid( 4, countPos > 4 ? countPos - 4 : -1 ).toInt(); + + // Read databases + int x = 0; + for ( ; x < count; x++ ) { + reply = socket.readLine(); + + if ( reply.isEmpty() ) { + return; + } + reply = reply.trimmed(); + + qDebug() << "receive db:" << reply; + + if ( reply[ 0 ] == '.' ) { + state = DictServerState::DB_DATA_FINISHED; + emit finishDatabase(); + return; + } + + if ( !reply.isEmpty() ) + databases.append( reply ); + } + + qDebug() << "db count:" << x; + if ( x == count ) { + emit finishDatabase(); + } + } + } + else if ( state == DictServerState::DB_DATA ) { + while ( !reply.isEmpty() ) { + + qDebug() << "receive db:" << reply; + if ( reply[ 0 ] == '.' ) { + state = DictServerState::DB_DATA_FINISHED; + emit finishDatabase(); + return; + } + + reply = reply.trimmed(); + + if ( !reply.isEmpty() ) + databases.append( reply ); + + reply = socket.readLine(); + } + } + } ); } ~DictServerDictionary() override @@ -259,7 +339,10 @@ class DictServerDictionary: public Dictionary::Class friend class DictServerWordSearchRequest; friend class DictServerArticleRequest; - void getServerDatabasesAfterConnect(); + +private: +signals: + void finishDatabase(); }; void DictServerDictionary::loadIcon() noexcept @@ -280,93 +363,85 @@ void DictServerDictionary::loadIcon() noexcept QString const & DictServerDictionary::getDescription() { if ( dictionaryDescription.isEmpty() ) { - dictionaryDescription = QCoreApplication::translate( "DictServer", "Url: " ) + url + "\n"; - dictionaryDescription += QCoreApplication::translate( "DictServer", "Databases: " ) + databases.join( ", " ) + "\n"; + dictionaryDescription = QCoreApplication::translate( "DictServer", "Url: " ) + url + "
"; + dictionaryDescription += QCoreApplication::translate( "DictServer", "Databases: " ) + "
"; dictionaryDescription += QCoreApplication::translate( "DictServer", "Search strategies: " ) + strategies.join( ", " ); - if ( !serverDatabases.isEmpty() ) { - dictionaryDescription += "\n\n"; + if ( !databases.isEmpty() ) { + dictionaryDescription += "

"; dictionaryDescription += QCoreApplication::translate( "DictServer", "Server databases" ) + " (" - + QString::number( serverDatabases.size() ) + "):"; - for ( const auto & serverDatabase : serverDatabases ) - dictionaryDescription += "\n" + serverDatabase; + + QString::number( databases.size() ) + "):"; + for ( const auto & serverDatabase : databases ) + dictionaryDescription += "
" + serverDatabase; } } return dictionaryDescription; } -void DictServerDictionary::getServerDatabasesAfterConnect() + +class DictServerWordSearchRequest: public Dictionary::WordSearchRequest { + Q_OBJECT QAtomicInt isCancelled; + wstring word; + QString errorString; + DictServerDictionary & dict; - for ( ;; ) { - QString req = QString( "SHOW DB\r\n" ); - socket.write( req.toUtf8() ); - socket.waitForBytesWritten( 1000 ); + QStringList matchesList; + int currentStrategy = 0; + int currentDatabase = 0; - QString reply; + DictServerState state = DictServerState::START; + QString msgId; - if ( !readLine( socket, reply, errorString, isCancelled ) ) - return; + DictServerImpl * dictImpl; - if ( reply.left( 3 ) == "110" ) { - int countPos = reply.indexOf( ' ', 4 ); - // Get databases count - int count = reply.mid( 4, countPos > 4 ? countPos - 4 : -1 ).toInt(); +public: - // Read databases - for ( int x = 0; x < count; x++ ) { - if ( !readLine( socket, reply, errorString, isCancelled ) ) - break; + DictServerWordSearchRequest( wstring word_, DictServerDictionary & dict_ ): + word( std::move( word_ ) ), + dict( dict_ ), + dictImpl( new DictServerImpl( this, dict_.url ) ) + { - if ( reply[ 0 ] == '.' ) - break; + connect( this, &DictServerWordSearchRequest::finishedMatches, this, [ this ]() { + state = DictServerState::FINISHED; - while ( reply.endsWith( '\r' ) || reply.endsWith( '\n' ) ) - reply.chop( 1 ); + matchesList.removeDuplicates(); + int countn = qMin( matchesList.size(), MAX_MATCHES_COUNT ); - if ( !reply.isEmpty() ) - serverDatabases.append( reply ); + if ( countn ) { + QMutexLocker _( &dataMutex ); + for ( int x = 0; x < countn; x++ ) + matches.emplace_back( gd::toWString( matchesList.at( x ) ) ); } + finish(); + } ); - break; - } - else { - gdWarning( "Retrieving databases from \"%s\" fault: %s\n", getName().c_str(), reply.toUtf8().data() ); - break; - } - } -} - -class DictServerWordSearchRequest: public Dictionary::WordSearchRequest -{ - QAtomicInt isCancelled; - wstring word; - QString errorString; - QFuture< void > f; - DictServerDictionary & dict; - QTcpSocket * socket; - -public: + this->run(); - DictServerWordSearchRequest( wstring const & word_, DictServerDictionary & dict_ ): - word( word_ ), - dict( dict_ ), - socket( 0 ) - { - f = QtConcurrent::run( [ this ]() { - this->run(); + dictImpl->run( [ this ]() { + QString matchReq = QString( "MATCH " ) + dict.databases.at( 0 ) + " " + dict.strategies.at( 0 ) + " \"" + + QString::fromStdU32String( word ) + "\"\r\n"; + state = DictServerState::MATCH; + dictImpl->socket.write( matchReq.toUtf8() ); + currentDatabase++; } ); } void run(); - ~DictServerWordSearchRequest() override - { - f.waitForFinished(); - } + ~DictServerWordSearchRequest() override = default; void cancel() override; + + void addMatchedWord( const QString & ); + +private: + void readMatchData( QByteArray & reply ); + +signals: + void finishedMatches(); }; void DictServerWordSearchRequest::run() @@ -376,130 +451,67 @@ void DictServerWordSearchRequest::run() return; } - socket = new QTcpSocket; - - if ( !socket ) { - finish(); - return; - } + connect( &dictImpl->socket, &QTcpSocket::readyRead, this, [ this ]() { + if ( state == DictServerState::MATCH ) { + QByteArray reply = dictImpl->socket.readLine(); + qDebug() << "receive match:" << reply; + auto code = reply.left( 3 ); + if ( reply.left( 3 ) != "152" ) { - if ( connectToServer( *socket, dict.url, errorString, isCancelled ) ) { - QStringList matchesList; - - for ( int ns = 0; ns < dict.strategies.size(); ns++ ) { - for ( int i = 0; i < dict.databases.size(); i++ ) { - QString matchReq = QString( "MATCH " ) + dict.databases.at( i ) + " " + dict.strategies.at( ns ) + " \"" - + QString::fromStdU32String( word ) + "\"\r\n"; - socket->write( matchReq.toUtf8() ); - socket->waitForBytesWritten( 1000 ); - - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - QString reply; - - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; - - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - if ( reply.left( 3 ) == "250" ) { - // "OK" reply - matches info will be later - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; - - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; + if ( currentDatabase >= dict.databases.size() ) { + currentStrategy++; + currentDatabase = 0; } - - if ( reply.left( 3 ) == "552" ) { - // No matches - continue; + if ( currentStrategy >= dict.strategies.size() ) { + emit finishedMatches(); + return; } - if ( reply[ 0 ] == '5' || reply[ 0 ] == '4' ) { - // Database error - gdWarning( "Find matches in \"%s\", database \"%s\", strategy \"%s\" fault: %s\n", - dict.getName().c_str(), - dict.databases.at( i ).toUtf8().data(), - dict.strategies.at( ns ).toUtf8().data(), - reply.toUtf8().data() ); - continue; - } - - if ( reply.left( 3 ) == "152" ) { - // Matches found - int countPos = reply.indexOf( ' ', 4 ); - - // Get matches count - int count = reply.mid( 4, countPos > 4 ? countPos - 4 : -1 ).toInt(); - - // Read matches - for ( int x = 0; x <= count; x++ ) { - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; - - if ( reply[ 0 ] == '.' ) - break; - - while ( reply.endsWith( '\r' ) || reply.endsWith( '\n' ) ) - reply.chop( 1 ); - - int pos = reply.indexOf( ' ' ); - if ( pos >= 0 ) { - QString word = reply.mid( pos + 1 ); - if ( word.endsWith( '\"' ) ) - word.chop( 1 ); - if ( word[ 0 ] == '\"' ) - word = word.mid( 1 ); - - matchesList.append( word ); - } - } - if ( Utils::AtomicInt::loadAcquire( isCancelled ) || !errorString.isEmpty() ) - break; - } + QString matchReq = QString( "MATCH " ) + dict.databases.at( currentDatabase ) + " " + + dict.strategies.at( currentStrategy ) + " \"" + QString::fromStdU32String( word ) + "\"\r\n"; + state = DictServerState::MATCH; + dictImpl->socket.write( matchReq.toUtf8() ); + currentDatabase++; } + else { + state = DictServerState::MATCH_DATA; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) || !errorString.isEmpty() ) - break; - - matchesList.removeDuplicates(); - if ( matchesList.size() >= MAX_MATCHES_COUNT ) - break; + readMatchData( reply ); + } } + else if ( state == DictServerState::MATCH_DATA ) { + QByteArray reply = dictImpl->socket.readLine(); + qDebug() << "receive:" << reply; + readMatchData( reply ); + } + } ); - if ( !Utils::AtomicInt::loadAcquire( isCancelled ) && errorString.isEmpty() ) { - matchesList.removeDuplicates(); - - int count = matchesList.size(); - if ( count > MAX_MATCHES_COUNT ) - count = MAX_MATCHES_COUNT; + connect( &dictImpl->socket, &QTcpSocket::errorOccurred, this, [ this ]( QAbstractSocket::SocketError error ) { + qDebug() << "socket error message: " << error; + cancel(); + } ); +} +void DictServerWordSearchRequest::readMatchData( QByteArray & reply ) +{ + do { + reply = this->dictImpl->socket.readLine(); - if ( count ) { - QMutexLocker _( &dataMutex ); - for ( int x = 0; x < count; x++ ) - matches.emplace_back( gd::toWString( matchesList.at( x ) ) ); - } - } - } + if ( reply.isEmpty() ) + return; - if ( !errorString.isEmpty() ) - gdWarning( "Prefix find in \"%s\" fault: %s\n", dict.getName().c_str(), errorString.toUtf8().data() ); - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - socket->abort(); - else - disconnectFromServer( *socket ); + reply = reply.trimmed(); + int pos = reply.indexOf( ' ' ); + if ( pos >= 0 ) { + QString word = reply.mid( pos + 1 ); + if ( word.endsWith( '\"' ) ) + word.chop( 1 ); + if ( word[ 0 ] == '\"' ) + word = word.mid( 1 ); - delete socket; - socket = nullptr; - if ( !Utils::AtomicInt::loadAcquire( isCancelled ) ) - finish(); + this->addMatchedWord( word ); + } + } while ( true ); } void DictServerWordSearchRequest::cancel() @@ -507,36 +519,139 @@ void DictServerWordSearchRequest::cancel() isCancelled.ref(); finish(); } +void DictServer::DictServerWordSearchRequest::addMatchedWord( const QString & str ) +{ + matchesList.append( str ); + + if ( matchesList.size() >= MAX_MATCHES_COUNT ) { + emit finishedMatches(); + } +} class DictServerArticleRequest: public Dictionary::DataRequest { QAtomicInt isCancelled; wstring word; QString errorString; - QFuture< void > f; DictServerDictionary & dict; - QTcpSocket * socket; + string articleData; + + int currentDatabase = 0; + DictServerState state; + bool contentInHtml = false; + public: - DictServerArticleRequest( wstring const & word_, DictServerDictionary & dict_ ): - word( word_ ), + DictServerImpl * dictImpl; + DictServerArticleRequest( wstring word_, DictServerDictionary & dict_ ): + word( std::move( word_ ) ), dict( dict_ ), - socket( 0 ) + dictImpl( new DictServerImpl( this, dict_.url ) ) + { - f = QtConcurrent::run( [ this ]() { - this->run(); + + connect( this, &DictServerArticleRequest::finishedArticle, this, [ this ]( QString articleText ) { + if ( Utils::AtomicInt::loadAcquire( isCancelled ) || !errorString.isEmpty() ) + return; + + static QRegularExpression phonetic( R"(\\([^\\]+)\\)", + QRegularExpression::CaseInsensitiveOption ); // phonetics: \stuff\ ... + static QRegularExpression divs_inside_phonetic( "]*)>]*)>", + QRegularExpression::CaseInsensitiveOption ); + static QRegularExpression refs( R"(\{([^\{\}]+)\})", + QRegularExpression::CaseInsensitiveOption ); // links: {stuff} + static QRegularExpression links( "", + QRegularExpression::CaseInsensitiveOption ); + static QRegularExpression tags( "<[^>]*>", QRegularExpression::CaseInsensitiveOption ); + + string articleStr; + if ( contentInHtml ) + articleStr = articleText.toUtf8().data(); + else + articleStr = Html::preformat( articleText.toUtf8().data() ); + + articleText = QString::fromUtf8( articleStr.c_str(), articleStr.size() ); + int pos; + if ( !contentInHtml ) { + articleText = articleText.replace( refs, R"(\1)" ); + + pos = 0; + QString articleNewText; + + // Handle phonetics + + QRegularExpressionMatchIterator it = phonetic.globalMatch( articleText ); + while ( it.hasNext() ) { + QRegularExpressionMatch match = it.next(); + articleNewText += articleText.mid( pos, match.capturedStart() - pos ); + pos = match.capturedEnd(); + + QString phonetic_text = match.captured( 1 ); + phonetic_text.replace( divs_inside_phonetic, R"()" ); + + articleNewText += "" + phonetic_text + ""; + } + if ( pos ) { + articleNewText += articleText.mid( pos ); + articleText = articleNewText; + articleNewText.clear(); + } + + // Handle links + + pos = 0; + it = links.globalMatch( articleText ); + while ( it.hasNext() ) { + QRegularExpressionMatch match = it.next(); + articleNewText += articleText.mid( pos, match.capturedStart() - pos ); + pos = match.capturedEnd(); + + QString link = match.captured( 1 ); + link.replace( tags, " " ); + link.replace( " ", " " ); + + QString newLink = match.captured(); + newLink.replace( 30, + match.capturedLength( 1 ), + QString::fromUtf8( QUrl::toPercentEncoding( link.simplified() ) ) ); + articleNewText += newLink; + } + if ( pos ) { + articleNewText += articleText.mid( pos ); + articleText = articleNewText; + articleNewText.clear(); + } + } + + articleData += string( "
" ) + articleText.toUtf8().data() + "
"; + + + if ( !Utils::AtomicInt::loadAcquire( isCancelled ) && errorString.isEmpty() && !articleData.empty() ) { + appendString( articleData ); + + hasAnyData = true; + } + finish(); + } ); + this->run(); + + dictImpl->run( [ this ]() { + QString defineReq = + QString( "DEFINE " ) + dict.databases.at( 0 ) + " \"" + QString::fromStdU32String( word ) + "\"\r\n"; + dictImpl->socket.write( defineReq.toUtf8() ); + currentDatabase++; + + state = DictServerState::DEFINE; } ); } void run(); - ~DictServerArticleRequest() - { - f.waitForFinished(); - } + ~DictServerArticleRequest() override = default; void cancel() override; + void readData( QByteArray reply ); }; void DictServerArticleRequest::run() @@ -546,57 +661,26 @@ void DictServerArticleRequest::run() return; } - socket = new QTcpSocket; - - if ( !socket ) { - finish(); - return; - } - - if ( connectToServer( *socket, dict.url, errorString, isCancelled ) ) { - string articleData; - - for ( int i = 0; i < dict.databases.size(); i++ ) { - QString defineReq = - QString( "DEFINE " ) + dict.databases.at( i ) + " \"" + QString::fromStdU32String( word ) + "\"\r\n"; - socket->write( defineReq.toUtf8() ); - socket->waitForBytesWritten( 1000 ); - - QString reply; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; + connect( &dictImpl->socket, &QTcpSocket::readyRead, this, [ this ]() { + if ( state == DictServerState::DEFINE ) { + QByteArray reply = dictImpl->socket.readLine(); + qDebug() << "receive define:" << reply; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - if ( reply.left( 3 ) == "250" ) { - // "OK" reply - matches info will be later - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; - - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - } - - if ( reply.left( 3 ) == "552" ) { - // No matches found - continue; + auto code = reply.left( 3 ); + if ( reply.left( 3 ) != "150" ) { + if ( currentDatabase >= dict.databases.size() ) { + return; + } + QString defineReq = QString( "DEFINE " ) + dict.databases.at( currentDatabase ) + " \"" + + QString::fromStdU32String( word ) + "\"\r\n"; + dictImpl->socket.write( defineReq.toUtf8() ); + currentDatabase++; } + else { - if ( reply[ 0 ] == '5' || reply[ 0 ] == '4' ) { - // Database error - gdWarning( "Articles request from \"%s\", database \"%s\" fault: %s\n", - dict.getName().c_str(), - dict.databases.at( i ).toUtf8().data(), - reply.toUtf8().data() ); - continue; - } + state = DictServerState::DEFINE_DATA; - if ( reply.left( 3 ) == "150" ) { // Articles found int countPos = reply.indexOf( ' ', 4 ); @@ -607,195 +691,124 @@ void DictServerArticleRequest::run() // Read articles for ( int x = 0; x < count; x++ ) { - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - break; - - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; - - if ( reply.left( 3 ) == "250" ) - break; - - if ( reply.left( 3 ) == "151" ) { - int pos = 4; - int endPos; - - // Skip requested word - if ( reply[ pos ] == '\"' ) - endPos = reply.indexOf( '\"', pos + 1 ) + 1; - else - endPos = reply.indexOf( ' ', pos ); - - if ( endPos < pos ) { - // It seems mailformed string - break; - } + reply = dictImpl->socket.readLine(); + if ( reply.isEmpty() ) + return; + readData( reply ); + } + } + } + else if ( state == DictServerState::DEFINE_DATA ) { + QByteArray reply = dictImpl->socket.readLine(); + qDebug() << "receive define data:" << reply; + while ( true ) { + if ( reply.isEmpty() ) + return; + readData( reply ); + reply = dictImpl->socket.readLine(); + } + } + } ); - pos = endPos + 1; + connect( &dictImpl->socket, &QTcpSocket::errorOccurred, this, [ this ]( QAbstractSocket::SocketError error ) { + qDebug() << "socket error message: " << error; + cancel(); + } ); +} - QString dbID, dbName; +void DictServerArticleRequest::readData( QByteArray reply ) +{ - // Retrieve database ID - endPos = reply.indexOf( ' ', pos ); + if ( reply.isEmpty() ) + return; - if ( endPos < pos ) { - // It seems mailformed string - break; - } + if ( reply.left( 3 ) == "250" ) + return; - dbID = reply.mid( pos, endPos - pos ); + if ( reply.left( 3 ) == "151" ) { + int pos = 4; + int endPos; - // Retrieve database ID - pos = endPos + 1; - endPos = reply.indexOf( ' ', pos ); - if ( reply[ pos ] == '\"' ) - endPos = reply.indexOf( '\"', pos + 1 ) + 1; - else - endPos = reply.indexOf( ' ', pos ); + // Skip requested word + if ( reply[ pos ] == '\"' ) + endPos = reply.indexOf( '\"', pos + 1 ) + 1; + else + endPos = reply.indexOf( ' ', pos ); - if ( endPos < pos ) { - // It seems mailformed string - break; - } + if ( endPos < pos ) { + // It seems mailformed string + return; + } - dbName = reply.mid( pos, endPos - pos ); - if ( dbName.endsWith( '\"' ) ) - dbName.chop( 1 ); - if ( dbName[ 0 ] == '\"' ) - dbName = dbName.mid( 1 ); + pos = endPos + 1; - articleData += string( "
From " ) + dbName.toUtf8().data() + " [" - + dbID.toUtf8().data() + "]:" + "
"; + QString dbID, dbName; - // Retreive MIME headers if any + // Retrieve database ID + endPos = reply.indexOf( ' ', pos ); - static QRegularExpression contentTypeExpr( "Content-Type\\s*:\\s*text/html", - QRegularExpression::CaseInsensitiveOption ); + if ( endPos < pos ) { + // It seems mailformed string + return; + } - bool contentInHtml = false; - for ( ;; ) { - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; + dbID = reply.mid( pos, endPos - pos ); - if ( reply == "\r\n" ) - break; + // Retrieve database ID + pos = endPos + 1; + endPos = reply.indexOf( ' ', pos ); + if ( reply[ pos ] == '\"' ) + endPos = reply.indexOf( '\"', pos + 1 ) + 1; + else + endPos = reply.indexOf( ' ', pos ); - QRegularExpressionMatch match = contentTypeExpr.match( reply ); - if ( match.hasMatch() ) - contentInHtml = true; - } + if ( endPos < pos ) { + // It seems mailformed string + return; + } - // Retrieve article text + dbName = reply.mid( pos, endPos - pos ); + if ( dbName.endsWith( '\"' ) ) + dbName.chop( 1 ); + if ( dbName[ 0 ] == '\"' ) + dbName = dbName.mid( 1 ); - articleText.clear(); - for ( ;; ) { - if ( !readLine( *socket, reply, errorString, isCancelled ) ) - break; + articleData += string( "
" ) + dbName.toUtf8().data() + "
"; - if ( reply == ".\r\n" ) - break; + // Retreive MIME headers if any - articleText += reply; - } + static QRegularExpression contentTypeExpr( "Content-Type\\s*:\\s*text/html", + QRegularExpression::CaseInsensitiveOption ); - if ( Utils::AtomicInt::loadAcquire( isCancelled ) || !errorString.isEmpty() ) - break; - - static QRegularExpression phonetic( R"(\\([^\\]+)\\)", - QRegularExpression::CaseInsensitiveOption ); // phonetics: \stuff\ ... - static QRegularExpression divs_inside_phonetic( "
]*)>]*)>", - QRegularExpression::CaseInsensitiveOption ); - static QRegularExpression refs( R"(\{([^\{\}]+)\})", - QRegularExpression::CaseInsensitiveOption ); // links: {stuff} - static QRegularExpression links( "", - QRegularExpression::CaseInsensitiveOption ); - static QRegularExpression tags( "<[^>]*>", QRegularExpression::CaseInsensitiveOption ); - - string articleStr; - if ( contentInHtml ) - articleStr = articleText.toUtf8().data(); - else - articleStr = Html::preformat( articleText.toUtf8().data() ); - - articleText = QString::fromUtf8( articleStr.c_str(), articleStr.size() ); - if ( !contentInHtml ) { - articleText = articleText.replace( refs, R"(\1)" ); - - pos = 0; - QString articleNewText; - - // Handle phonetics - - QRegularExpressionMatchIterator it = phonetic.globalMatch( articleText ); - while ( it.hasNext() ) { - QRegularExpressionMatch match = it.next(); - articleNewText += articleText.mid( pos, match.capturedStart() - pos ); - pos = match.capturedEnd(); - - QString phonetic_text = match.captured( 1 ); - phonetic_text.replace( divs_inside_phonetic, R"()" ); - - articleNewText += "" + phonetic_text + ""; - } - if ( pos ) { - articleNewText += articleText.mid( pos ); - articleText = articleNewText; - articleNewText.clear(); - } - - // Handle links - - pos = 0; - it = links.globalMatch( articleText ); - while ( it.hasNext() ) { - QRegularExpressionMatch match = it.next(); - articleNewText += articleText.mid( pos, match.capturedStart() - pos ); - pos = match.capturedEnd(); - - QString link = match.captured( 1 ); - link.replace( tags, " " ); - link.replace( " ", " " ); - - QString newLink = match.captured(); - newLink.replace( 30, - match.capturedLength( 1 ), - QString::fromUtf8( QUrl::toPercentEncoding( link.simplified() ) ) ); - articleNewText += newLink; - } - if ( pos ) { - articleNewText += articleText.mid( pos ); - articleText = articleNewText; - articleNewText.clear(); - } - } + for ( ;; ) { + reply = dictImpl->socket.readLine(); + if ( reply.isEmpty() ) + return; - articleData += string( "
" ) + articleText.toUtf8().data() + "
"; - } + if ( reply == "\r\n" ) + break; - if ( Utils::AtomicInt::loadAcquire( isCancelled ) || !errorString.isEmpty() ) - break; - } - } + QRegularExpressionMatch match = contentTypeExpr.match( reply ); + if ( match.hasMatch() ) + contentInHtml = true; } - if ( !Utils::AtomicInt::loadAcquire( isCancelled ) && errorString.isEmpty() && !articleData.empty() ) { - appendString( articleData ); + QString articleText; + // Retrieve article text + + articleText.clear(); + for ( ;; ) { + reply = dictImpl->socket.readLine(); + if ( reply.isEmpty() ) + return; + + if ( reply == ".\r\n" ) { + emit finishedArticle( articleText ); + return; + } - hasAnyData = true; + articleText += reply; } } - - if ( !errorString.isEmpty() ) - gdWarning( "Articles request from \"%s\" fault: %s\n", dict.getName().c_str(), errorString.toUtf8().data() ); - - if ( Utils::AtomicInt::loadAcquire( isCancelled ) ) - socket->abort(); - else - disconnectFromServer( *socket ); - - delete socket; - socket = nullptr; - if ( !Utils::AtomicInt::loadAcquire( isCancelled ) ) - finish(); } void DictServerArticleRequest::cancel() @@ -849,5 +862,5 @@ vector< sptr< Dictionary::Class > > makeDictionaries( Config::DictServers const return result; } - -} // namespace DictServer +#include "dictserver.moc" +} // namespace DictServer \ No newline at end of file