Skip to content

Commit

Permalink
Eagerly fill LogFilteredData::filteredItemsCache_
Browse files Browse the repository at this point in the history
and progressively fill/remove items instead of completely regenerating
the whole cache.
  • Loading branch information
gin-ahirsch committed Aug 10, 2018
1 parent e64e69c commit e18d691
Show file tree
Hide file tree
Showing 7 changed files with 176 additions and 56 deletions.
163 changes: 122 additions & 41 deletions src/data/logfiltereddata.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -47,8 +47,6 @@ LogFilteredData::LogFilteredData() : AbstractLogData(),
maxLengthMarks_ = 0;
searchDone_ = true;
visibility_ = MarksAndMatches;

filteredItemsCacheDirty_ = true;
}

// Usual constructor: just copy the data, the search is started by runSearch()
Expand All @@ -72,8 +70,6 @@ LogFilteredData::LogFilteredData( const LogData* logData )

visibility_ = MarksAndMatches;

filteredItemsCacheDirty_ = true;

// Forward the update signal
connect( &workerThread_, SIGNAL( searchProgressed( int, int, qint64 ) ),
this, SLOT( handleSearchProgressed( int, int, qint64 ) ) );
Expand Down Expand Up @@ -123,7 +119,7 @@ void LogFilteredData::clearSearch()
matching_lines_.clear();
maxLength_ = 0;
nbLinesProcessed_ = 0;
filteredItemsCacheDirty_ = true;
removeAllFromFilteredItemsCache( Match );
}

qint64 LogFilteredData::getMatchingLineNumber( int matchNum ) const
Expand Down Expand Up @@ -172,11 +168,6 @@ LogFilteredData::FilteredLineType
else if ( visibility_ == MarksOnly )
return Mark;
else {
// If it is MarksAndMatches, we have to look.
// Regenerate the cache if needed
if ( filteredItemsCacheDirty_ )
regenerateFilteredItemsCache();

return filteredItemsCache_[ index ].type();
}
}
Expand All @@ -189,7 +180,7 @@ void LogFilteredData::addMark( qint64 line, QChar mark )
marks_.addMark( line, mark );
maxLengthMarks_ = qMax( maxLengthMarks_,
sourceLogData_->getLineLength( line ) );
filteredItemsCacheDirty_ = true;
insertIntoFilteredItemsCache( FilteredItem{ static_cast<LineNumber>( line ), Mark } );
}
else
LOG(logERROR) << "LogFilteredData::addMark\
Expand Down Expand Up @@ -236,53 +227,87 @@ qint64 LogFilteredData::getMarkBefore( qint64 line ) const

// Deletes the mark registered under the character `mark` and keeps the
// derived state (maxLengthMarks_ and filteredItemsCache_) in sync.
void LogFilteredData::deleteMark( QChar mark )
{
    // The marked line has to be resolved *before* the mark is deleted: it is
    // needed afterwards to refresh the maximum length and to drop the
    // corresponding entry from the cache.
    const int index = marks_.findMark( mark );
    const qint64 line = marks_.getLineMarkedByIndex( index );
    marks_.deleteMarkAt( index );

    if ( line < 0 ) {
        // LOG(logWARNING)?
        // NOTE(review): a negative line presumably means the mark was not
        // set -- confirm against Marks::getLineMarkedByIndex.
        return;
    }

    updateMaxLengthMarks( line );
    removeFromFilteredItemsCache( FilteredItem{ static_cast<LineNumber>( line ), Mark } );
}

// Deletes the mark set on `line` and keeps the derived state
// (maxLengthMarks_ and filteredItemsCache_) in sync.
void LogFilteredData::deleteMark( qint64 line )
{
    marks_.deleteMark( line );

    // Logs a warning and does nothing for a negative line.
    updateMaxLengthMarks( line );

    // Never hand a negative line to the cache: the cast below would turn it
    // into a bogus line number.
    // NOTE(review): assumes LineNumber is an unsigned type -- confirm.
    if ( line < 0 )
        return;

    removeFromFilteredItemsCache( FilteredItem{ static_cast<LineNumber>( line ), Mark } );
}

// Refreshes maxLengthMarks_ after the mark on `removed_line` was deleted.
// The maximum is only recomputed when the removed line was at least as long
// as the current maximum; otherwise the stored value is still valid.
void LogFilteredData::updateMaxLengthMarks( qint64 removed_line )
{
    if ( removed_line < 0 ) {
        LOG(logWARNING) << "updateMaxLengthMarks called with negative line-number";
        return;
    }

    // Now update the max length if needed
    if ( sourceLogData_->getLineLength( removed_line ) >= maxLengthMarks_ ) {
        LOG(logDEBUG) << "deleteMark recalculating longest mark";
        maxLengthMarks_ = 0;
        // Rescan the remaining marks for the longest marked line.
        for ( const auto& mark : marks_ ) {
            LOG(logDEBUG) << "line " << mark.lineNumber();
            maxLengthMarks_ = qMax( maxLengthMarks_,
                    sourceLogData_->getLineLength( mark.lineNumber() ) );
        }
    }
}

// Removes every mark, resets the longest-marked-line length and strips the
// Mark type from the filtered-items cache.
void LogFilteredData::clearMarks()
{
    marks_.clear();
    maxLengthMarks_ = 0;
    // The cache is updated eagerly, there is no dirty flag to raise.
    removeAllFromFilteredItemsCache( Mark );
}

// Selects which kind of lines (marks, matches or both) this object exposes.
// The combined cache is only used for MarksAndMatches, so that is the only
// mode in which it is (re)built here.
void LogFilteredData::setVisibility( Visibility visi )
{
    visibility_ = visi;

    const bool needsCombinedCache = ( visi == MarksAndMatches );
    if ( needsCombinedCache ) {
        regenerateFilteredItemsCache();
    }
}

//
// Slots
//
// Slot called when the worker thread reports search progress.
// Fetches the matches found since the previous call, adds them to the
// filtered-items cache and forwards the progress signal.
void LogFilteredData::handleSearchProgressed( int nbMatches, int progress, qint64 initial_position )
{
    using std::begin;
    using std::end;
    using std::next;

    LOG(logDEBUG) << "LogFilteredData::handleSearchProgressed matches="
        << nbMatches << " progress=" << progress;

    // searchDone_ = true;
    assert( nbMatches >= 0 );

    // Must be captured *before* the update: everything from this index
    // onwards is new and still has to be inserted into the cache.
    const size_t start_index = matching_lines_.size();

    workerThread_.updateSearchResult( &maxLength_, &matching_lines_, &nbLinesProcessed_ );

    assert( matching_lines_.size() >= start_index );

    filteredItemsCache_.reserve( matching_lines_.size() + marks_.size() );
    // (it's an overestimate but probably not by much so it's fine)

    for ( auto it = next( begin( matching_lines_ ), start_index ); it != end( matching_lines_ ); ++it ) {
        insertIntoFilteredItemsCache( FilteredItem{ it->lineNumber(), Match } );
    }

    emit searchProgressed( nbMatches, progress, initial_position );
}
Expand All @@ -305,10 +330,6 @@ LineNumber LogFilteredData::findLogDataLine( LineNumber lineNum ) const
LOG(logERROR) << "Index too big in LogFilteredData: " << lineNum;
}
else {
// Regenerate the cache if needed
if ( filteredItemsCacheDirty_ )
regenerateFilteredItemsCache();

if ( lineNum < filteredItemsCache_.size() )
line = filteredItemsCache_[ lineNum ].lineNumber();
else
Expand All @@ -333,11 +354,6 @@ LineNumber LogFilteredData::findFilteredLine( LineNumber lineNum ) const
lineNum );
}
else {
// Regenerate the cache if needed
if ( filteredItemsCacheDirty_ ) {
regenerateFilteredItemsCache();
}

lineIndex = lookupLineNumber( filteredItemsCache_.begin(),
filteredItemsCache_.end(),
lineNum );
Expand Down Expand Up @@ -398,10 +414,6 @@ qint64 LogFilteredData::doGetNbLine() const
else if ( visibility_ == MarksOnly )
nbLines = marks_.size();
else {
// Regenerate the cache if needed (hopefully most of the time
// it won't be necessarily)
if ( filteredItemsCacheDirty_ )
regenerateFilteredItemsCache();
nbLines = filteredItemsCache_.size();
}

Expand Down Expand Up @@ -439,13 +451,16 @@ void LogFilteredData::doSetMultibyteEncodingOffsets( int, int )
{
}

// TODO: We might be a bit smarter and not regenerate the whole thing when
// e.g. stuff is added at the end of the search.
void LogFilteredData::regenerateFilteredItemsCache() const
{
LOG(logDEBUG) << "regenerateFilteredItemsCache";

filteredItemsCache_.clear();
if ( filteredItemsCache_.size() > 0 ) {
// the cache was not invalidated, so we can keep it
LOG(logDEBUG) << "cache was not invalidated";
return;
}

filteredItemsCache_.reserve( matching_lines_.size() + marks_.size() );
// (it's an overestimate but probably not by much so it's fine)

Expand Down Expand Up @@ -474,7 +489,73 @@ void LogFilteredData::regenerateFilteredItemsCache() const
filteredItemsCache_.push_back( FilteredItem( line, type ) );
}

filteredItemsCacheDirty_ = false;

LOG(logDEBUG) << "finished regenerateFilteredItemsCache";
}

// Adds `item` to the filtered-items cache, keeping the cache ordered.
// If the cache already holds an entry for the same line, the type of `item`
// is merged into that entry instead of inserting a second one.
void LogFilteredData::insertIntoFilteredItemsCache( FilteredItem item )
{
    // Outside of MarksAndMatches the cache is simply dropped; it gets
    // rebuilt once that visibility is selected again.
    if ( visibility_ != MarksAndMatches ) {
        // this is invalidated and will be regenerated when we need it
        filteredItemsCache_.clear();
        LOG(logDEBUG) << "cache is invalidated";
        return;
    }

    // First entry that does not order before `item`.
    const auto position = std::lower_bound( filteredItemsCache_.begin(),
                                            filteredItemsCache_.end(), item );

    const bool lineAlreadyCached = ( position != filteredItemsCache_.end() )
        && !( position->lineNumber() > item.lineNumber() );

    if ( lineAlreadyCached ) {
        assert( position->lineNumber() == item.lineNumber() );
        position->add( item.type() );
    }
    else {
        filteredItemsCache_.insert( position, item );
    }
}

// Removes the type of `item` from the cache entry of the same line; the
// entry itself is erased when remove() reports that nothing is left of it.
// Logs an error and leaves the cache untouched if the line is not cached.
void LogFilteredData::removeFromFilteredItemsCache( FilteredItem item )
{
    using std::begin;
    using std::distance;
    using std::end;

    if ( visibility_ != MarksAndMatches ) {
        // this is invalidated and will be regenerated when we need it
        filteredItemsCache_.clear();
        LOG(logDEBUG) << "cache is invalidated";
        return;
    }

    // Search for the corresponding index.
    auto found = std::equal_range( begin( filteredItemsCache_ ), end( filteredItemsCache_ ), item );

    // equal_range signals "not found" with an empty range (first == second).
    // `first` then points at the next greater entry, which is only end() when
    // the line lies past the last cached entry -- so comparing against end()
    // alone would let us modify an unrelated entry.
    if ( found.first == found.second ) {
        LOG(logERROR) << "Attempt to remove line " << item.lineNumber() << " from filteredItemsCache_ failed, since it was not found";
        return;
    }

    if ( distance( found.first, found.second ) > 1 ) {
        LOG(logERROR) << "Multiple matches found for line " << item.lineNumber() << " in filteredItemsCache_";
        // FIXME: collapse them?
    }

    if ( !found.first->remove( item.type() ) ) {
        filteredItemsCache_.erase( found.first );
    }
}

// Strips `type` from every cache entry and drops the entries for which
// remove() returns false (the same signal removeFromFilteredItemsCache uses
// to erase an entry). The relative order of the remaining entries is kept.
void LogFilteredData::removeAllFromFilteredItemsCache( FilteredLineType type )
{
    if ( visibility_ != MarksAndMatches ) {
        // this is invalidated and will be regenerated when we need it
        filteredItemsCache_.clear();
        LOG(logDEBUG) << "cache is invalidated";
        return;
    }

    // Explicit in-place compaction instead of std::remove_if: the predicate
    // of a standard algorithm must not modify the elements it inspects, and
    // remove() does modify them.
    auto keep = filteredItemsCache_.begin();
    for ( auto it = filteredItemsCache_.begin(); it != filteredItemsCache_.end(); ++it ) {
        if ( it->remove( type ) ) {
            if ( keep != it )
                *keep = *it;
            ++keep;
        }
    }
    filteredItemsCache_.erase( keep, filteredItemsCache_.end() );
}
7 changes: 6 additions & 1 deletion src/data/logfiltereddata.h
Original file line number Diff line number Diff line change
Expand Up @@ -156,7 +156,6 @@ class LogFilteredData : public AbstractLogData {
// when visibility_ == MarksAndMatches
// (QVector store actual objects instead of pointers)
mutable std::vector<FilteredItem> filteredItemsCache_;
mutable bool filteredItemsCacheDirty_;

LogFilteredDataWorkerThread workerThread_;
Marks marks_;
Expand All @@ -166,6 +165,12 @@ class LogFilteredData : public AbstractLogData {
LineNumber findFilteredLine( LineNumber lineNum ) const;

void regenerateFilteredItemsCache() const;
void insertIntoFilteredItemsCache( FilteredItem item );
void removeFromFilteredItemsCache( FilteredItem item );
void removeAllFromFilteredItemsCache( FilteredLineType type );

// update maxLengthMarks_ when a Mark was removed.
void updateMaxLengthMarks( qint64 removed_line );
};

inline LogFilteredData::FilteredLineType& operator|=(LogFilteredData::FilteredLineType& a, LogFilteredData::FilteredLineType b)
Expand Down
25 changes: 21 additions & 4 deletions src/data/logfiltereddataworkerthread.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -28,15 +28,32 @@
const int SearchOperation::nbLinesInChunk = 5000;

void SearchData::getAll( int* length, SearchResultArray* matches,
qint64* lines) const
qint64* lines ) const
{
matches->clear();
getAllMissing( length, matches, lines );
}

void SearchData::getAllMissing( int* length, SearchResultArray* matches,
qint64* lines ) const
{
QMutexLocker locker( &dataMutex_ );


*length = maxLength_;
*lines = nbLinesProcessed_;

if ( matches_.size() < matches->size() ) {
LOG(logWARNING) << "Cannot append search-data to smaller match-array";
return;
}

matches->reserve( matches_.size() - matches->size() );

// This is a copy (potentially slow)
*matches = matches_;
size_t offset = matches->size();
std::insert_iterator<SearchResultArray> inserter{ *matches, next( begin( *matches ), offset ) };
copy( next( begin( matches_ ), offset ), end( matches_ ), inserter );
}

void SearchData::setAll( int length,
Expand Down Expand Up @@ -167,10 +184,10 @@ void LogFilteredDataWorkerThread::interrupt()
}

// This will do an atomic copy of the object
void LogFilteredDataWorkerThread::getSearchResult(
void LogFilteredDataWorkerThread::updateSearchResult(
int* maxLength, SearchResultArray* searchMatches, qint64* nbLinesProcessed )
{
searchData_.getAll( maxLength, searchMatches, nbLinesProcessed );
searchData_.getAllMissing( maxLength, searchMatches, nbLinesProcessed );
}

// This is the thread's main loop
Expand Down
8 changes: 6 additions & 2 deletions src/data/logfiltereddataworkerthread.h
Original file line number Diff line number Diff line change
Expand Up @@ -63,6 +63,10 @@ class SearchData
// Atomically get all the search data
void getAll( int* length, SearchResultArray* matches,
qint64* nbLinesProcessed ) const;
// Atomically get all the search data
// Appends the missing entries. Does not check that the existing entries match.
void getAllMissing( int* length, SearchResultArray* matches,
qint64* lines ) const;
// Atomically set all the search data
// (overwriting the existing)
// (the matches are always moved)
Expand Down Expand Up @@ -155,8 +159,8 @@ class LogFilteredDataWorkerThread : public QThread
// Interrupts the search if one is in progress
void interrupt();

// Returns a copy of the current indexing data
void getSearchResult( int* maxLength, SearchResultArray* searchMatches,
// Updates the array by copying the current indexing data
void updateSearchResult( int* maxLength, SearchResultArray* searchMatches,
qint64* nbLinesProcessed );

signals:
Expand Down
2 changes: 1 addition & 1 deletion src/log.h
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
#include <cstdio>

// Modify here!
//#define FILELOG_MAX_LEVEL logDEBUG
// #define FILELOG_MAX_LEVEL logDEBUG

inline std::string NowTime();

Expand Down
Loading

0 comments on commit e18d691

Please sign in to comment.