In my program I read a lot of data from a text file and put it into a QTableWidget. Initially this was all done in the GUI thread; I then decided to multi-thread it to get better performance. On the contrary, it became significantly slower, i.e. about 8x slower! So I decided to benchmark it. Here are my files:
main.cpp
#include <QtGui/QApplication>
#include <QMutex>
#include <QDir>
#include <string>
#include <QDebug>
#include "mainwindow.h"
// Log file opened by CreateLogFile(). It stays NULL until the log is ready,
// which myMessageOutput() uses as part of its "can we log yet?" check.
QFile *logFile = NULL;
// Text stream writing to the log file; created in CreateLogFile().
QTextStream *logStream = NULL;
// Serializes writes to logStream inside myMessageOutput(); allocated in main().
QMutex *mutex = NULL;
// When *debugMode is false, QtDebugMsg messages are dropped by
// myMessageOutput(); allocated in main().
bool *debugMode = NULL;
/**
 * Qt message handler that appends messages to the global log stream.
 *
 * Messages are silently dropped until the log file, stream, mutex and debug
 * flag have all been created. Debug messages are additionally dropped when
 * *debugMode is false. Warning, critical and fatal messages are wrapped in
 * banner lines; a fatal message aborts the process after being flushed.
 *
 * @param type Severity of the message as reported by Qt.
 * @param msg  NUL-terminated message text.
 */
void myMessageOutput(QtMsgType type, const char *msg)
{
    // Every global dereferenced below must exist before we touch it.
    if (logFile == NULL || logStream == NULL || mutex == NULL || debugMode == NULL)
        return;

    // RAII lock: released on every return path, so no exit can forget unlock().
    QMutexLocker locker(mutex);

    switch (type)
    {
    case QtDebugMsg:
        if (!*debugMode)
            return;
        *logStream << msg;
        logStream->flush();
        break;
    case QtWarningMsg:
        *logStream << "\n*** Warning ***\n";
        *logStream << msg;
        *logStream << "\n*** Warning Complete ***\n";
        logStream->flush();
        break;
    case QtCriticalMsg:
        *logStream << "\n*** Critical ***\n";
        *logStream << msg;
        *logStream << "\n*** Critical Complete ***\n";
        logStream->flush();
        break;
    case QtFatalMsg:
        *logStream << "\n*** Fatal ***\n";
        *logStream << msg;
        *logStream << "\n*** Fatal Complete ***\n";
        // Flush before aborting so the fatal message reaches the file.
        logStream->flush();
        abort();
    }
}
void CreateLogFile()
{
QString path = "C:\\Users\\abcd\\Documents\\QT\\benchmark\\output.log";
QFile *file = new QFile(path);
if(file->exists())
file->remove();
if(!file->open(QFile::WriteOnly | QFile::Text))
{
qFatal("Could not create log file.");
}
logStream = new QTextStream(file);
logStream->setRealNumberNotation(QTextStream::FixedNotation);
logStream->setRealNumberPrecision(16);
logFile = file;
}
/**
 * Program entry point: prepares file logging, shows the main window, runs
 * the benchmark once and then enters the Qt event loop.
 *
 * @return Exit code of QApplication::exec().
 */
int main(int argc, char *argv[])
{
    // Create everything the message handler dereferences before installing it.
    // The debug flag is initialised at allocation so it is never read while
    // indeterminate.
    mutex = new QMutex();
    debugMode = new bool(true);

    // Open the log while Qt's default handler is still active: if this fails,
    // the qFatal() diagnostic is reported by Qt instead of being swallowed by
    // myMessageOutput(), which drops everything until the log file exists.
    CreateLogFile();
    qInstallMsgHandler(myMessageOutput);

    QApplication a(argc, argv);
    MainWindow w;
    w.show();
    w.bench2();
    return a.exec();
}
mainwindow.h
#ifndef MAINWINDOW_H
#define MAINWINDOW_H
#include <QMainWindow>
#include <QThread>
#include "multi_thread.h"
// Forward declaration of Ui::MainWindow so this header does not need the full
// definition (presumably supplied by ui_mainwindow.h, which mainwindow.cpp
// includes).
namespace Ui {
class MainWindow;
}
// Application main window. Besides owning the UI object it hosts bench2(),
// the driver that times threaded versus single-threaded table updates.
class MainWindow : public QMainWindow
{
Q_OBJECT
public:
// parent: optional parent widget, forwarded to QMainWindow.
explicit MainWindow(QWidget *parent = 0);
~MainWindow();
// Runs the three table-update benchmarks and logs each elapsed time via qDebug().
void bench2();
private:
// UI object; allocated in the constructor and deleted in the destructor.
Ui::MainWindow *ui;
};
#endif // MAINWINDOW_H
mainwindow.cpp
#include "mainwindow.h"
#include "ui_mainwindow.h"
#include <QDebug>
#include <QList>
#include <QTime>
/**
 * Constructs the main window and sets up the widgets described by
 * Ui::MainWindow.
 *
 * @param parent Optional parent widget, forwarded to QMainWindow.
 */
MainWindow::MainWindow(QWidget *parent)
    : QMainWindow(parent),
      ui(new Ui::MainWindow)
{
    ui->setupUi(this);
}
/// Releases the UI object that the constructor allocated.
MainWindow::~MainWindow()
{
    delete ui;
}
void MainWindow::bench2()
{
QTableWidget *table = new QTableWidget();
table->setRowCount(1000);
table->setColumnCount(1000);
for(int i = 0; i < 1000; i++)
{
for(int j = 0; j < 1000; j++)
table->setItem(i, j, new QTableWidgetItem());
}
Multi_Thread **multis = new Multi_Thread *[4];
QThread **thrs = new QThread *[4];
int from;
int to = -1;
QTime time;
time.start();
for(int i = 0; i < 4; i++)
{
from = to + 1;
to = from + 250;
if(i == 3)
to = 999;
multis[i] = new Multi_Thread();
multis[i]->setTable(table, from, to);
thrs[i] = new QThread();
connect(thrs[i], SIGNAL(started()), multis[i], SLOT(bench2_1()));
multis[i]->moveToThread(thrs[i]);
}
for(int i = 0; i < 4; i++)
{
if(!i)
time.start();
thrs[i]->start();
}
for(int i = 0; i < 4; i++)
{
thrs[i]->wait();
}
qDebug() << "\nbench2 1 " << time.elapsed();
for(int i = 0; i < 4; i++)
{
delete multis[i];
delete thrs[i];
}
delete[] multis;
delete[] thrs;
table->clear();
table->setRowCount(1000);
table->setColumnCount(1000);
for(int i = 0; i < 1000; i++)
{
for(int j = 0; j < 1000; j++)
table->setItem(i, j, new QTableWidgetItem());
}
time.start();
for(int i = 0; i < 1000; i++)
{
for(int j = 0; j < 1000; j++)
table->item(i, j)->setText("0");
}
qDebug() << "\nbench2 2 " << time.elapsed();
table->clear();
table->setRowCount(1000);
table->setColumnCount(1000);
QTableWidgetItem ***items = new QTableWidgetItem **[1000];
for(int i = 0; i < 1000; i++)
{
items[i] = new QTableWidgetItem *[1000];
for(int j = 0; j < 1000; j++)
{
QTableWidgetItem *item = new QTableWidgetItem();
table->setItem(i, j, item);
items[i][j] = item;
}
}
multis = new Multi_Thread *[4];
thrs = new QThread *[4];
to = -1;
for(int i = 0; i < 4; i++)
{
from = to + 1;
to = from + 250;
if(i == 3)
to = 999;
multis[i] = new Multi_Thread();
multis[i]->setItems(items, from, to);
thrs[i] = new QThread();
connect(thrs[i], SIGNAL(started()), multis[i], SLOT(bench2_2()));
multis[i]->moveToThread(thrs[i]);
}
table->blockSignals(true);
table->setUpdatesEnabled(false);
table->setWordWrap(false);
for(int i = 0; i < 4; i++)
{
if(!i)
time.start();
thrs[i]->start();
}
for(int i = 0; i < 4; i++)
{
thrs[i]->wait();
}
qDebug() << "\nbench2 3 " << time.elapsed();
table->blockSignals(false);
table->setUpdatesEnabled(true);
table->setWordWrap(true);
for(int i = 0; i < 4; i++)
{
delete multis[i];
delete thrs[i];
}
delete[] multis;
delete[] thrs;
table->clear();
for(int i = 0; i < 1000; i++)
{
delete[] items[i];
}
delete[] items;
}
multi_thread.h
#ifndef MULTI_THREAD_H
#define MULTI_THREAD_H
#include <QObject>
#include <QThread>
#include <QTableWidget>
// Worker object for the table benchmarks. It is configured with a row range
// and either a table or an item-pointer grid, then one of its slots writes
// "0" into every cell of that range.
class Multi_Thread : public QObject
{
Q_OBJECT
public:
explicit Multi_Thread();
// Selects the table used by bench2_1() and the inclusive row range [f, t].
void setTable(QTableWidget *tab, int f, int t);
// Selects the item grid used by bench2_2() and the inclusive row range [f, t].
void setItems(QTableWidgetItem ***i, int f, int t);
private:
// Table read by bench2_1(); this class declares no destructor, so it never deletes it.
QTableWidget *table;
// items[row][col] pointer grid read by bench2_2(); likewise never deleted here.
QTableWidgetItem ***items;
// First row to process (inclusive).
int from;
// Last row to process (inclusive).
int to;
signals:
public slots:
// Sets the text of every item in rows [from, to] via table->item(), then exits the current thread's event loop.
void bench2_1();
// Same as bench2_1() but reaches the items through the `items` grid.
void bench2_2();
};
#endif // MULTI_THREAD_H
multi_thread.cpp
#include "multi_thread.h"
/**
 * Creates an unconfigured worker.
 *
 * The pointers start out null and the row range starts out empty
 * (from = 0, to = -1), so running bench2_1() or bench2_2() before
 * setTable()/setItems() processes no rows instead of reading
 * uninitialised members.
 */
Multi_Thread::Multi_Thread()
    : QObject(),
      table(0),
      items(0),
      from(0),
      to(-1)
{
}
/**
 * Configures the worker for the table-based benchmark (bench2_1()).
 *
 * @param tab Table whose items will be modified.
 * @param f   First row to process (inclusive).
 * @param t   Last row to process (inclusive).
 */
void Multi_Thread::setTable(QTableWidget *tab, int f, int t)
{
    this->from = f;
    this->to = t;
    this->table = tab;
}
/**
 * Configures the worker for the pointer-grid benchmark (bench2_2()).
 *
 * @param i Grid of item pointers, indexed as i[row][column].
 * @param f First row to process (inclusive).
 * @param t Last row to process (inclusive).
 */
void Multi_Thread::setItems(QTableWidgetItem ***i, int f, int t)
{
    this->from = f;
    this->to = t;
    this->items = i;
}
void Multi_Thread::bench2_1()
{
for(int i = from; i <= to; i++)
{
for(int j = 0; j < 1000; j++)
{
table->item(i, j)->setText("0");
}
}
QThread::currentThread()->exit(0);
}
void Multi_Thread::bench2_2()
{
for(int i = from; i <= to; i++)
{
for(int j = 0; j < 1000; j++)
{
items[i][j]->setText("0");
}
}
QThread::currentThread()->exit(0);
}
output.log
bench2 1 7654
bench2 2 1160
bench2 3 8021
What is strange is that I was expecting "bench2 3" to be faster than "bench2 1".
PS: My laptop needs 4 threads to reach 100% CPU usage. Please adjust the thread count to match your own hardware; the number of processors can be found in the environment variables (e.g. NUMBER_OF_PROCESSORS on Windows).