Skip to content

Commit e87ed37

Browse files
Merged in cbillington/lyse/feature (pull request labscript-suite#40)
Performance optimisation. Approved-by: Jan Werkmann <jan.wrk.fb@gmail.com>
2 parents 5e61815 + 3284773 commit e87ed37

File tree

1 file changed

+76
-57
lines changed

1 file changed

+76
-57
lines changed

__main__.py

+76-57
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@
4646

4747
from qtutils.qt import QtCore, QtGui, QtWidgets
4848
from qtutils.qt.QtCore import pyqtSignal as Signal
49-
from qtutils import inmain_decorator, UiLoader, DisconnectContextManager
49+
from qtutils import inmain_decorator, inmain, UiLoader, DisconnectContextManager
5050
from qtutils.outputbox import OutputBox
5151
from qtutils.auto_scroll_to_end import set_auto_scroll_to_end
5252
import qtutils.icons
@@ -1143,6 +1143,8 @@ def __init__(self, view, exp_config):
11431143
self._view = view
11441144
self.exp_config = exp_config
11451145
self._model = UneditableModel()
1146+
self.row_number_by_filepath = {}
1147+
self._previous_n_digits = 0
11461148

11471149
headerview_style = """
11481150
QHeaderView {
@@ -1213,17 +1215,6 @@ def connect_signals(self):
12131215
self._view.customContextMenuRequested.connect(self.on_view_context_menu_requested)
12141216
self.action_remove_selected.triggered.connect(self.on_remove_selection)
12151217

1216-
def get_model_row_by_filepath(self, filepath):
1217-
filepath_colname = ('filepath',) + ('',) * (self.nlevels - 1)
1218-
possible_items = self._model.findItems(filepath, column=self.column_indices[filepath_colname])
1219-
if len(possible_items) > 1:
1220-
raise LookupError('Multiple items found')
1221-
elif not possible_items:
1222-
raise LookupError('No item found')
1223-
item = possible_items[0]
1224-
index = item.index()
1225-
return index.row()
1226-
12271218
def on_remove_selection(self):
12281219
self.remove_selection()
12291220

@@ -1325,8 +1316,8 @@ def mark_as_deleted_off_disk(self, filepath):
13251316
# Shot has been removed from FileBox, nothing to do here:
13261317
return
13271318

1328-
model_row_number = self.get_model_row_by_filepath(filepath)
1329-
status_item = self._model.item(model_row_number, self.COL_STATUS)
1319+
row_number = self.row_number_by_filepath[filepath]
1320+
status_item = self._model.item(row_number, self.COL_STATUS)
13301321
already_marked_as_deleted = status_item.data(self.ROLE_DELETED_OFF_DISK)
13311322
if already_marked_as_deleted:
13321323
return
@@ -1350,38 +1341,40 @@ def update_row(self, filepath, dataframe_already_updated=False, status_percent=N
13501341
if (new_row_data is None) == (updated_row_data is None) and not dataframe_already_updated:
13511342
raise ValueError('Exactly one of new_row_data or updated_row_data must be provided')
13521343

1353-
df_row_index = np.where(self.dataframe['filepath'].values == filepath)
13541344
try:
1355-
df_row_index = df_row_index[0][0]
1356-
except IndexError:
1345+
row_number = self.row_number_by_filepath[filepath]
1346+
except KeyError:
13571347
# Row has been deleted, nothing to do here:
13581348
return
13591349

1350+
filepath_colname = ('filepath',) + ('',) * (self.nlevels - 1)
1351+
assert filepath == self.dataframe.get_value(row_number, filepath_colname)
1352+
13601353
if updated_row_data is not None and not dataframe_already_updated:
13611354
for group, name in updated_row_data:
13621355
column_name = (group, name) + ('',) * (self.nlevels - 2)
13631356
value = updated_row_data[group, name]
13641357
try:
1365-
self.dataframe.set_value(df_row_index, column_name, value)
1358+
self.dataframe.set_value(row_number, column_name, value)
13661359
except ValueError:
13671360
# did the column not already exist when we tried to set an iterable?
13681361
if not column_name in self.dataframe.columns:
13691362
# create it with a non-iterable and then overwrite with the iterable value:
1370-
self.dataframe.set_value(df_row_index, column_name, None)
1363+
self.dataframe.set_value(row_number, column_name, None)
13711364
else:
13721365
# Incompatible datatype - convert the datatype of the column to
13731366
# 'object'
13741367
self.dataframe[column_name] = self.dataframe[column_name].astype('object')
13751368
# Now that the column exists and has dtype object, we can set the value:
1376-
self.dataframe.set_value(df_row_index, column_name, value)
1369+
self.dataframe.set_value(row_number, column_name, value)
13771370

13781371
dataframe_already_updated = True
13791372

13801373
if not dataframe_already_updated:
13811374
if new_row_data is None:
13821375
raise ValueError("If dataframe_already_updated is False, then new_row_data, as returned "
13831376
"by dataframe_utils.get_dataframe_from_shot(filepath) must be provided.")
1384-
self.dataframe = replace_with_padding(self.dataframe, new_row_data, df_row_index)
1377+
self.dataframe = replace_with_padding(self.dataframe, new_row_data, row_number)
13851378
self.update_column_levels()
13861379

13871380
# Check and create necessary new columns in the Qt model:
@@ -1433,20 +1426,13 @@ def update_row(self, filepath, dataframe_already_updated=False, status_percent=N
14331426
self.column_indices = {name: index for index, name in self.column_names.items()}
14341427

14351428
# Update the data in the Qt model:
1436-
model_row_number = self.get_model_row_by_filepath(filepath)
1437-
dataframe_row = self.dataframe.iloc[df_row_index].to_dict()
1429+
dataframe_row = self.dataframe.iloc[row_number].to_dict()
14381430
for column_number, column_name in self.column_names.items():
14391431
if not isinstance(column_name, tuple):
14401432
# One of our special columns, does not correspond to a column in the dataframe:
14411433
continue
14421434
if updated_row_data is not None and column_name not in updated_row_data:
14431435
continue
1444-
item = self._model.item(model_row_number, column_number)
1445-
if item is None:
1446-
# This is the first time we've written a value to this part of the model:
1447-
item = QtGui.QStandardItem('NaN')
1448-
item.setData(QtCore.Qt.AlignCenter, QtCore.Qt.TextAlignmentRole)
1449-
self._model.setItem(model_row_number, column_number, item)
14501436
value = dataframe_row[column_name]
14511437
if isinstance(value, float):
14521438
value_str = scientific_notation(value)
@@ -1457,7 +1443,15 @@ def update_row(self, filepath, dataframe_already_updated=False, status_percent=N
14571443
short_value_str = lines[0] + ' ...'
14581444
else:
14591445
short_value_str = value_str
1460-
item.setText(short_value_str)
1446+
1447+
item = self._model.item(row_number, column_number)
1448+
if item is None:
1449+
# This is the first time we've written a value to this part of the model:
1450+
item = QtGui.QStandardItem(short_value_str)
1451+
item.setData(QtCore.Qt.AlignCenter, QtCore.Qt.TextAlignmentRole)
1452+
self._model.setItem(row_number, column_number, item)
1453+
else:
1454+
item.setText(short_value_str)
14611455
item.setToolTip(repr(value))
14621456

14631457
for i, column_name in enumerate(sorted(new_column_names)):
@@ -1466,7 +1460,7 @@ def update_row(self, filepath, dataframe_already_updated=False, status_percent=N
14661460
self._view.resizeColumnToContents(column_number)
14671461

14681462
if status_percent is not None:
1469-
status_item = self._model.item(model_row_number, self.COL_STATUS)
1463+
status_item = self._model.item(row_number, self.COL_STATUS)
14701464
status_item.setData(status_percent, self.ROLE_STATUS_PERCENT)
14711465

14721466
if new_column_names or defunct_column_names:
@@ -1483,15 +1477,29 @@ def new_row(self, filepath):
14831477
name_item = QtGui.QStandardItem(filepath)
14841478
return [status_item, name_item]
14851479

1486-
def renumber_rows(self):
1487-
"""Add/update row indices - the rows are numbered in simple sequential order
1488-
for easy comparison with the dataframe"""
1480+
def renumber_rows(self, add_from=0):
1481+
"""Add/update row indices - the rows are numbered in simple sequential
1482+
order for easy comparison with the dataframe. add_from allows you to
1483+
only add numbers for new rows from the given index as a performance
1484+
optimisation, though if the number of digits changes, all rows will
1485+
still be renumbered. add_from should not be used if rows have been
1486+
deleted."""
14891487
n_digits = len(str(self._model.rowCount()))
1490-
print(self._model.rowCount())
1491-
for row_number in range(self._model.rowCount()):
1488+
if n_digits != self._previous_n_digits:
1489+
# All labels must be updated:
1490+
add_from = 0
1491+
self._previous_n_digits = n_digits
1492+
1493+
if add_from == 0:
1494+
self.row_number_by_filepath = {}
1495+
1496+
for row_number in range(add_from, self._model.rowCount()):
14921497
vertical_header_item = self._model.verticalHeaderItem(row_number)
14931498
row_number_str = str(row_number).rjust(n_digits)
14941499
vert_header_text = '{}. |'.format(row_number_str)
1500+
filepath_item = self._model.item(row_number, self.COL_FILEPATH)
1501+
filepath = filepath_item.text()
1502+
self.row_number_by_filepath[filepath] = row_number
14951503
if self.integer_indexing:
14961504
header_cols = ['sequence_index', 'run number', 'run repeat']
14971505
header_strings = []
@@ -1503,8 +1511,6 @@ def renumber_rows(self):
15031511
header_strings.append('----')
15041512
vert_header_text += ' |'.join(header_strings)
15051513
else:
1506-
filepath_item = self._model.item(row_number, self.COL_FILEPATH)
1507-
filepath = filepath_item.text()
15081514
basename = os.path.splitext(os.path.basename(filepath))[0]
15091515
vert_header_text += ' ' + basename
15101516
vertical_header_item.setText(vert_header_text)
@@ -1518,7 +1524,7 @@ def add_files(self, filepaths, new_row_data):
15181524

15191525
# Check for duplicates:
15201526
for filepath in filepaths:
1521-
if filepath in self.dataframe['filepath'].values or filepath in to_add:
1527+
if filepath in self.row_number_by_filepath or filepath in to_add:
15221528
app.output_box.output('Warning: Ignoring duplicate shot %s\n' % filepath, red=True)
15231529
if new_row_data is not None:
15241530
df_row_index = np.where(new_row_data['filepath'].values == filepath)
@@ -1529,19 +1535,26 @@ def add_files(self, filepaths, new_row_data):
15291535

15301536
assert len(new_row_data) == len(to_add)
15311537

1538+
if to_add:
1539+
# Update the dataframe:
1540+
self.dataframe = concat_with_padding(self.dataframe, new_row_data)
1541+
self.update_column_levels()
1542+
1543+
app.filebox.set_add_shots_progress(None, None, "updating filebox")
1544+
15321545
for filepath in to_add:
1533-
# Add the new rows to the model:
1546+
# Add the new rows to the Qt model:
15341547
self._model.appendRow(self.new_row(filepath))
15351548
vert_header_item = QtGui.QStandardItem('...loading...')
15361549
self._model.setVerticalHeaderItem(self._model.rowCount() - 1, vert_header_item)
15371550
self._view.resizeRowToContents(self._model.rowCount() - 1)
15381551

1539-
if to_add:
1540-
self.dataframe = concat_with_padding(self.dataframe, new_row_data)
1541-
self.update_column_levels()
1542-
for filepath in to_add:
1543-
self.update_row(filepath, dataframe_already_updated=True)
1544-
self.renumber_rows()
1552+
self.renumber_rows(add_from=self._model.rowCount()-len(to_add))
1553+
1554+
# Update the Qt model:
1555+
for filepath in to_add:
1556+
self.update_row(filepath, dataframe_already_updated=True)
1557+
15451558

15461559
@inmain_decorator()
15471560
def get_first_incomplete(self):
@@ -1667,14 +1680,20 @@ def set_columns_visible(self, columns_visible):
16671680
self.shots_model.set_columns_visible(columns_visible)
16681681

16691682
@inmain_decorator()
1670-
def set_add_shots_progress(self, completed, total):
1671-
if completed == total:
1683+
def set_add_shots_progress(self, completed, total, message):
1684+
self.ui.progressBar_add_shots.setFormat("Adding shots: [{}] %v/%m (%p%)".format(message))
1685+
if completed == total and message is None:
16721686
self.ui.progressBar_add_shots.hide()
16731687
else:
1674-
self.ui.progressBar_add_shots.setMaximum(total)
1675-
self.ui.progressBar_add_shots.setValue(completed)
1688+
if total is not None:
1689+
self.ui.progressBar_add_shots.setMaximum(total)
1690+
if completed is not None:
1691+
self.ui.progressBar_add_shots.setValue(completed)
16761692
if self.ui.progressBar_add_shots.isHidden():
16771693
self.ui.progressBar_add_shots.show()
1694+
if completed is None and total is None and message is not None:
1695+
# Ensure a repaint when only the message changes:
1696+
self.ui.progressBar_add_shots.repaint()
16781697

16791698
def incoming_buffer_loop(self):
16801699
"""We use a queue as a buffer for incoming shots. We don't want to hang and not
@@ -1698,19 +1717,21 @@ def incoming_buffer_loop(self):
16981717
if self.incoming_queue.qsize() == 0:
16991718
# Wait momentarily in case more arrive so we can batch process them:
17001719
time.sleep(0.1)
1720+
# Batch process to decrease number of dataframe concatenations:
1721+
batch_size = len(self.shots_model.dataframe) // 3 + 1
17011722
while True:
17021723
try:
17031724
filepath = self.incoming_queue.get(False)
17041725
except queue.Empty:
17051726
break
17061727
else:
17071728
filepaths.append(filepath)
1708-
if len(filepaths) >= 5:
1729+
if len(filepaths) >= batch_size:
17091730
break
17101731
logger.info('adding:\n%s' % '\n'.join(filepaths))
17111732
if n_shots_added == 0:
17121733
total_shots = self.incoming_queue.qsize() + len(filepaths)
1713-
self.set_add_shots_progress(1, total_shots)
1734+
self.set_add_shots_progress(1, total_shots, "reading shot files")
17141735

17151736
# Remove duplicates from the list (preserving order) in case the
17161737
# client sent the same filepath multiple times:
@@ -1728,15 +1749,12 @@ def incoming_buffer_loop(self):
17281749
n_shots_added += 1
17291750
shots_remaining = self.incoming_queue.qsize()
17301751
total_shots = n_shots_added + shots_remaining + len(filepaths) - (i + 1)
1731-
if i != len(filepaths) - 1:
1732-
# Leave the last update until after dataframe concatenation.
1733-
# Looks more responsive that way:
1734-
self.set_add_shots_progress(n_shots_added, total_shots)
1752+
self.set_add_shots_progress(n_shots_added, total_shots, "reading shot files")
1753+
self.set_add_shots_progress(n_shots_added, total_shots, "concatenating dataframes")
17351754
if dataframes:
17361755
new_row_data = concat_with_padding(*dataframes)
17371756
else:
17381757
new_row_data = None
1739-
self.set_add_shots_progress(n_shots_added, total_shots)
17401758

17411759
# Do not add the shots that were not found on disk. Reverse
17421760
# loop so that removing an item doesn't change the indices of
@@ -1748,6 +1766,7 @@ def incoming_buffer_loop(self):
17481766
# Let the analysis loop know to look for new shots:
17491767
self.analysis_pending.set()
17501768
if shots_remaining == 0:
1769+
self.set_add_shots_progress(n_shots_added, total_shots, None)
17511770
n_shots_added = 0 # reset our counter for the next batch
17521771

17531772
except Exception:

0 commit comments

Comments
 (0)