diff --git a/.travis.yml b/.travis.yml index b642b91..095230c 100644 --- a/.travis.yml +++ b/.travis.yml @@ -8,11 +8,28 @@ virtualenv: before_install: - sudo apt-get update - -install: - if [[ $TRAVIS_PYTHON_VERSION == 2.7 ]]; then - sudo apt-get install --fix-missing python-opencv python-numpy python-pyside libtiff4-dev libjpeg8-dev zlib1g-dev libzbar-dev; + sudo apt-get install -y --fix-missing libzbar-dev; + fi + + # We do this conditionally because it saves us some downloading if the + # version is the same. + - if [[ "$TRAVIS_PYTHON_VERSION" == "2.7" ]]; then + wget https://repo.continuum.io/miniconda/Miniconda2-latest-Linux-x86_64.sh -O miniconda.sh; fi + - bash miniconda.sh -b -p $HOME/miniconda + - export PATH="$HOME/miniconda/bin:$PATH" + - hash -r + - conda config --set always_yes yes --set changeps1 no + - conda update --yes conda + # Useful for debugging any issues with conda + - conda info -a + + - conda create -q -n test-environment python=$TRAVIS_PYTHON_VERSION pillow pyside numpy scikit-learn opencv + - source activate test-environment + - python setup.py install + +install: - pip install -r requirements.txt - "export DISPLAY=:99.0" - "sh -e /etc/init.d/xvfb start" diff --git a/CHANGELOG.md b/CHANGELOG.md index 5d95c5f..a1fe86e 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -2,10 +2,12 @@ This is an overview of major changes. Refer to the git repository for a full log Version 0.1.28 ------------- +- Fixed #291 - Alter travis to use Anaconda / Miniconda - Fixed #288 - Minimap navigator - Fixed #286 - Disable default template command when the default template selected - Fixed #284 - Document info view to contain links - Fixed #281 - Don't make images read-only +- Fixed #212 - Customized bounding box ordering - Fixed #204 - Improvements to subsegment dots - Fixed #203 - Resize handles should have constant size regardless of zoom diff --git a/DevelopingOnMacOSX.md b/DevelopingOnMacOSX.md index aea171a..036dd96 100644 --- a/DevelopingOnMacOSX.md +++ b/DevelopingOnMacOSX.md @@ -35,19 +35,24 @@ cd ~/projects/inselect pip install -r requirements.txt ``` -# OpenCV -`numpy` is pinned by opencv installation +## OpenCV +Version of `numpy` is pinned by opencv installation but we want latest version - +I have not encountered any problems by installing the latest version. +`jjhelmus` provides versions after `2.4.10` but these make the Mac build +extremely problematic by introducing many `dylib` dependencies that are +troublesome to freeze. ``` -conda install --yes -c https://conda.binstar.org/jjhelmus opencv +conda install --yes -c https://conda.binstar.org/jjhelmus opencv=2.4.10 +conda install --yes numpy ``` -# setuptools +## setuptools A [bug in PyInstaller 3.1.1](https://github.com/pyinstaller/pyinstaller/issues/1773) means that we need to use setupools 19.2: ``` -conda install setuptools=19.2 +conda install --yes setuptools=19.2 ``` ## LibDMTX barcode reading library diff --git a/DevelopingOnWindows.md b/DevelopingOnWindows.md index 47c0d1f..49be4d1 100644 --- a/DevelopingOnWindows.md +++ b/DevelopingOnWindows.md @@ -25,7 +25,7 @@ follows: ``` conda update --yes conda -conda create --yes --name inselect pillow pyside pywin32 numpy +conda create --yes --name inselect pillow pyside pywin32 numpy scikit-learn activate inselect python -m pip install --upgrade pip pip install -r requirements.txt @@ -92,7 +92,7 @@ follows: ``` conda update --yes conda -conda create --yes --name inselect pillow pyside pywin32 numpy +conda create --yes --name inselect pillow pyside pywin32 numpy scikit-learn activate inselect python -m pip install --upgrade pip pip install -r requirements.txt diff --git a/build.sh b/build.sh index decfd34..0655735 100755 --- a/build.sh +++ b/build.sh @@ -24,10 +24,14 @@ if [[ "$OSTYPE" == "darwin"* ]]; then rm -rf build dist pyinstaller --clean inselect.spec - for script in export_metadata ingest read_barcodes save_crops segment; do + for script in export_metadata ingest read_barcodes save_crops; do rm -rf $script.spec - pyinstaller --onefile --icon=data/inselect.icns inselect/scripts/$script.py + pyinstaller --onefile --hidden-import numpy inselect/scripts/$script.py done + # segment has an additional hidden import + rm -rf segment.spec + pyinstaller --onefile --hidden-import numpy \ + --hidden-import sklearn.neighbors.typedefs inselect/scripts/segment.py # Add a few items to the PropertyList file generated by PyInstaller python -m bin.plist dist/inselect.app/Contents/Info.plist diff --git a/inselect.spec b/inselect.spec index 34c8815..e1f77b9 100644 --- a/inselect.spec +++ b/inselect.spec @@ -1,6 +1,7 @@ # For PyInstaller build on Mac import sys + from pathlib import Path block_cipher = None @@ -9,7 +10,7 @@ a = Analysis(['inselect.py'], pathex=[str(Path('.').absolute())], binaries=None, datas=None, - hiddenimports=[], + hiddenimports=['sklearn.neighbors.typedefs'], hookspath=[], runtime_hooks=[], excludes=['Tkinter'], @@ -18,23 +19,25 @@ a = Analysis(['inselect.py'], cipher=block_cipher) -# PyInstaller does not detect some dylibs, I think because they are symlinked. +# PyInstaller does not detect some dylibs, I think in some cases because they +# are symlinked. # See Stack Overflow post http://stackoverflow.com/a/17595149 for example # of manipulating Analysis.binaries. -# Tuples (name, source) MISSING_DYLIBS = ( - ('libQtCore.4.dylib', 'libQtCore.4.8.7.dylib'), - ('libQtGui.4.dylib', 'libQtGui.4.8.7.dylib'), - ('libpng16.16.dylib', 'libpng16.16.dylib'), - ('libz.1.dylib', 'libz.1.dylib'), + 'libQtCore.4.dylib', + 'libQtGui.4.dylib', + 'libpng16.16.dylib', + 'libz.1.dylib', ) # The lib directory associated with this environment LIB = Path(sys.argv[0]).parent.parent.joinpath('lib') -a.binaries += TOC([(name, str(LIB.joinpath(source)), 'BINARY') for name, source in MISSING_DYLIBS]) - +# Find the source for each library and add it to the list of binaries +a.binaries += TOC([ + (lib, str(LIB.joinpath(lib).resolve()), 'BINARY') for lib in MISSING_DYLIBS +]) pyz = PYZ(a.pure, a.zipped_data, cipher=block_cipher) # Prefer to freeze to a folder rather than a single file. The choice makes no @@ -51,7 +54,7 @@ if SINGLE_FILE: name='inselect', debug=False, strip=False, - upx=True, + upx=False, console=False, icon='data/inselect.icns') else: @@ -62,7 +65,7 @@ else: name='inselect', debug=False, strip=False, - upx=True, + upx=False, console=False, icon='data/inselect.icns') @@ -71,7 +74,7 @@ else: a.zipfiles, a.datas, strip=False, - upx=True, + upx=False, name='inselect') diff --git a/inselect/gui/main_window.py b/inselect/gui/main_window.py index 4e0af48..691e753 100644 --- a/inselect/gui/main_window.py +++ b/inselect/gui/main_window.py @@ -32,6 +32,7 @@ from .plugins.subsegment import SubsegmentPlugin from .recent_documents import RecentDocuments from .roles import RotationRole +from .sort_document_items import sort_items_choice from .user_template_choice import user_template_choice from .utils import contiguous, report_to_user, qimage_of_bgr from .views.boxes import BoxesView, GraphicsItemView @@ -963,11 +964,11 @@ def _create_menu_actions(self): triggered=partial(self.select_next_prev, next=False) ) self.select_by_size_larger_action = QAction( - "Select increasing size", self, shortcut="ctrl+>", + "Select &increasing size", self, shortcut="ctrl+>", triggered=partial(self.select_by_size_step, larger=True) ) self.select_by_size_smaller_action = QAction( - "Select decreasing size", self, shortcut="ctrl+<", + "Select d&ecreasing size", self, shortcut="ctrl+<", triggered=partial(self.select_by_size_step, larger=False) ) @@ -984,14 +985,23 @@ def _create_menu_actions(self): self.delete_action.shortcut()]) self.rotate_clockwise_action = QAction( - "Rotate clockwise", self, shortcut="ctrl+R", + "Rotate c&lockwise", self, shortcut="ctrl+R", triggered=partial(self.rotate90, clockwise=True) ) self.rotate_counter_clockwise_action = QAction( - "Rotate counter-clockwise", self, shortcut="ctrl+L", + "Rotate c&ounter-clockwise", self, shortcut="ctrl+L", triggered=partial(self.rotate90, clockwise=False) ) + self.sort_by_rows_action = QAction( + "Sort by &rows", self, checkable=True, + triggered=partial(self.sort_boxes, by_columns=False) + ) + self.sort_by_columns_action = QAction( + "Sort by &columns", self, checkable=True, + triggered=partial(self.sort_boxes, by_columns=True) + ) + # Plugins # Plugin shortcuts start at F5 shortcut_offset = 5 @@ -1054,7 +1064,7 @@ def _create_menu_actions(self): icon=self.style().standardIcon(QtGui.QStyle.SP_ArrowDown) ) self.zoom_home_action = QAction( - "Whole image", self, + "&Whole image", self, shortcut=QtGui.QKeySequence.MoveToStartOfDocument, triggered=self.zoom_home, checkable=True ) @@ -1071,10 +1081,10 @@ def _create_menu_actions(self): ) self.show_object_grid_action = QAction( - 'Show grid', self, shortcut='ctrl+G', triggered=self.show_grid + 'Show &grid', self, shortcut='ctrl+G', triggered=self.show_grid ) self.show_object_expanded_action = QAction( - 'Show expanded', self, + 'Show &expanded', self, shortcut='ctrl+E', triggered=self.show_expanded ) @@ -1184,6 +1194,9 @@ def _create_menus(self): self._edit_menu.addAction(self.rotate_clockwise_action) self._edit_menu.addAction(self.rotate_counter_clockwise_action) self._edit_menu.addSeparator() + self._edit_menu.addAction(self.sort_by_rows_action) + self._edit_menu.addAction(self.sort_by_columns_action) + self._edit_menu.addSeparator() user_template_popup = self._edit_menu.addMenu('Metadata template') self.view_metadata.popup_button.inject_actions(user_template_popup) self._edit_menu.addSeparator() @@ -1210,7 +1223,7 @@ def _create_menus(self): self._view_menu.addAction(self.show_object_grid_action) self._view_menu.addAction(self.show_object_expanded_action) self._view_menu.addSeparator() - colours_popup = self._view_menu.addMenu('Colour scheme') + colours_popup = self._view_menu.addMenu('&Colour scheme') for action in self.colour_scheme_actions: colours_popup.addAction(action) @@ -1345,6 +1358,22 @@ def copy_to_new_document(self): else: self.new_document(path, default_metadata_items=items) + @report_to_user + def sort_boxes(self, by_columns): + """Sorts boxes either by columns or by rows. + """ + if self.document: + # Sort boxes + self.model.to_document(self.document) + items = sort_items_choice().sort_items( + self.document.items, by_columns + ) + self.model.set_new_boxes(items) + else: + # Record the user's choice + sort_items_choice().sort_items([], by_columns) + self.sync_ui() + def _accept_drag_drop(self, event): """If event refers to a single file that can opened, returns the path. Returns None otherwise. @@ -1428,6 +1457,8 @@ def sync_ui(self): self.delete_action.setEnabled(has_selection) self.rotate_clockwise_action.setEnabled(has_selection) self.rotate_counter_clockwise_action.setEnabled(has_selection) + self.sort_by_rows_action.setChecked(not sort_items_choice().by_columns) + self.sort_by_columns_action.setChecked(sort_items_choice().by_columns) self.cookie_cutter_widget.sync_actions(document, has_rows) for action in self.plugin_actions: action.setEnabled(document) diff --git a/inselect/gui/plugins/segment.py b/inselect/gui/plugins/segment.py index 9564259..84a9714 100644 --- a/inselect/gui/plugins/segment.py +++ b/inselect/gui/plugins/segment.py @@ -1,8 +1,10 @@ from PySide.QtGui import QIcon, QMessageBox -from inselect.lib.segment import segment_document +from inselect.lib.segment_document import SegmentDocument from inselect.lib.utils import debug_print +from inselect.gui.sort_document_items import sort_items_choice + from .plugin import Plugin @@ -16,6 +18,7 @@ def __init__(self, document, parent): self.rects = self.display = None self.document = document self.parent = parent + self.sort_choice = sort_items_choice().by_columns @classmethod def icon(cls): @@ -34,8 +37,12 @@ def can_be_run(self): def __call__(self, progress): debug_print('SegmentPlugin.__call__') - doc, display = segment_document(self.document, callback=progress) + doc, display = SegmentDocument(self.sort_choice).segment( + self.document, callback=progress + ) self.items, self.display = doc.items, display - debug_print('SegmentPlugin.__call__ exiting. Found [{0}] boxes'.format(len(self.items))) + debug_print('SegmentPlugin.__call__ exiting. Found [{0}] boxes'.format( + len(self.items)) + ) diff --git a/inselect/gui/plugins/subsegment.py b/inselect/gui/plugins/subsegment.py index e8074b8..cfafed6 100644 --- a/inselect/gui/plugins/subsegment.py +++ b/inselect/gui/plugins/subsegment.py @@ -1,11 +1,10 @@ -import numpy as np - from PySide.QtGui import QIcon, QMessageBox -from inselect.lib.segment import segment_grabcut -from inselect.lib.rect import Rect +from inselect.lib.segment_document import SegmentDocument from inselect.lib.utils import debug_print +from inselect.gui.sort_document_items import sort_items_choice + from .plugin import Plugin @@ -19,13 +18,13 @@ def __init__(self, document, parent): self.rects = self.display = None self.document = document self.parent = parent + self.sort_choice = sort_items_choice().by_columns @classmethod def icon(cls): return QIcon(':/data/subsegment_icon.png') def can_be_run(self): - # TODO LH Fix this horrible, horrible, horrible, horrible, horrible hack selected = self.parent.view_object.selectedIndexes() items_of_indexes = self.parent.view_graphics_item.items_of_indexes item = items_of_indexes(selected).next() if 1 == len(selected) else None @@ -44,52 +43,16 @@ def can_be_run(self): def __call__(self, progress): debug_print('SubsegmentPlugin.__call__') - if self.document.thumbnail: - debug_print('Subsegment will work on thumbnail') - image = self.document.thumbnail - else: - debug_print('Segment will work on full-res scan') - image = self.document.scanned - - # Perform the subsegmentation - items = self.document.items - row = self.row - window = image.from_normalised([items[row]['rect']]).next() - # Points as a list of tuples, with coordinates relative to # the top-left of the sub-segmentation window - seeds = [(p.x(), p.y()) for p in self.seeds] - - rects, display = segment_grabcut(image.array, window, seeds) + seeds = [(int(p.x()), int(p.y())) for p in self.seeds] - # Normalised Rects - rects = list(Rect(*map(lambda v: int(round(v)), rect[:4])) for rect in rects) - rects = image.to_normalised(rects) - - # Padding of one percent of height and width - rects = (r.padded(percent=1) for r in rects) - - # Constrain rects to be within image - rects = list(r.intersect(Rect(0.0, 0.0, 1.0, 1.0)) for r in rects) - - # Copy any existing metadata, rotation etc to the new items, update with - # new rects and replace the existing item - existing = items[row] - new_items = [None] * len(rects) - for index, rect in enumerate(rects): - new_items[index] = existing.copy() - new_items[index]['rect'] = rect - items[row:(1+row)] = new_items - - # Segmentation image - h, w = image.array.shape[:2] - display_image = np.zeros((h, w, 3), dtype=np.uint8) - - x, y, w, h = window - display_image[y:y+h, x:x+w] = display + items, display_image = SegmentDocument(self.sort_choice).subsegment( + self.document, self.row, seeds, callback=progress + ) self.items, self.display = items, display_image debug_print( - 'SegmentPlugin.__call__ exiting. Found [{0}] boxes'.format(len(rects)) + 'SegmentPlugin.__call__ exiting. Found [{0}] boxes'.format(len(items)) ) diff --git a/inselect/gui/sort_document_items.py b/inselect/gui/sort_document_items.py new file mode 100644 index 0000000..1dc860f --- /dev/null +++ b/inselect/gui/sort_document_items.py @@ -0,0 +1,40 @@ +from PySide.QtCore import QSettings + +from inselect.lib.sort_document_items import sort_document_items + +# QSettings path +_PATH = 'sort_by_columns' + +# Global - set to instance of CookieCutterChoice in cookie_cutter_boxes +_SORT_DOCUMENT = None + + +def sort_items_choice(): + "Returns an instance of SortDocumentItems" + global _SORT_DOCUMENT + if not _SORT_DOCUMENT: + _SORT_DOCUMENT = SortDocumentItems() + return _SORT_DOCUMENT + + +class SortDocumentItems(object): + def __init__(self): + # Key holds an integer + self._by_columns = 1 == QSettings().value(_PATH, False) + + @property + def by_columns(self): + """The user's preference for ordering by columns (True) or by rows + (False) + """ + return self._by_columns + + def sort_items(self, items, by_columns): + """Returns items sorted by columns (True) or by rows (False) or by the + user's most recent preference (None). + """ + self._by_columns = by_columns + # Pass integer to setValue - calling setValue with a bool with result + # in a string being written to the QSettings store. + QSettings().setValue(_PATH, 1 if by_columns else 0) + return sort_document_items(items, by_columns) diff --git a/inselect/lib/segment.py b/inselect/lib/segment.py index 4248468..7c2d7e3 100644 --- a/inselect/lib/segment.py +++ b/inselect/lib/segment.py @@ -4,62 +4,12 @@ import numpy as np -from .rect import Rect from .utils import debug_print # Breaks pyinstaller build # from skimage.morphology import watershed USE_OPENCV_WATERSHED = True -SEGMENTATION_PREFERRED_WIDTH = 4096 - - -def segment_document(doc, resize=None, *args, **kwargs): - """Returns doc with items replaced by the result of calling segment_edges(). - The caller is responsible for saving doc. - """ - debug_print('Segmenting [{0}]'.format(doc)) - - if doc.thumbnail: - img = doc.thumbnail - debug_print('Will segment using thumbnail [{0}]'.format(img)) - else: - img = doc.scanned - debug_print('Will segment using full-res scan [{0}]'.format(img)) - - # Make smaller images larger - height, width = img.array.shape[:2] - if resize is None and width != SEGMENTATION_PREFERRED_WIDTH: - # Resize, maintaining aspect ratio - # segment_edges() expects a tuple (height, width) - factor = float(SEGMENTATION_PREFERRED_WIDTH) / width - resize = (int(height * factor), SEGMENTATION_PREFERRED_WIDTH) - - msg = 'Resizing [{0}] from [{1}] to preferred size of [{2}]' - debug_print(msg.format(doc, (height, width), resize)) - else: - # Images of the preferred size or larger do not need resizing - debug_print('Image is of the preferred size or larger') - resize = False - - rects, display_image = segment_edges(img.array, resize=resize, *args, **kwargs) - - # Normalised Rects - rects = list(Rect(*map(lambda v: int(round(v)), rect[:4])) for rect in rects) - rects = img.to_normalised(rects) - - # Padding of one percent of height and width - rects = (r.padded(percent=1) for r in rects) - - # Constrain rects to be within image - rects = (r.intersect(Rect(0.0, 0.0, 1.0, 1.0)) for r in rects) - - items = [{"fields": {}, 'rect': r, 'rotation': 0} for r in rects] - doc = doc.copy() # Deep copy to avoid altering argument - doc.set_items(items) - debug_print('Segmented [{0}]'.format(doc)) - return doc, display_image - def _right_sized(contour, image, container_filter=True, size_filter=True): """Checks if contour size and shape is that of an object of interest. diff --git a/inselect/lib/segment_document.py b/inselect/lib/segment_document.py new file mode 100644 index 0000000..d693ddd --- /dev/null +++ b/inselect/lib/segment_document.py @@ -0,0 +1,115 @@ +import numpy as np + +from .rect import Rect +from .segment import segment_edges, segment_grabcut +from .sort_document_items import sort_document_items +from .utils import debug_print + +SEGMENTATION_PREFERRED_WIDTH = 4096 + + +class SegmentDocument(object): + """Segments and sub-segments documents, applies padding to rects + and orders rects. + """ + def __init__(self, sort_by_columns=False): + self.sort_by_columns = sort_by_columns + + def segment(self, doc, resize=None, *args, **kwargs): + """Returns doc with items replaced by the result of calling segment_edges(). + The caller is responsible for saving doc. + """ + debug_print('Segmenting [{0}]'.format(doc)) + + if doc.thumbnail: + img = doc.thumbnail + debug_print('Will segment using thumbnail [{0}]'.format(img)) + else: + img = doc.scanned + debug_print('Will segment using full-res scan [{0}]'.format(img)) + + # Make smaller images larger + height, width = img.array.shape[:2] + if resize is None and width != SEGMENTATION_PREFERRED_WIDTH: + # Resize, maintaining aspect ratio + # segment_edges() expects a tuple (height, width) + factor = float(SEGMENTATION_PREFERRED_WIDTH) / width + resize = (int(height * factor), SEGMENTATION_PREFERRED_WIDTH) + + msg = 'Resizing [{0}] from [{1}] to preferred size of [{2}]' + debug_print(msg.format(doc, (height, width), resize)) + else: + # Images of the preferred size or larger do not need resizing + debug_print('Image is of the preferred size or larger') + resize = False + + rects, display_image = segment_edges( + img.array, resize=resize, *args, **kwargs + ) + + rects = self._post_process_rects(img, rects) + + # Create item dicts + items = [{"fields": {}, 'rect': r, 'rotation': 0} for r in rects] + + # Sort items by user's most recent preference + items = sort_document_items(items, self.sort_by_columns) + + doc = doc.copy() # Deep copy to avoid altering argument + doc.set_items(items) + + debug_print('Segmented [{0}]'.format(doc)) + + return doc, display_image + + def subsegment(self, doc, row, seeds, *args, **kwargs): + """seeds - a list of tuples (x, y) with coordinates relative to + the top-left of the sub-segmentation window + """ + if doc.thumbnail: + debug_print('Subsegment will work on thumbnail') + img = doc.thumbnail + else: + debug_print('Segment will work on full-res scan') + img = doc.scanned + + items = doc.items + window = next(img.from_normalised([items[row]['rect']])) + rects, display = segment_grabcut(img.array, window, seeds) + + rects = list(self._post_process_rects(img, rects)) + + # Copy any existing metadata, rotation etc to the new items, update with + # new rects and replace the existing item + existing = items[row] + new_items = [None] * len(rects) + for index, rect in enumerate(rects): + new_items[index] = existing.copy() + new_items[index]['rect'] = rect + + # Sort items by user's most recent preference + new_items = sort_document_items(new_items, self.sort_by_columns) + + items[row:(1+row)] = new_items + + # Segmentation image + h, w = img.array.shape[:2] + display_image = np.zeros((h, w, 3), dtype=np.uint8) + + x, y, w, h = window + display_image[y:y+h, x:x+w] = display + + return items, display_image + + def _post_process_rects(self, img, rects): + """Generator of instances of normalised Rect with padding applied + """ + # Normalised coords and construct instances of Rect + rects = list(Rect(*map(lambda v: int(round(v)), rect[:4])) for rect in rects) + rects = img.to_normalised(rects) + + # Apply padding of one percent of height and width + rects = (r.padded(percent=1) for r in rects) + + # Constrain rects to be within image + return (r.intersect(Rect(0.0, 0.0, 1.0, 1.0)) for r in rects) diff --git a/inselect/lib/sort_document_items.py b/inselect/lib/sort_document_items.py new file mode 100644 index 0000000..1d3cbbb --- /dev/null +++ b/inselect/lib/sort_document_items.py @@ -0,0 +1,47 @@ +from itertools import izip +from operator import itemgetter + +import numpy as np + +from scipy.signal import argrelmin +from sklearn.neighbors import KernelDensity + + +def _do_kde(values): + """Uses kernel denstity estimation to assign values to clusters using + minima. Returns a generator of ints that are bin numbers. + """ + # http://stackoverflow.com/a/35151947 + RESCALE = 100 + values = np.array([int(v * RESCALE) for v in values]).reshape(-1, 1) + kde = KernelDensity().fit(values) + + # Identify minima and use as break points + samples = np.linspace(0, RESCALE) + evaluations = kde.score_samples(samples.reshape(-1, 1)) + minima = argrelmin(evaluations) + + # The right-hand edges of bins + bins = np.append(samples[minima], RESCALE) + + # Cut data + return (v[0] for v in np.digitize(values, bins, right=True).tolist()) + + +def sort_document_items(items, by_columns): + """Returns items sorted either by columns or by rows + """ + if not items: + # Algorithm is not tolerant of empty values + return [] + else: + rects = [i['rect'] for i in items] + x_bins = _do_kde(r.centre.x for r in rects) + y_bins = _do_kde(r.centre.y for r in rects) + + if by_columns: + keys = izip(x_bins, y_bins, (r.left for r in rects)) + else: + keys = izip(y_bins, x_bins, (r.left for r in rects)) + items_and_keys = sorted(izip(items, keys), key=itemgetter(1)) + return [v[0] for v in items_and_keys] diff --git a/inselect/scripts/export_metadata.py b/inselect/scripts/export_metadata.py index 0dfd88c..3683daf 100755 --- a/inselect/scripts/export_metadata.py +++ b/inselect/scripts/export_metadata.py @@ -9,10 +9,6 @@ from pathlib import Path -# Import numpy here to prevent PyInstaller build from breaking -# TODO LH find a better solution -import numpy # noqa - import inselect import inselect.lib.utils diff --git a/inselect/scripts/ingest.py b/inselect/scripts/ingest.py index e670eb4..34436d7 100755 --- a/inselect/scripts/ingest.py +++ b/inselect/scripts/ingest.py @@ -9,10 +9,6 @@ from pathlib import Path -# Import numpy here to prevent PyInstaller build from breaking -# TODO LH find a better solution -import numpy # noqa - import inselect import inselect.lib.utils diff --git a/inselect/scripts/read_barcodes.py b/inselect/scripts/read_barcodes.py index 470ab77..f3e5446 100755 --- a/inselect/scripts/read_barcodes.py +++ b/inselect/scripts/read_barcodes.py @@ -10,10 +10,6 @@ from itertools import count, izip from pathlib import Path -# Import numpy here to prevent PyInstaller build from breaking -# TODO LH find a better solution -import numpy # noqa - import inselect.lib.utils from inselect.lib.utils import debug_print diff --git a/inselect/scripts/save_crops.py b/inselect/scripts/save_crops.py index 7c45cd1..f633999 100755 --- a/inselect/scripts/save_crops.py +++ b/inselect/scripts/save_crops.py @@ -9,10 +9,6 @@ from pathlib import Path -# Import numpy here to prevent PyInstaller build from breaking -# TODO LH find a better solution -import numpy # noqa - import inselect import inselect.lib.utils diff --git a/inselect/scripts/segment.py b/inselect/scripts/segment.py index 1b34022..e908c47 100755 --- a/inselect/scripts/segment.py +++ b/inselect/scripts/segment.py @@ -9,29 +9,26 @@ from pathlib import Path -# Import numpy here to prevent PyInstaller build from breaking -# TODO LH find a better solution -import numpy # noqa - import inselect.lib.utils from inselect.lib.document import InselectDocument -from inselect.lib.segment import segment_document +from inselect.lib.segment_document import SegmentDocument from inselect.lib.utils import debug_print # TODO Recursive option # TODO Option to resegment documents with existing boxes -def segment(dir): +def segment(dir, sort_by_columns): dir = Path(dir) + segment_doc = SegmentDocument(sort_by_columns) for p in dir.glob('*' + InselectDocument.EXTENSION): doc = InselectDocument.load(p) if not doc.items: print(u'Segmenting [{0}]'.format(p)) try: debug_print(u'Will segment [{0}]'.format(p)) - doc, display_image = segment_document(doc) + doc, display_image = segment_doc.segment(doc) del display_image # We don't use this doc.save() except KeyboardInterrupt: @@ -49,13 +46,18 @@ def main(args): parser = argparse.ArgumentParser(description='Segments Inselect documents') parser.add_argument("dir", help='Directory containing Inselect documents') parser.add_argument('--debug', action='store_true') - parser.add_argument('-v', '--version', action='version', - version='%(prog)s ' + inselect.__version__) + parser.add_argument( + '--sort-by-columns', action='store_true', default=False, + help='Sort boxes by columns; default is to sort boxes by rows') + parser.add_argument( + '-v', '--version', action='version', + version='%(prog)s ' + inselect.__version__ + ) args = parser.parse_args(args) inselect.lib.utils.DEBUG_PRINT = args.debug - segment(args.dir) + segment(args.dir, args.sort_by_columns) if __name__ == '__main__': diff --git a/inselect/tests/gui/test_action_state.py b/inselect/tests/gui/test_action_state.py index afa01fc..1072ecf 100644 --- a/inselect/tests/gui/test_action_state.py +++ b/inselect/tests/gui/test_action_state.py @@ -29,6 +29,8 @@ def _test_no_document(self): self.assertFalse(w.previous_box_action.isEnabled()) self.assertFalse(w.rotate_clockwise_action.isEnabled()) self.assertFalse(w.rotate_counter_clockwise_action.isEnabled()) + self.assertTrue(w.sort_by_rows_action.isEnabled()) + self.assertTrue(w.sort_by_columns_action.isEnabled()) self.assertFalse(w.plugin_actions[0].isEnabled()) # View @@ -57,6 +59,8 @@ def _test_document_open(self): self.assertTrue(w.previous_box_action.isEnabled()) self.assertFalse(w.rotate_clockwise_action.isEnabled()) self.assertFalse(w.rotate_counter_clockwise_action.isEnabled()) + self.assertTrue(w.sort_by_rows_action.isEnabled()) + self.assertTrue(w.sort_by_columns_action.isEnabled()) self.assertTrue(w.plugin_actions[0].isEnabled()) # View diff --git a/inselect/tests/gui/test_segment.py b/inselect/tests/gui/test_segment.py index 14ea1e6..be42af4 100644 --- a/inselect/tests/gui/test_segment.py +++ b/inselect/tests/gui/test_segment.py @@ -9,6 +9,7 @@ from gui_test import MainWindowTest from inselect.gui.roles import RectRole +from inselect.gui.sort_document_items import SortDocumentItems TESTDATA = Path(__file__).parent.parent / 'test_data' @@ -34,8 +35,9 @@ def test_segment(self, mock_question): indexes = [w.model.index(r, 0) for r in xrange(0, w.model.rowCount())] expected = [w.model.data(i, RectRole) for i in indexes] - # Segment - self.run_async_operation(partial(w.run_plugin, 0)) + # Segment, sorting by rows + with patch.object(SortDocumentItems, 'by_columns', False): + self.run_async_operation(partial(w.run_plugin, 0)) # Get the rects of the new boxes self.assertEqual(5, w.model.rowCount()) diff --git a/inselect/tests/gui/test_subsegment.py b/inselect/tests/gui/test_subsegment.py index d2edd97..c885727 100644 --- a/inselect/tests/gui/test_subsegment.py +++ b/inselect/tests/gui/test_subsegment.py @@ -8,6 +8,7 @@ from PySide.QtGui import QMessageBox from inselect.gui.roles import MetadataRole, RectRole +from inselect.gui.sort_document_items import SortDocumentItems from gui_test import MainWindowTest @@ -37,8 +38,9 @@ def test_subsegment(self): for pos in seeds: box.append_point_of_interest(pos) - # Sub-segment - self.run_async_operation(partial(w.run_plugin, 1)) + # Sub-segment, sorting by rows + with patch.object(SortDocumentItems, 'by_columns', False): + self.run_async_operation(partial(w.run_plugin, 1)) # Should have three boxes with the same metadata self.assertEqual(3, w.model.rowCount()) diff --git a/inselect/tests/lib/test_document_export.py b/inselect/tests/lib/test_document_export.py index 2574c94..87c6867 100644 --- a/inselect/tests/lib/test_document_export.py +++ b/inselect/tests/lib/test_document_export.py @@ -144,13 +144,13 @@ def test_csv_export(self): self.assertEqual( (u'04_3.png', u'4', u'0', u'248', u'189', u'437', - u'', u'Elsinoë', u'3'), + u'4', u'Elsinoë', u'3'), metadata_cols(reader.next()) ) self.assertEqual( (u'05_4.png', u'5', u'271', u'248', u'459', u'437', - u'', u'D', u'4'), + u'5', u'D', u'4'), metadata_cols(reader.next()) ) self.assertIsNone(next(reader, None)) diff --git a/inselect/tests/lib/test_segment.py b/inselect/tests/lib/test_segment.py index 2171fa8..65d5287 100644 --- a/inselect/tests/lib/test_segment.py +++ b/inselect/tests/lib/test_segment.py @@ -2,28 +2,42 @@ from pathlib import Path from inselect.lib.document import InselectDocument -from inselect.lib.segment import segment_document +from inselect.lib.segment_document import SegmentDocument TESTDATA = Path(__file__).parent.parent / 'test_data' class TestSegment(unittest.TestCase): - def test_segment_document(self): - doc = InselectDocument.load(TESTDATA / 'test_segment.inselect') - + def _segment(self, doc, sort_by_columns, expected): self.assertEqual(5, len(doc.items)) - - # Compare the rects in pixels - expected = doc.scanned.from_normalised([i['rect'] for i in doc.items]) doc.set_items([]) self.assertEqual(0, len(doc.items)) - doc, display_image = segment_document(doc) + segment_doc = SegmentDocument(sort_by_columns=sort_by_columns) + doc, display_image = segment_doc.segment(doc) + # Compare the rects in pixels actual = doc.scanned.from_normalised([i['rect'] for i in doc.items]) self.assertEqual(list(expected), list(actual)) + def test_segment_document_sort_by_rows(self): + "Segment the document with boxes sorted by rows" + doc = InselectDocument.load(TESTDATA / 'test_segment.inselect') + expected = doc.scanned.from_normalised( + [i['rect'] for i in doc.items] + ) + self._segment(doc, False, expected) + + def test_segment_document_sort_by_columns(self): + "Segment the document with boxes sorted by columns" + doc = InselectDocument.load(TESTDATA / 'test_segment.inselect') + items = doc.items + expected = doc.scanned.from_normalised( + [items[index]['rect'] for index in (0, 3, 2, 1, 4)] + ) + self._segment(doc, True, expected) + if __name__ == '__main__': unittest.main() diff --git a/inselect/tests/lib/test_sort_boxes.py b/inselect/tests/lib/test_sort_boxes.py new file mode 100644 index 0000000..66a0cba --- /dev/null +++ b/inselect/tests/lib/test_sort_boxes.py @@ -0,0 +1,31 @@ +import unittest +from pathlib import Path + +from inselect.lib.document import InselectDocument +from inselect.lib.sort_document_items import sort_document_items + + +TESTDATA = Path(__file__).parent.parent / 'test_data' + + +class TestSortBoxes(unittest.TestCase): + def test_order_by_rows(self): + doc = InselectDocument.load(TESTDATA / 'test_segment.inselect') + + items = sort_document_items(doc.items, by_columns=False) + self.assertEqual( + ['1', '2', '3', '4', '5'], + [item['fields']['catalogNumber'] for item in items] + ) + + def test_order_by_columns(self): + doc = InselectDocument.load(TESTDATA / 'test_segment.inselect') + items = sort_document_items(doc.items, by_columns=True) + self.assertEqual( + ['1', '4', '3', '2', '5'], + [item['fields']['catalogNumber'] for item in items] + ) + + +if __name__ == '__main__': + unittest.main() diff --git a/inselect/tests/test_data/test_segment.inselect b/inselect/tests/test_data/test_segment.inselect index 725f2b4..b2b0996 100644 --- a/inselect/tests/test_data/test_segment.inselect +++ b/inselect/tests/test_data/test_segment.inselect @@ -42,6 +42,7 @@ }, { "fields": { + "catalogNumber": "4", "scientificName": "Elsinoë" }, "rect": [ @@ -54,6 +55,7 @@ }, { "fields": { + "catalogNumber": "5", "scientificName": "D" }, "rect": [ diff --git a/setup.py b/setup.py index a43a3fe..cc7d90a 100755 --- a/setup.py +++ b/setup.py @@ -47,13 +47,19 @@ } for script in SCRIPTS ], + # Strings in braces within 'include_files' tuples expanded in cx_setup 'include_files': [ ('{site_packages}/numpy', 'numpy'), + ('{site_packages}/scipy', 'scipy'), + ('{site_packages}/sklearn', 'sklearn'), + ('{environment_root}/Library/bin/mkl_core.dll', 'mkl_core.dll'), + ('{environment_root}/Library/bin/libiomp5md.dll', 'libiomp5md.dll'), ], 'extra_packages': ['win32com.gen_py'], 'excludes': [ - 'Tkinter', 'ttk', 'Tkconstants', 'tcl', - 'future.moves' # Errors from urllib otherwise + 'Tkinter', 'ttk', 'Tkconstants', 'tcl', '_ssl', + 'future.moves', # Errors from urllib otherwise + 'PySide.QtNetwork', ] } } @@ -78,13 +84,17 @@ def cx_setup(): """cx_Freeze setup. Used for building Windows installers""" from cx_Freeze import setup, Executable from distutils.sysconfig import get_python_lib + from pathlib import Path - # Set path to include files - site_packages = get_python_lib() + # Set paths to include files + format_strings = { + 'site_packages': get_python_lib(), + 'environment_root': Path(sys.executable).parent, + } include_files = [] for i in setup_data['win32']['include_files']: include_files.append(( - i[0].format(site_packages=site_packages), + i[0].format(**format_strings), i[1] )) @@ -97,6 +107,8 @@ def cx_setup(): 'packages': setup_data['packages'] + setup_data['win32']['extra_packages'], 'excludes': setup_data['win32']['excludes'], 'include_files': include_files, + 'include_msvcr': True, + 'optimize': 2, }, 'bdist_msi': { 'upgrade_code': '{fe2ed61d-cd5e-45bb-9d16-146f725e522f}'