Source code for girder_large_image_annotation.models.annotation

#  Copyright Kitware Inc.
#  Licensed under the Apache License, Version 2.0 ( the "License" );
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  See the License for the specific language governing permissions and
#  limitations under the License.

import copy
import datetime
import enum
import re
import threading
import time

import cherrypy
import jsonschema
import numpy
from bson import ObjectId
from girder_large_image import constants
from girder_large_image.models.image_item import ImageItem

from girder import events, logger
from girder.constants import AccessType, SortDir
from girder.exceptions import AccessException, ValidationException
from girder.models.folder import Folder
from girder.models.item import Item
from girder.models.model_base import AccessControlledModel
from girder.models.notification import Notification
from girder.models.setting import Setting
from girder.models.user import User

from .annotationelement import Annotationelement

# Some arrays longer than this are validated using numpy rather than jsonschema

[docs]def extendSchema(base, add): extend = copy.deepcopy(base) for key in add: if key == 'required' and 'required' in base: extend[key] = sorted(set(extend[key]) | set(add[key])) elif key != 'properties' and 'properties' in base: extend[key] = add[key] if 'properties' in add: extend['properties'].update(add['properties']) return extend
[docs]class AnnotationSchema: coordSchema = { 'type': 'array', # TODO: validate that z==0 for now 'items': { 'type': 'number' }, 'minItems': 3, 'maxItems': 3, 'name': 'Coordinate', # TODO: define origin for 3D images 'description': 'An X, Y, Z coordinate tuple, in base layer pixel ' 'coordinates, where the origin is the upper-left.' } coordValueSchema = { 'type': 'array', 'items': { 'type': 'number' }, 'minItems': 4, 'maxItems': 4, 'name': 'CoordinateWithValue', 'description': 'An X, Y, Z, value coordinate tuple, in base layer ' 'pixel coordinates, where the origin is the upper-left.' } colorSchema = { 'type': 'string', # We accept colors of the form # #aabbcc six digit RRGGBB hex # #abc three digit RGB hex # rgb(255, 255, 255) rgb decimal triplet # rgba(255, 255, 255, 1) rgba quad with RGB in the range [0-255] and # alpha [0-1] # TODO: make rgb and rgba spec validate that rgb is [0-255] and a is # [0-1], rather than just checking if they are digits and such. 'pattern': r'^(#[0-9a-fA-F]{3,6}|rgb\(\d+,\s*\d+,\s*\d+\)|' r'rgba\(\d+,\s*\d+,\s*\d+,\s*(\d?\.|)\d+\))$', } colorRangeSchema = { 'type': 'array', 'items': colorSchema, 'description': 'A list of colors', } rangeValueSchema = { 'type': 'array', 'items': {'type': 'number'}, 'description': 'A weakly monotonic list of range values', } userSchema = { 'type': 'object', 'additionalProperties': True } labelSchema = { 'type': 'object', 'properties': { 'value': {'type': 'string'}, 'visibility': { 'type': 'string', # TODO: change to True, False, None? 'enum': ['hidden', 'always', 'onhover'] }, 'fontSize': { 'type': 'number', 'exclusiveMinimum': 0, }, 'color': colorSchema, }, 'required': ['value'], 'additionalProperties': False } groupSchema = {'type': 'string'} baseElementSchema = { 'type': 'object', 'properties': { 'id': { 'type': 'string', 'pattern': '^[0-9a-f]{24}$', }, 'type': {'type': 'string'}, # schema free field for users to extend annotations 'user': userSchema, 'label': labelSchema, 'group': groupSchema }, 'required': ['type'], 'additionalProperties': True } baseShapeSchema = extendSchema(baseElementSchema, { 'properties': { 'lineColor': colorSchema, 'lineWidth': { 'type': 'number', 'minimum': 0 }, }, }) pointShapeSchema = extendSchema(baseShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['point'] }, 'center': coordSchema, 'fillColor': colorSchema }, 'required': ['type', 'center'], 'additionalProperties': False }) arrowShapeSchema = extendSchema(baseShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['arrow'] }, 'points': { 'type': 'array', 'items': coordSchema, 'minItems': 2, 'maxItems': 2, }, 'fillColor': colorSchema }, 'description': 'The first point is the head of the arrow', 'required': ['type', 'points'], 'additionalProperties': False }) circleShapeSchema = extendSchema(baseShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['circle'] }, 'center': coordSchema, 'radius': { 'type': 'number', 'minimum': 0 }, 'fillColor': colorSchema }, 'required': ['type', 'center', 'radius'], 'additionalProperties': False }) polylineShapeSchema = extendSchema(baseShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['polyline'] }, 'points': { 'type': 'array', 'items': coordSchema, 'minItems': 2, }, 'fillColor': colorSchema, 'closed': { 'type': 'boolean', 'description': 'polyline is open if closed flag is ' 'not specified' }, 'holes': { 'type': 'array', 'description': 'If closed is true, this is a list of polylines that are ' 'treated as holes in the base polygon. These should not ' 'cross each other and should be contained within the base ' 'polygon.', 'items': { 'type': 'array', 'items': coordSchema, 'minItems': 3, }, }, }, 'required': ['type', 'points'], 'additionalProperties': False }) baseRectangleShapeSchema = extendSchema(baseShapeSchema, { 'properties': { 'type': {'type': 'string'}, 'center': coordSchema, 'width': { 'type': 'number', 'minimum': 0 }, 'height': { 'type': 'number', 'minimum': 0 }, 'rotation': { 'type': 'number', 'description': 'radians counterclockwise around normal', }, 'normal': coordSchema, 'fillColor': colorSchema }, 'decription': 'normal is the positive z-axis unless otherwise ' 'specified', 'required': ['type', 'center', 'width', 'height'], }) rectangleShapeSchema = extendSchema(baseRectangleShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['rectangle'] }, }, 'additionalProperties': False }) rectangleGridShapeSchema = extendSchema(baseRectangleShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['rectanglegrid'] }, 'widthSubdivisions': { 'type': 'integer', 'minimum': 1 }, 'heightSubdivisions': { 'type': 'integer', 'minimum': 1 }, }, 'required': ['type', 'widthSubdivisions', 'heightSubdivisions'], 'additionalProperties': False, }) ellipseShapeSchema = extendSchema(baseRectangleShapeSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['ellipse'] }, }, 'required': ['type'], 'additionalProperties': False }) heatmapSchema = extendSchema(baseElementSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['heatmap'] }, 'points': { 'type': 'array', 'items': coordValueSchema, }, 'radius': { 'type': 'number', 'exclusiveMinimum': 0, }, 'colorRange': colorRangeSchema, 'rangeValues': rangeValueSchema, 'normalizeRange': { 'type': 'boolean', 'description': 'If true, rangeValues are on a scale of 0 to 1 ' 'and map to the minimum and maximum values on the ' 'data. If false (the default), the rangeValues ' 'are the actual data values.', }, 'scaleWithZoom': { 'type': 'boolean', 'description': 'If true, scale the size of points with the ' 'zoom level of the map.' } }, 'required': ['type', 'points'], 'additionalProperties': False, 'description': 'ColorRange and rangeValues should have a one-to-one ' 'correspondence.', }) griddataSchema = extendSchema(baseElementSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['griddata'] }, 'origin': coordSchema, 'dx': { 'type': 'number', 'description': 'grid spacing in the x direction', }, 'dy': { 'type': 'number', 'description': 'grid spacing in the y direction', }, 'gridWidth': { 'type': 'integer', 'minimum': 1, 'description': 'The number of values across the width of the grid', }, 'values': { 'type': 'array', 'items': {'type': 'number'}, 'description': 'The values of the grid. This must have a ' 'multiple of gridWidth entries', }, 'interpretation': { 'type': 'string', 'enum': ['heatmap', 'contour', 'choropleth'] }, 'radius': { 'type': 'number', 'exclusiveMinimum': 0, 'description': 'radius used for heatmap interpretation', }, 'colorRange': colorRangeSchema, 'rangeValues': rangeValueSchema, 'normalizeRange': { 'type': 'boolean', 'description': 'If true, rangeValues are on a scale of 0 to 1 ' 'and map to the minimum and maximum values on the ' 'data. If false (the default), the rangeValues ' 'are the actual data values.', }, 'stepped': {'type': 'boolean'}, 'minColor': colorSchema, 'maxColor': colorSchema, }, 'required': ['type', 'values', 'gridWidth'], 'additionalProperties': False, 'description': 'ColorRange and rangeValues should have a one-to-one ' 'correspondence except for stepped contours where ' 'rangeValues needs one more entry than colorRange. ' 'minColor and maxColor are the colors applies to values ' 'beyond the ranges in rangeValues.', }) transformArray = { 'type': 'array', 'items': { 'type': 'array', 'minItems': 2, 'maxItems': 2 }, 'minItems': 2, 'maxItems': 2, 'description': 'A 2D matrix representing the transform of an ' 'image overlay.' } overlaySchema = extendSchema(baseElementSchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['image'] }, 'girderId': { 'type': 'string', 'pattern': '^[0-9a-f]{24}$', 'description': 'Girder item ID containing the image to ' 'overlay.' }, 'opacity': { 'type': 'number', 'minimum': 0, 'maximum': 1, 'description': 'Default opacity for this image overlay. Must ' 'be between 0 and 1. Defaults to 1.' }, 'hasAlpha': { 'type': 'boolean', 'description': 'If true, the image is treated assuming it has an alpha ' 'channel.', }, 'transform': { 'type': 'object', 'description': 'Specification for an affine transform of the ' 'image overlay. Includes a 2D transform matrix, ' 'an X offset and a Y offset.', 'properties': { 'xoffset': { 'type': 'number' }, 'yoffset': { 'type': 'number' }, 'matrix': transformArray }, } }, 'required': ['girderId', 'type'], 'additionalProperties': False, 'description': 'An image overlay on top of the base resource.', }) pixelmapCategorySchema = { 'type': 'object', 'properties': { 'fillColor': colorSchema, 'strokeColor': colorSchema, 'label': { 'type': 'string', 'description': 'A string representing the semantic ' 'meaning of regions of the map with ' 'the corresponding color.' }, 'description': { 'type': 'string', 'description': 'A more detailed explanation of the ' 'meaining of this category.' } }, 'required': ['fillColor'], 'additionalProperties': False, } pixelmapSchema = extendSchema(overlaySchema, { 'properties': { 'type': { 'type': 'string', 'enum': ['pixelmap'], }, 'values': { 'type': 'array', 'items': {'type': 'integer'}, 'description': 'An array where the indices ' 'correspond to pixel values in the ' 'pixel map image and the values are ' 'used to look up the appropriate ' 'color in the categories property.' }, 'categories': { 'type': 'array', 'items': pixelmapCategorySchema, 'description': 'An array used to map between the ' 'values array and color values. ' 'Can also contain semantic ' 'information for color values.' }, 'boundaries': { 'type': 'boolean', 'description': 'True if the pixelmap doubles pixel ' 'values such that even values are the ' 'fill and odd values the are stroke ' 'of each superpixel. If true, the ' 'length of the values array should be ' 'half of the maximum value in the ' 'pixelmap.' }, }, 'required': ['values', 'categories', 'boundaries'], 'additionalProperties': False, 'description': 'A tiled pixelmap to overlay onto a base resource.', }) annotationElementSchema = { # Shape subtypes are mutually exclusive, so for efficiency, don't use # 'oneOf' 'anyOf': [ # If we include the baseShapeSchema, then shapes that are as-yet # invented can be included. # baseShapeSchema, arrowShapeSchema, circleShapeSchema, ellipseShapeSchema, griddataSchema, heatmapSchema, pointShapeSchema, polylineShapeSchema, rectangleShapeSchema, rectangleGridShapeSchema, overlaySchema, pixelmapSchema, ] } annotationSchema = { '$schema': '', 'type': 'object', 'properties': { 'name': { 'type': 'string', # TODO: Disallow empty? 'minLength': 1, }, 'description': {'type': 'string'}, 'attributes': { 'type': 'object', 'additionalProperties': True, 'title': 'Image Attributes', 'description': 'Subjective things that apply to the entire ' 'image.' }, 'elements': { 'type': 'array', 'items': annotationElementSchema, # We want to ensure unique element IDs, if they are set. If # they are not set, we assign them from Mongo. 'title': 'Image Markup', 'description': 'Subjective things that apply to a ' 'spatial region.' } }, 'additionalProperties': False }
[docs]class Annotation(AccessControlledModel): """ This model is used to represent an annotation that is associated with an item. The annotation can contain any number of annotationelements, which are included because they reference this annotation as a parent. The annotation acts like these are a native part of it, though they are each stored as independent models to (eventually) permit faster spatial searching. """ validatorAnnotation = jsonschema.Draft6Validator( AnnotationSchema.annotationSchema) validatorAnnotationElement = jsonschema.Draft6Validator( AnnotationSchema.annotationElementSchema) idRegex = re.compile('^[0-9a-f]{24}$') numberInstance = (int, float)
[docs] class Skill(enum.Enum): NOVICE = 'novice' EXPERT = 'expert'
# This is everything except the annotation field, and is used, in part, to # determine what gets returned in a general find. baseFields = ( '_id', 'itemId', 'creatorId', 'created', 'updated', 'updatedId', 'public', 'publicFlags', 'groups' # 'skill', # 'startTime' # 'stopTime' )
[docs] def initialize(self): self._writeLock = threading.Lock() = 'annotation' self.ensureIndices([ 'itemId', 'created', 'creatorId', ([ ('itemId', SortDir.ASCENDING), ('_active', SortDir.ASCENDING), ], {}), ([ ('_annotationId', SortDir.ASCENDING), ('_version', SortDir.DESCENDING), ], {}), 'updated', ]) self.ensureTextIndex({ '': 10, 'annotation.description': 1, }) self.exposeFields(AccessType.READ, ( 'annotation', '_version', '_elementQuery', '_active', ) + self.baseFields) events.bind('model.item.remove', 'large_image_annotation', self._onItemRemove) events.bind('model.item.copy.prepare', 'large_image_annotation', self._prepareCopyItem) events.bind('model.item.copy.after', 'large_image_annotation', self._handleCopyItem) self._historyEnabled = Setting().get( constants.PluginSettings.LARGE_IMAGE_ANNOTATION_HISTORY) # Listen for changes to our relevant settings events.bind('', 'large_image_annotation', self._onSettingChange) events.bind('model.setting.remove', 'large_image_annotation', self._onSettingChange)
def _onItemRemove(self, event): """ When an item is removed, also delete associated annotations. :param event: the event with the item information. """ item = annotations = Annotation().find({'itemId': item['_id']}) for annotation in annotations: if self._historyEnabled: # just mark the annotations as inactive self.update({'_id': annotation['_id']}, {'$set': {'_active': False}}) else: Annotation().remove(annotation) def _prepareCopyItem(self, event): # check if this copy should include annotations if (cherrypy.request and cherrypy.request.params and str(cherrypy.request.params.get('copyAnnotations')).lower() == 'false'): return srcItem, newItem = if Annotation().findOne({ '_active': {'$ne': False}, 'itemId': srcItem['_id']}): newItem['_annotationItemId'] = srcItem['_id'] Item().save(newItem, triggerEvents=False) def _handleCopyItem(self, event): newItem = srcItemId = newItem.pop('_annotationItemId', None) if srcItemId: Item().save(newItem, triggerEvents=False) self._copyAnnotationsFromOtherItem(srcItemId, newItem) def _copyAnnotationsFromOtherItem(self, srcItemId, destItem): # Copy annotations from the original item to this one query = {'_active': {'$ne': False}, 'itemId': srcItemId} annotations = Annotation().find(query) total = annotations.count() if not total: return destItemId = destItem['_id'] folder = Folder().load(destItem['folderId'], force=True) count = 0 for annotation in annotations:'Copying annotation %d of %d from %s to %s', count + 1, total, srcItemId, destItemId) # Make sure we have the elements annotation = Annotation().load(annotation['_id'], force=True) # This could happen, for instance, if the annotation were deleted # while we are copying other annotations. if annotation is None: continue annotation['itemId'] = destItemId del annotation['_id'] # Remove existing permissions, then give it the same permissions # as the item's folder. annotation.pop('access', None) self.copyAccessPolicies(destItem, annotation, save=False) self.setPublic(annotation, folder.get('public'), save=False) count += 1'Copied %d annotations from %s to %s ', count, srcItemId, destItemId) def _onSettingChange(self, event): settingDoc = if settingDoc['key'] == constants.PluginSettings.LARGE_IMAGE_ANNOTATION_HISTORY: self._historyEnabled = settingDoc['value'] def _migrateDatabase(self): # Check that all entries have ACL for annotation in self.collection.find({'access': {'$exists': False}}): self._migrateACL(annotation) # Check that all annotations have groups for annotation in self.collection.find({'groups': {'$exists': False}}): self.injectAnnotationGroupSet(annotation) def _migrateACL(self, annotation): """ Add access control information to an annotation model. Originally annotation models were not access controlled. This function performs the migration for annotations created before this change was made. The access object is copied from the folder containing the image the annotation is attached to. In addition, the creator is given admin access. """ if annotation is None or 'access' in annotation: return annotation item = Item().load(annotation['itemId'], force=True) if item is None: logger.warning( 'Could not generate annotation ACL due to missing item %s', annotation['_id']) return annotation folder = Folder().load(item['folderId'], force=True) if folder is None: logger.warning( 'Could not generate annotation ACL due to missing folder %s', annotation['_id']) return annotation user = None if annotation.get('creatorId'): user = User().load(annotation['creatorId'], force=True) if user is None: logger.warning( 'Could not generate annotation ACL due to missing user %s', annotation['_id']) return annotation self.copyAccessPolicies(item, annotation, save=False) self.setUserAccess(annotation, user, AccessType.ADMIN, force=True, save=False) self.setPublic(annotation, folder.get('public'), save=False) # call the super class save method to avoid messing with elements super().save(annotation)'Generated annotation ACL for %s', annotation['_id']) return annotation
[docs] def createAnnotation(self, item, creator, annotation, public=None): now = datetime.datetime.utcnow() doc = { 'itemId': item['_id'], 'creatorId': creator['_id'], 'created': now, 'updatedId': creator['_id'], 'updated': now, 'annotation': annotation, } if annotation and not annotation.get('name'): annotation['name'] = now.strftime('Annotation %Y-%m-%d %H:%M') # copy access control from the folder containing the image folder = Folder().load(item['folderId'], force=True) self.copyAccessPolicies(src=folder, dest=doc, save=False) if public is None: public = folder.get('public', False) self.setPublic(doc, public, save=False) # give the current user admin access self.setUserAccess(doc, user=creator, level=AccessType.ADMIN, save=False) doc = Notification().createNotification( type='large_image_annotation.create', data={'_id': doc['_id'], 'itemId': doc['itemId']}, user=creator, expires=datetime.datetime.utcnow() + datetime.timedelta(seconds=1)) return doc
[docs] def load(self, id, region=None, getElements=True, *args, **kwargs): """ Load an annotation, adding all or a subset of the elements to it. :param region: if present, a dictionary restricting which annotations are returned. See annotationelement.getElements. :param getElements: if False, don't get elements associated with this annotation. :returns: the matching annotation or none. """ annotation = super().load(id, *args, **kwargs) if annotation is None: return if getElements: # It is possible that we are trying to read the elements of an # annotation as another thread is updating them. In this case, # there is a chance, that between when we get the annotation and # ask for the elements, the version will have been updated and the # elements will have gone away. To work around the lack of # transactions in Mongo, if we don't get any elements, we check if # the version has shifted under us, and, if so, requery. I've put # an arbitrary retry limit on this to prevent an infinite loop. maxRetries = 3 for retry in range(maxRetries): Annotationelement().getElements( annotation, region) if (len(annotation.get('annotation', {}).get('elements')) or retry + 1 == maxRetries): break recheck = super().load(id, *args, **kwargs) if (recheck is None or annotation.get('_version') == recheck.get('_version')): break annotation = recheck self.injectAnnotationGroupSet(annotation) return annotation
[docs] def remove(self, annotation, *args, **kwargs): """ When removing an annotation, remove all element associated with it. This overrides the collection delete_one method so that all of the triggers are fired as expected and cancelling from an event will work as needed. :param annotation: the annotation document to remove. """ if self._historyEnabled: # just mark the annotations as inactive result = self.update({'_id': annotation['_id']}, {'$set': {'_active': False}}) else: with self._writeLock: delete_one = self.collection.delete_one def deleteElements(query, *args, **kwargs): ret = delete_one(query, *args, **kwargs) Annotationelement().removeElements(annotation) return ret with self._writeLock: self.collection.delete_one = deleteElements try: result = super().remove(annotation, *args, **kwargs) finally: self.collection.delete_one = delete_one Notification().createNotification( type='large_image_annotation.remove', data={'_id': annotation['_id'], 'itemId': annotation['itemId']}, user=User().load(annotation['creatorId'], force=True), expires=datetime.datetime.utcnow() + datetime.timedelta(seconds=1)) return result
[docs] def save(self, annotation, *args, **kwargs): """ When saving an annotation, override the collection insert_one and replace_one methods so that we don't save the elements with the main annotation. Still use the super class's save method, so that all of the triggers are fired as expected and cancelling and modifications can be done as needed. Because Mongo doesn't support transactions, a version number is stored with the annotation and with the associated elements. This is used to add the new elements first, then update the annotation, and delete the old elements. The allows version integrity if another thread queries the annotation at the same time. :param annotation: the annotation document to save. :returns: the saved document. If it is a new document, the _id has been added. """ starttime = time.time() with self._writeLock: replace_one = self.collection.replace_one insert_one = self.collection.insert_one version = Annotationelement().getNextVersionValue() if '_id' not in annotation: oldversion = None else: if '_annotationId' in annotation: annotation['_id'] = annotation['_annotationId'] # We read the old version from the existing record, because we # don't want to trust that the input _version has not been altered # or is present. oldversion = self.collection.find_one( {'_id': annotation['_id']}).get('_version') annotation['_version'] = version _elementQuery = annotation.pop('_elementQuery', None) annotation.pop('_active', None) annotation.pop('_annotationId', None) def replaceElements(query, doc, *args, **kwargs): Annotationelement().updateElements(doc) elements = doc['annotation'].pop('elements', None) if self._historyEnabled: oldAnnotation = self.collection.find_one(query) if oldAnnotation: oldAnnotation['_annotationId'] = oldAnnotation.pop('_id') oldAnnotation['_active'] = False insert_one(oldAnnotation) ret = replace_one(query, doc, *args, **kwargs) if elements: doc['annotation']['elements'] = elements if not self._historyEnabled: Annotationelement().removeOldElements(doc, oldversion) return ret def insertElements(doc, *args, **kwargs): # When creating an annotation, store the elements first, then store # the annotation without elements, then restore the elements. doc.setdefault('_id', ObjectId()) if doc['annotation'].get('elements') is not None: Annotationelement().updateElements(doc) # If we are inserting, we shouldn't have any old elements, so don't # bother removing them. elements = doc['annotation'].pop('elements', None) ret = insert_one(doc, *args, **kwargs) if elements is not None: doc['annotation']['elements'] = elements return ret with self._writeLock: self.collection.replace_one = replaceElements self.collection.insert_one = insertElements try: result = super().save(annotation, *args, **kwargs) finally: self.collection.replace_one = replace_one self.collection.insert_one = insert_one if _elementQuery: result['_elementQuery'] = _elementQuery annotation.pop('groups', None) self.injectAnnotationGroupSet(annotation) logger.debug('Saved annotation in %5.3fs' % (time.time() - starttime)) events.trigger('large_image.annotations.save_history', { 'annotation': annotation }, asynchronous=True) return result
[docs] def updateAnnotation(self, annotation, updateUser=None): """ Update an annotation. :param annotation: the annotation document to update. :param updateUser: the user who is creating the update. :returns: the annotation document that was updated. """ annotation['updated'] = datetime.datetime.utcnow() annotation['updatedId'] = updateUser['_id'] if updateUser else None annotation = Notification().createNotification( type='large_image_annotation.update', data={'_id': annotation['_id'], 'itemId': annotation['itemId']}, user=User().load(annotation['creatorId'], force=True), expires=datetime.datetime.utcnow() + datetime.timedelta(seconds=1)) return annotation
def _similarElementStructure(self, a, b, parentKey=None): # noqa """ Compare two elements to determine if they are similar enough that if one validates, the other should, too. This is called recursively to validate dictionaries. In general, types must be the same, dictionaries must contain the same keys, arrays must be the same length. The only differences that are allowed are numerical values may be different, ids may be different, and point arrays may contain different numbers of elements. :param a: first element :param b: second element :param parentKey: if set, the key of the dictionary that used for this part of the comparison. :returns: True if the elements are similar. False if they are not. """ # This function exceeds the recommended complexity, but since it is # needs to be relatively fast, breaking it into smaller functions is # probably undesirable. if not isinstance(a, type(b)): return False if isinstance(a, dict): if len(a) != len(b): return False for k in a: if k not in b: return False if k == 'id': if not isinstance(b[k], str) or not self.idRegex.match(b[k]): return False elif parentKey != 'label' or k != 'value': if not self._similarElementStructure(a[k], b[k], k): return False elif isinstance(a, list): if parentKey == 'holes': return all( len(hole) == 3 and # this is faster than checking the instance type, and, if # it raises an exception, it would have failed validation # any way. 1 + hole[0] + hole[1] + hole[2] is not None # isinstance(hole[0], self.numberInstance) and # isinstance(hole[1], self.numberInstance) and # isinstance(hole[2], self.numberInstance) for hlist in b for hole in hlist) if len(a) != len(b): if parentKey not in {'points', 'values'} or len(a) < 2 or len(b) < 2: return False # If this is an array of points, let it pass return all( len(elem) == 3 and # this is faster than checking the instance type, and, if # it raises an exception, it would have failed validation # any way. 1 + elem[0] + elem[1] + elem[2] is not None # isinstance(elem[0], self.numberInstance) and # isinstance(elem[1], self.numberInstance) and # isinstance(elem[2], self.numberInstance) for elem in b) for idx in range(len(a)): if not self._similarElementStructure(a[idx], b[idx], parentKey): return False elif not isinstance(a, self.numberInstance): return a == b # Either a number or the dictionary or list comparisons passed return True
[docs] def validate(self, doc): # noqa startTime = lastTime = time.time() try: # This block could just use the json validator: # jsonschema.validate(doc.get('annotation'), # AnnotationSchema.annotationSchema) # but this is very slow. Instead, validate the main structure and # then validate each element. If sequential elements are similar # in structure, skip validating them. annot = doc.get('annotation') elements = annot.get('elements', []) annot['elements'] = [] self.validatorAnnotation.validate(annot) lastValidatedElement = None lastValidatedElement2 = None for idx, element in enumerate(elements): # Discard element keys beginning with _ for key in list(element): if key.startswith('_'): del element[key] if isinstance(element.get('id'), ObjectId): element['id'] = str(element['id']) # Handle elements with large arrays by checking that a # conversion to a numpy array works keys = None if len(element.get('points', element.get('values', []))) > VALIDATE_ARRAY_LENGTH: key = 'points' if 'points' in element else 'values' try: # Check if the entire array converts in an obvious # manner numpy.array(element[key], dtype=float) keys[key] = element[key] element[key] = element[key][:VALIDATE_ARRAY_LENGTH] except Exception: pass if any(len(h) > VALIDATE_ARRAY_LENGTH for h in element.get('holes', [])): key = 'holes' try: for h in element['holes']: numpy.array(h, dtype=float) keys[key] = element[key] element[key] = [] except Exception: pass try: if (not self._similarElementStructure(element, lastValidatedElement) and not self._similarElementStructure(element, lastValidatedElement2)): self.validatorAnnotationElement.validate(element) lastValidatedElement2 = lastValidatedElement lastValidatedElement = element except TypeError: self.validatorAnnotationElement.validate(element) if keys: element.update(keys) if time.time() - lastTime > 10:'Validated %s of %d elements in %5.3fs', idx + 1, len(elements), time.time() - startTime) lastTime = time.time() annot['elements'] = elements except jsonschema.ValidationError as exp: raise ValidationException(exp) if time.time() - startTime > 10:'Validated in %5.3fs' % (time.time() - startTime)) elementIds = [entry['id'] for entry in doc['annotation'].get('elements', []) if 'id' in entry] if len(set(elementIds)) != len(elementIds): raise ValidationException('Annotation Element IDs are not unique') return doc
[docs] def versionList(self, annotationId, user=None, limit=0, offset=0, sort=(('_version', -1), ), force=False): """ List annotation history entries for a specific annotationId. Only annotations that belong to an existing item that the user is allowed to view are included. If the user is an admin, all annotations will be included. :param annotationId: the annotation to get history for. :param user: the Girder user. :param limit: maximum number of history entries to return. :param offset: skip this many entries. :param sort: the sort method used. Defaults to reverse _id. :param force: if True, don't authenticate the user. :yields: the entries in the list """ if annotationId and not isinstance(annotationId, ObjectId): annotationId = ObjectId(annotationId) # Make sure we have only one of each version, plus apply our filter and # sort. Don't apply limit and offset here, as they are subject to # access control and other effects entries = self.collection.aggregate([ {'$match': {'$or': [{'_id': annotationId}, {'_annotationId': annotationId}]}}, {'$group': {'_id': '$_version', '_doc': {'$first': '$$ROOT'}}}, {'$replaceRoot': {'newRoot': '$_doc'}}, {'$sort': {s[0]: s[1] for s in sort}}]) if not force: entries = self.filterResultsByPermission( cursor=entries, user=user, level=AccessType.READ, limit=limit, offset=offset) return entries
[docs] def getVersion(self, annotationId, version, user=None, force=False, *args, **kwargs): """ Get an annotation history version. This reconstructs the original annotation. :param annotationId: the annotation to get history for. :param version: the specific version to get. :param user: the Girder user. If the user is not an admin, they must have read access on the item and the item must exist. :param force: if True, don't get the user access. """ if annotationId and not isinstance(annotationId, ObjectId): annotationId = ObjectId(annotationId) entry = self.findOne({ '$or': [{'_id': annotationId}, {'_annotationId': annotationId}], '_version': int(version) }, fields=['_id']) if not entry: return None result = self.load(entry['_id'], user=user, force=force, *args, **kwargs) result['_versionId'] = result['_id'] result['_id'] = result.pop('annotationId', result['_id']) return result
[docs] def revertVersion(self, id, version=None, user=None, force=False): """ Revert to a previous version of an annotation. :param id: the annotation id. :param version: the version to revert to. None reverts to the previous version. If the annotation was deleted, this is the most recent version. :param user: the user doing the reversion. :param force: if True don't authenticate the user with the associated item access. """ if version is None: oldVersions = list(Annotation().versionList(id, limit=2, force=True)) if len(oldVersions) >= 1 and oldVersions[0].get('_active') is False: version = oldVersions[0]['_version'] elif len(oldVersions) >= 2: version = oldVersions[1]['_version'] annotation = Annotation().getVersion(id, version, user, force=force) if annotation is None: return # If this is the most recent (active) annotation, don't do anything. # Otherwise, revert it. if not annotation.get('_active', True): if not force: self.requireAccess(annotation, user=user, level=AccessType.WRITE) annotation = Annotation().updateAnnotation(annotation, updateUser=user) return annotation
[docs] def findAnnotatedImages(self, imageNameFilter=None, creator=None, user=None, level=AccessType.ADMIN, force=None, offset=0, limit=0, sort=None, **kwargs): r""" Find images associated with annotations. The list returned by this function is paginated and filtered by access control using the standard girder kwargs. :param imageNameFilter: A string used to filter images by name. An image name matches if it (or a subtoken) begins with this string. Subtokens are generated by splitting by the regex ``[\W_]+`` This filter is case-insensitive. :param creator: Filter by a user who is the creator of the annotation. """ query = {'_active': {'$ne': False}} if creator: query['creatorId'] = creator['_id'] annotations = self.find( query, sort=sort, fields=['itemId']) images = [] imageIds = set() for annotation in annotations: # short cut if the image has already been added to the results if annotation['itemId'] in imageIds: continue try: item = ImageItem().load(annotation['itemId'], level=level, user=user, force=force) except AccessException: item = None # ignore if no such item exists if not item: continue if not self._matchImageName(item['name'], imageNameFilter or ''): continue if len(imageIds) >= offset: images.append(item) imageIds.add(item['_id']) if len(images) == limit: break return images
def _matchImageName(self, imageName, matchString): matchString = matchString.lower() imageName = imageName.lower() if imageName.startswith(matchString): return True tokens = re.split(r'[\W_]+', imageName, flags=re.UNICODE) return any(token.startswith(matchString) for token in tokens)
[docs] def injectAnnotationGroupSet(self, annotation): if 'groups' not in annotation: annotation['groups'] = Annotationelement().getElementGroupSet(annotation) query = { '_id': ObjectId(annotation['_id']) } update = { '$set': { 'groups': annotation['groups'] } } self.collection.update_one(query, update) return annotation
[docs] def setAccessList(self, doc, access, save=False, **kwargs): """ The super class's setAccessList function can save a document. However, annotations which have not loaded elements lose their elements when this occurs, because the validation step of the save function adds an empty element list. By using an update instead of a save, this prevents the problem. """ update = save and '_id' in doc save = save and '_id' not in doc doc = super().setAccessList(doc, access, save=save, **kwargs) if update: self.update({'_id': doc['_id']}, {'$set': {'access': doc['access']}}) return doc
[docs] def removeOldAnnotations(self, remove=False, minAgeInDays=30, keepInactiveVersions=5): # noqa """ Remove annotations that (a) have no item or (b) are inactive and at least (1) a minimum age in days and (2) not the most recent inactive versions. Also remove any annotation elements that don't have associated annotations and are a minimum age in days. :param remove: if False, just report on what would be done. If true, actually remove the annotations and compact the collections. :param minAgeInDays: only work on annotations that are at least this old. This must be greater than or equal to 7. :param keepInactiveVersions: keep at least this many inactive versions of any annotation, regardless of age. """ if (remove and minAgeInDays < 7) or minAgeInDays < 0: raise ValidationException('minAgeInDays must be >= 7') age = datetime.datetime.utcnow() + datetime.timedelta(-minAgeInDays) if keepInactiveVersions < 0: raise ValidationException('keepInactiveVersions mist be non-negative') report = {'fromDeletedItems': 0, 'oldVersions': 0, 'active': 0, 'recentVersions': 0} if remove: report['removedVersions'] = 0 itemIds = {} processedIds = set() annotVersions = set()'Checking old annotations') logtime = time.time() for annot in self.collection.find().sort([('_id', SortDir.ASCENDING)]): if time.time() - logtime > 10:'Still checking old annotations, checked %d with %d versions, %r' % ( len(processedIds), len(annotVersions), report)) logtime = time.time() id = annot.get('_annotationId', annot['_id']) version = annot.get('_version') annotVersions.add(version) if id in processedIds: continue itemId = annot.get('itemId') if itemId not in itemIds: if len(itemIds) > 10000: itemIds = {} itemIds[itemId] = Item().findOne({'_id': itemId}) is not None keep = keepInactiveVersions if itemIds[itemId] else 0 history = self.versionList(id, force=True) for record in history: if record.get('_active') is not False and itemIds[itemId]: report['active'] += 1 continue if keep: keep -= 1 report['recentVersions'] += 1 continue if max(record['created'], record['updated']) < age: if remove: self.collection.delete_one({'_id': record['_id']}) Annotationelement().removeWithQuery({'_version': record['_version']}) report['removedVersions'] += 1 if not itemIds[itemId]: report['fromDeletedItems'] += 1 else: report['oldVersions'] += 1 else: report['recentVersions'] += 1 processedIds.add(id)'Getting distinct element versions') elemVersions = Annotationelement().collection.distinct( '_version', filter={'created': {'$lt': age}})'Got %d distinct element versions' % len(elemVersions)) logtime = time.time() abandonedVersions = set(elemVersions) - set(annotVersions) report['abandonedVersions'] = len(abandonedVersions) if remove: for version in abandonedVersions: if time.time() - logtime > 10:'Removing abandoned versions, %r' % report) logtime = time.time() Annotationelement().removeWithQuery({'_version': version}) report['removedVersions'] += 1'Compacting annotation collection') self.collection.database.command('compact','Compacting annotationelement collection') self.collection.database.command('compact', Annotationelement().name)'Done compacting collections')'Finished checking old annotations, %r' % report) return report
[docs] def setMetadata(self, annotation, metadata, allowNull=False): """ Set metadata on an annotation. A `ValidationException` is thrown in the cases where the metadata JSON object is badly formed, or if any of the metadata keys contains a period ('.'). :param annotation: The annotation to set the metadata on. :type annotation: dict :param metadata: A dictionary containing key-value pairs to add to the annotations meta field :type metadata: dict :param allowNull: Whether to allow `null` values to be set in the annotation's metadata. If set to `False` or omitted, a `null` value will cause that metadata field to be deleted. :returns: the annotation document """ if 'attributes' not in annotation['annotation']: annotation['annotation']['attributes'] = {} # Add new metadata to existing metadata annotation['annotation']['attributes'].update(metadata.items()) # Remove metadata fields that were set to null if not allowNull: toDelete = [k for k, v in metadata.items() if v is None] for key in toDelete: del annotation['annotation']['attributes'][key] self.validateKeys(annotation['annotation']['attributes']) annotation['updated'] = datetime.datetime.utcnow() # Validate and save the annotation return super().save(annotation)
[docs] def deleteMetadata(self, annotation, fields): """ Delete metadata on an annotation. A `ValidationException` is thrown if the metadata field names contain a period ('.') or begin with a dollar sign ('$'). :param annotation: The annotation to delete metadata from. :type annotation: dict :param fields: An array containing the field names to delete from the annotation's meta field :type field: list :returns: the annotation document """ self.validateKeys(fields) if 'attributes' not in annotation['annotation']: annotation['annotation']['attributes'] = {} for field in fields: annotation['annotation']['attributes'].pop(field, None) annotation['updated'] = datetime.datetime.utcnow() return super().save(annotation)