コード例 #1
0
ファイル: media.py プロジェクト: pixelsforhumans/giza
    def process_media_row(media, current_id):
        id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # for now, ignore Microfilm and Document media types
        if (media_type_key in [4, 5]):
            return (media, current_id)

        if id != current_id:
            save(media)
            current_id = id
            media = {}
            if elasticsearch_connection.item_exists(id, media_type):
                media = elasticsearch_connection.get_item(id, media_type)
            else:
                print "%s could not be found!" % id
                return (media, current_id)
        if 'relateditems' not in media:
            media['relateditems'] = {}

        constituent_id = row[indices['constituent_id_index']]
        display_name = row[indices['display_name_index']]
        description = row[indices['remarks_index']] if row[
            indices['remarks_index']] != "NULL" else ""
        display_date = ""
        if row[indices['display_date_index']] != "NULL":
            display_date = row[indices['display_date_index']]
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])

        constituent_dict = {}
        role = row[indices['role_index']]
        # update the set of roles for this media
        if role not in media['roles']:
            # make sure Photographer is first
            if role == "Photographer":
                media['roles'].insert(0, role)
            else:
                media['roles'].append(role)

        constituent_dict['role'] = row[indices['role_index']]
        constituent_dict['roleid'] = row[indices['role_id_index']]
        constituent_dict['id'] = constituent_id
        constituent_dict['displayname'] = display_name
        constituent_dict['displaydate'] = display_date
        constituent_dict['displaytext'] = display_name
        constituent_dict['description'] = description
        constituent_dict['thumbnail'] = thumbnail_url

        constituent_type_key = int(row[indices['constituent_type_id_index']])
        constituent_type = CONSTITUENTTYPES.get(constituent_type_key)
        if constituent_type not in media['relateditems']:
            media['relateditems'][constituent_type] = []
        media['relateditems'][constituent_type].append(constituent_dict)
        # keep the related items sorted
        media['relateditems'][constituent_type].sort(
            key=operator.itemgetter('displaytext'))

        return (media, current_id)
コード例 #2
0
ファイル: media.py プロジェクト: pixelsforhumans/giza
    def process_media_row(media, current_id):
        id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # for now, ignore Microfilm and Document media types
        if (media_type_key in [4, 5]):
            return (media, current_id)

        if id != current_id:
            save(media)
            current_id = id
            media = {}

        media['id'] = id
        media['mediatype'] = media_type
        number = "" if row[indices['rendition_number_index']].lower(
        ) == "null" else row[indices['rendition_number_index']]
        media['number'] = number
        prefix_idx = number.find('_')
        media['allnumbers'] = list(
            set([
                number, number[number.find('_') + 1:],
                number[number.find('_') + 1:number.rfind('_')],
                "".join(number.split()), "".join(number.split('_'))
            ]))
        media['description'] = "" if row[indices['description_index']].lower(
        ) == "null" else row[indices['description_index']]
        mediaview = "" if row[indices['media_view_index']].lower(
        ) == "null" else row[indices['media_view_index']]
        caption = "" if row[indices['caption_index']].lower(
        ) == "null" else row[indices['caption_index']]
        subjects = ": ".join([mediaview, caption])
        media['mediaview'] = mediaview
        media['subjects'] = subjects
        media['displaytext'] = subjects
        media['remarks'] = "" if row[indices['remarks_index']].lower(
        ) == "null" else row[indices['remarks_index']]
        media['department'] = "" if row[indices['department_index']].lower(
        ) == "null" else row[indices['department_index']]
        media['date'] = "" if row[indices['date_index']].lower(
        ) == "null" else row[indices['date_index']]
        media['problemsquestions'] = "" if row[
            indices['problems_index']].lower() == "null" else row[
                indices['problems_index']]
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])
        main_url = get_media_url(row[indices['main_path_index']],
                                 row[indices['main_file_index']])
        media['primarydisplay'] = {
            'thumbnail': thumbnail_url,
            'main': main_url
        }
        media['roles'] = []

        return (media, current_id)
コード例 #3
0
ファイル: media.py プロジェクト: pixelsforhumans/giza
    def process_media_row(media, current_id):
        id = row[indices['media_id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # for now, ignore Microfilm and Document media types
        if (media_type_key in [4, 5]):
            return (media, current_id)

        if id != current_id:
            save(media)
            current_id = id
            media = {}
            if elasticsearch_connection.item_exists(id, media_type):
                media = elasticsearch_connection.get_item(id, media_type)
            else:
                print "%s could not be found!" % id
                return (media, current_id)

        if 'relateditems' not in media:
            media['relateditems'] = {}
        classification_key = int(row[indices['classification_id_index']])
        classification = CLASSIFICATIONS.get(classification_key)
        object_id = int(row[indices['object_id_index']])
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])

        date = "" if row[indices['object_date_index']].lower(
        ) == "null" else row[indices['object_date_index']]
        object_title = row[indices['object_title_index']]
        object_number = row[indices['object_number_index']]
        if classification == "diarypages" and object_title.lower() == "null":
            idx = object_number.find('_')
            object_title = object_number[idx + 1:]
        if object_title.lower() == "null":
            object_title = "[No Title]"

        if classification not in media['relateditems']:
            media['relateditems'][classification] = []
        media['relateditems'][classification].append({
            'id': object_id,
            'title': object_title,
            'displaytext': object_title,
            'classificationid': classification_key,
            'number': object_number,
            'date': date,
            'thumbnail': thumbnail_url
        })
        # keep the related items sorted
        media['relateditems'][classification].sort(
            key=operator.itemgetter('displaytext'))

        return (media, current_id)
コード例 #4
0
ファイル: objects.py プロジェクト: rsinghal/giza
	def process_object_row(object, current_id):
		id = row[indices['id_index']]
		classification_key = int(row[indices['classification_id_index']])
		classification = CLASSIFICATIONS.get(classification_key)

		if id != current_id:
			# may have multiple rows for one object because of many related constituents
			save(object)
			current_id = id
			object = {}
			if elasticsearch_connection.item_exists(id, classification):
				object = elasticsearch_connection.get_item(id, classification)
			else:
				print "%s could not be found!" % id
				return(object, current_id)
		if 'relateditems' not in object:
			object['relateditems'] = {}

		media_type_key = int(row[indices['media_type_id_index']])
		media_type = MEDIATYPES.get(media_type_key)
		media_master_id = row[indices['media_master_id_index']]
		thumbnail_url = get_media_url(row[indices['thumb_path_index']], row[indices['thumb_file_index']])
		main_url = get_media_url(row[indices['main_path_index']], row[indices['main_file_index']])
		display_text = row[indices['caption_index']]

		# this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
		# so, make sure we are only using videos that are mp4s
		if media_type_key == 3:
			if not row[indices['main_file_index']].endswith('mp4'):
				return(object, current_id)

		if media_type not in object['relateditems']:
			object['relateditems'][media_type] = []

		if media_type == 'photos':
			object['hasphoto'] = "Yes"
		# add primary photo as a top level item as well
		if row[indices['primary_display_index']] == '1':
			object['primarydisplay'] = {
			'thumbnail' : thumbnail_url,
			'main' : main_url,
			'displaytext' : display_text
			}
		if not (classification == '3dmodels' and media_type == '3dmodels'):
			object['relateditems'][media_type].append({
				'id' : media_master_id,
				'displaytext' : display_text,
				'primarydisplay' : True if row[indices['primary_display_index']] == '1' else False,
				'thumbnail' : thumbnail_url,
				'main' : main_url
				})
		return(object, current_id)
コード例 #5
0
ファイル: media.py プロジェクト: artshumrc/giza
    def process_media_row(media, current_id):
        id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # for now, ignore Microfilm and Document media types
        if (media_type_key in [4, 5]):
            return (media, current_id)

        if id != current_id:
            save(media)
            current_id = id
            media = {}
            if elasticsearch_connection.item_exists(id, media_type,
                                                    ELASTICSEARCH_INDEX):
                media = elasticsearch_connection.get_item(
                    id, media_type, ELASTICSEARCH_INDEX)
            else:
                print("%s could not be found!" % id)
                return (media, current_id)
        if 'relateditems' not in media:
            media['relateditems'] = {}

        site_id = row[indices['site_id_index']]
        site_name = row[indices['site_name_index']]
        site_number = row[indices['site_number_index']]
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])
        drs_id = "" if row[indices['drs_id']].lower() == "null" else row[
            indices['drs_id']]
        if not thumbnail_url and drs_id:
            thumbnail_url = create_thumbnail_url(drs_id)

        site_dict = {}
        site_dict['id'] = site_id
        site_dict['sitename'] = site_name
        site_dict['sitenumber'] = site_number
        site_dict['displaytext'] = site_number
        site_dict['thumbnail'] = thumbnail_url

        if 'sites' not in media['relateditems']:
            media['relateditems']['sites'] = []
        media['relateditems']['sites'].append(site_dict)
        # keep the related items sorted
        media['relateditems']['sites'].sort(
            key=operator.itemgetter('displaytext'))

        return (media, current_id)
コード例 #6
0
ファイル: sites.py プロジェクト: rsinghal/giza
	def process_site_row(site, current_id):
		site_id = row[indices['site_id_index']]
		#if site_id not in SAMPLE_SITES:
		#	continue
		if site_id != current_id:
			# will likely have multiple rows for one site because of many related photos
			# only get a new site if we have a new site id, but first save old site to elasticsearch
			save(site)
			current_id = site_id
			site = {}
			if elasticsearch_connection.item_exists(site_id, 'sites'):
				site = elasticsearch_connection.get_item(site_id, 'sites')
			else:
				print "%s could not be found!" % site_id
				return(site, current_id)
		if 'relateditems' not in site:
			site['relateditems'] = {}

		media_type_key = int(row[indices['media_type_id_index']])
		media_type = MEDIATYPES.get(media_type_key)
		media_master_id = row[indices['media_master_id_index']]
		thumbnail_url = get_media_url(row[indices['thumb_path_index']], row[indices['thumb_file_index']])
		main_url = get_media_url(row[indices['main_path_index']], row[indices['main_file_index']])
		display_text = row[indices['caption_index']]

		# this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
		# so, make sure we are only using videos that are mp4s
		if media_type_key == 3:
			if not row[indices['main_file_index']].endswith('mp4'):
				return(site, current_id)

		if media_type not in site['relateditems']:
			site['relateditems'][media_type] = []
		# add primary photo as a top level item as well
		if row[indices['primary_display_index']] == '1':
			site['primarydisplay'] = {
			'thumbnail' : thumbnail_url,
			'main' : main_url,
			'displaytext' : display_text
			}
		site['relateditems'][media_type].append({
			'id' : media_master_id,
			'displaytext' : display_text,
			'primarydisplay' : True if row[indices['primary_display_index']] == '1' else False,
			'thumbnail' : thumbnail_url,
			'main' : main_url
			})
		return(site, current_id)
コード例 #7
0
ファイル: constituents.py プロジェクト: rsinghal/giza
    def process_constituent_row(constituent, current_id):
        constituent_id = row[indices["constituent_id_index"]]
        type_key = int(row[indices["type_id_index"]])
        type = CONSTITUENTTYPES.get(type_key)

        if constituent_id != current_id:
            # will likely have multiple rows for one constituent because of many related photos
            # only get a new constituent if we have a new constituent id, but first save old constituent to elasticsearch
            save(constituent)
            current_id = constituent_id
            constituent = {}
            if elasticsearch_connection.item_exists(constituent_id, type):
                constituent = elasticsearch_connection.get_item(constituent_id, type)
            else:
                print "%s could not be found!" % constituent_id
                return (constituent, current_id)
        if "relateditems" not in constituent:
            constituent["relateditems"] = {}

        media_type_key = int(row[indices["media_type_id_index"]])
        media_type = MEDIATYPES.get(media_type_key)
        media_master_id = row[indices["media_master_id_index"]]
        thumbnail_url = get_media_url(row[indices["thumb_path_index"]], row[indices["thumb_file_index"]])
        main_url = get_media_url(row[indices["main_path_index"]], row[indices["main_file_index"]])
        display_text = row[indices["caption_index"]]

        # this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
        # so, make sure we are only using videos that are mp4s
        if media_type_key == 3:
            if not row[indices["main_file_index"]].endswith("mp4"):
                return (constituent, current_id)

        if media_type not in constituent["relateditems"]:
            constituent["relateditems"][media_type] = []
            # add primary photo as a top level item as well
        if row[indices["primary_display_index"]] == "1":
            constituent["primarydisplay"] = {"thumbnail": thumbnail_url, "main": main_url, "displaytext": display_text}
        constituent["relateditems"][media_type].append(
            {
                "id": media_master_id,
                "displaytext": display_text,
                "primarydisplay": True if row[indices["primary_display_index"]] == "1" else False,
                "thumbnail": thumbnail_url,
                "main": main_url,
            }
        )
        return (constituent, current_id)
コード例 #8
0
ファイル: media.py プロジェクト: artshumrc/giza
    def process_media_row(media, current_id):
        id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # for now, ignore Microfilm and Document media types
        if (media_type_key in [4, 5]):
            return (media, current_id)

        if id != current_id:
            save(media)
            current_id = id
            media = {}
            if elasticsearch_connection.item_exists(id, media_type,
                                                    ELASTICSEARCH_INDEX):
                media = elasticsearch_connection.get_item(
                    id, media_type, ELASTICSEARCH_INDEX)
            else:
                print("%s could not be found!" % id)
                return (media, current_id)
        if 'relateditems' not in media:
            media['relateditems'] = {}

        reference_id = row[indices['reference_id_index']]
        title = row[indices['title_index']]
        boiler_text = row[indices['boiler_text_index']]
        date = row[indices['date_index']]
        main_url = get_media_url(row[indices['path_index']],
                                 row[indices['file_index']])

        if 'pubdocs' not in media['relateditems']:
            media['relateditems']['pubdocs'] = []
        media['relateditems']['pubdocs'].append({
            'id': reference_id,
            'boilertext': boiler_text,
            'displaytext': boiler_text,
            'date': date,
            'url': main_url
        })
        # keep the related items sorted
        media['relateditems']['pubdocs'].sort(
            key=operator.itemgetter('displaytext'))

        return (media, current_id)
コード例 #9
0
    def process_media_row(manifest, current_id):
        media_id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)
        manifest_id = media_type + '-' + media_id

        # ignore non-photos, if they somehow managed to show up in the query results
        if media_type_key != 1:
            return (manifest, current_id)

        if manifest_id != current_id:
            save(manifest)
            current_id = manifest_id
            manifest = {}
            if elasticsearch_connection.item_exists(manifest_id, 'manifest',
                                                    ELASTICSEARCH_INDEX):
                manifest = elasticsearch_connection.get_item(
                    manifest_id, 'manifest', ELASTICSEARCH_INDEX)
            else:
                print("%s could not be found!" % manifest_id)
                return (manifest, current_id)

        role = "" if row[indices['role_index']].lower() == "null" else row[
            indices['role_index']]
        display_name = "" if row[indices['display_name_index']].lower(
        ) == "null" else row[indices['display_name_index']]
        display_date = "" if row[indices['display_date_index']].lower(
        ) == "null" else row[indices['display_date_index']]

        if display_date:
            value = display_name + ", " + display_date
        else:
            value = display_name
        manifest['manifest']['metadata'].append({
            'label': role,
            'value': value
        })

        return (manifest, current_id)
コード例 #10
0
ファイル: sites.py プロジェクト: artshumrc/giza
    def process_site_row(site, current_id):
        site_id = row[indices['site_id_index']]
        #if site_id not in SAMPLE_SITES:
        #	continue
        if site_id != current_id:
            # will likely have multiple rows for one site because of many related photos
            # only get a new site if we have a new site id, but first save old site to elasticsearch
            save(site)
            current_id = site_id
            site = {}
            if elasticsearch_connection.item_exists(site_id, 'sites',
                                                    ELASTICSEARCH_INDEX):
                site = elasticsearch_connection.get_item(
                    site_id, 'sites', ELASTICSEARCH_INDEX)
            else:
                print("%s could not be found!" % site_id)
                return (site, current_id)
        if 'relateditems' not in site:
            site['relateditems'] = {}

        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)
        number = "" if row[indices['rendition_number_index']].lower(
        ) == "null" else row[indices['rendition_number_index']]
        description = "" if row[indices['description_index']].lower(
        ) == "null" else row[indices['description_index']]
        mediaview = "" if row[indices['media_view_index']].lower(
        ) == "null" else row[indices['media_view_index']]
        caption = "" if row[indices['caption_index']].lower(
        ) == "null" else row[indices['caption_index']]
        display_text = ": ".join([mediaview, caption])
        media_master_id = row[indices['media_master_id_index']]
        main_url = get_media_url(row[indices['main_path_index']],
                                 row[indices['main_file_index']])
        drs_id = "" if row[indices['drs_id']].lower() == "null" else row[
            indices['drs_id']]
        has_manifest = False if drs_id == "" else True
        primary_display = True if row[
            indices['primary_display_index']] == '1' else False
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])
        if not thumbnail_url and drs_id:
            thumbnail_url = create_thumbnail_url(drs_id)

        # this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
        # so, make sure we are only using videos that are mp4s
        if media_type_key == 3:
            if not row[indices['main_file_index']].endswith('mp4'):
                return (site, current_id)

        if media_type not in site['relateditems']:
            site['relateditems'][media_type] = []
        # add primary photo as a top level item as well
        if primary_display:
            site['primarydisplay'] = {
                'thumbnail': thumbnail_url,
                'main': main_url,
                'displaytext': display_text,
                'number': number,
                'description': description,
                'has_manifest': has_manifest,
                'media_id': media_master_id
            }
        site['relateditems'][media_type].append({
            'id': media_master_id,
            'displaytext': display_text,
            'primarydisplay': primary_display,
            'thumbnail': thumbnail_url,
            'main': main_url,
            'number': number,
            'description': description,
            'has_manifest': has_manifest,
            'drs_id': drs_id
        })

        if has_manifest:
            object = elasticsearch_connection.get_item(
                media_type + '-' + media_master_id, 'manifest',
                ELASTICSEARCH_IIIF_INDEX)
            resource = object['manifest']['sequences'][0]['canvases'][0][
                'images'][0]['resource']
            canvas_label = object['manifest']['description']
            canvas_metadata = object['manifest'][
                'metadata']  #add photo manifest-level metadata as canvas-level metadata for site

            if site_id not in SITE_RELATIONS.keys():
                metadata = add_metadata_to_manifest(site)

                SITE_RELATIONS[site_id] = {
                    'description': site['description'],
                    'label': site['displaytext'],
                    'resources': [resource],
                    'drs_ids': [drs_id],
                    'canvas_labels': [canvas_label],
                    'canvas_metadatas': [canvas_metadata],
                    'metadata': metadata
                }
            else:
                SITE_RELATIONS[site_id]['resources'].append(resource)
                SITE_RELATIONS[site_id]['drs_ids'].append(drs_id)
                SITE_RELATIONS[site_id]['canvas_labels'].append(canvas_label)
                SITE_RELATIONS[site_id]['canvas_metadatas'].append(
                    canvas_metadata)
            if primary_display:
                SITE_RELATIONS[site_id]['startCanvas'] = drs_id

        return (site, current_id)
コード例 #11
0
ファイル: objects.py プロジェクト: pixelsforhumans/giza
    def process_object_row(object, current_id):
        id = row[indices['id_index']]
        classification_key = int(row[indices['classification_id_index']])
        classification = CLASSIFICATIONS.get(classification_key)

        if id != current_id:
            # may have multiple rows for one object because of many related constituents
            save(object)
            current_id = id
            object = {}
            if elasticsearch_connection.item_exists(id, classification):
                object = elasticsearch_connection.get_item(id, classification)
            else:
                print "%s could not be found!" % id
                return (object, current_id)
        if 'relateditems' not in object:
            object['relateditems'] = {}

        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)
        number = "" if row[indices['rendition_number_index']].lower(
        ) == "null" else row[indices['rendition_number_index']]
        media_master_id = row[indices['media_master_id_index']]
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])
        main_url = get_media_url(row[indices['main_path_index']],
                                 row[indices['main_file_index']])
        description = "" if row[indices['description_index']].lower(
        ) == "null" else row[indices['description_index']]
        mediaview = "" if row[indices['media_view_index']].lower(
        ) == "null" else row[indices['media_view_index']]
        caption = "" if row[indices['caption_index']].lower(
        ) == "null" else row[indices['caption_index']]
        display_text = ": ".join([mediaview, caption])
        # this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
        # so, make sure we are only using videos that are mp4s
        if media_type_key == 3:
            if not row[indices['main_file_index']].endswith('mp4'):
                return (object, current_id)

        if media_type not in object['relateditems']:
            object['relateditems'][media_type] = []

        if media_type == 'photos':
            object['hasphoto'] = "Yes"
        # add primary photo as a top level item as well
        if row[indices['primary_display_index']] == '1':
            object['primarydisplay'] = {
                'thumbnail': thumbnail_url,
                'main': main_url,
                'displaytext': display_text,
                'number': number,
                'description': description
            }
        if not (classification == '3dmodels' and media_type == '3dmodels'):
            object['relateditems'][media_type].append({
                'id':
                media_master_id,
                'displaytext':
                display_text,
                'primarydisplay':
                True
                if row[indices['primary_display_index']] == '1' else False,
                'thumbnail':
                thumbnail_url,
                'main':
                main_url,
                'number':
                number,
                'description':
                description
            })
        return (object, current_id)
コード例 #12
0
ファイル: sites.py プロジェクト: pixelsforhumans/giza
    def process_site_row(site, current_id):
        site_id = row[indices['site_id_index']]
        #if site_id not in SAMPLE_SITES:
        #	continue
        if site_id != current_id:
            # will likely have multiple rows for one site because of many related photos
            # only get a new site if we have a new site id, but first save old site to elasticsearch
            save(site)
            current_id = site_id
            site = {}
            if elasticsearch_connection.item_exists(site_id, 'sites'):
                site = elasticsearch_connection.get_item(site_id, 'sites')
            else:
                print "%s could not be found!" % site_id
                return (site, current_id)
        if 'relateditems' not in site:
            site['relateditems'] = {}

        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)
        number = "" if row[indices['rendition_number_index']].lower(
        ) == "null" else row[indices['rendition_number_index']]
        description = "" if row[indices['description_index']].lower(
        ) == "null" else row[indices['description_index']]
        mediaview = "" if row[indices['media_view_index']].lower(
        ) == "null" else row[indices['media_view_index']]
        caption = "" if row[indices['caption_index']].lower(
        ) == "null" else row[indices['caption_index']]
        display_text = ": ".join([mediaview, caption])
        media_master_id = row[indices['media_master_id_index']]
        thumbnail_url = get_media_url(row[indices['thumb_path_index']],
                                      row[indices['thumb_file_index']])
        main_url = get_media_url(row[indices['main_path_index']],
                                 row[indices['main_file_index']])

        # this is a bit of a hack because the MediaFormats for videos (in the TMS database) does not correctly identify the type of video
        # so, make sure we are only using videos that are mp4s
        if media_type_key == 3:
            if not row[indices['main_file_index']].endswith('mp4'):
                return (site, current_id)

        if media_type not in site['relateditems']:
            site['relateditems'][media_type] = []
        # add primary photo as a top level item as well
        if row[indices['primary_display_index']] == '1':
            site['primarydisplay'] = {
                'thumbnail': thumbnail_url,
                'main': main_url,
                'displaytext': display_text,
                'number': number,
                'description': description
            }
        site['relateditems'][media_type].append({
            'id':
            media_master_id,
            'displaytext':
            display_text,
            'primarydisplay':
            True if row[indices['primary_display_index']] == '1' else False,
            'thumbnail':
            thumbnail_url,
            'main':
            main_url,
            'number':
            number,
            'description':
            description
        })
        return (site, current_id)
コード例 #13
0
    def process_media_row():
        media_id = row[indices['id_index']]
        media_type_key = int(row[indices['media_type_id_index']])
        media_type = MEDIATYPES.get(media_type_key)

        # ignore non-photos, if they somehow managed to show up in the query results
        if media_type_key != 1:
            return

        description = "" if row[indices['description_index']].lower(
        ) == "null" else row[indices['description_index']]
        mediaview = "" if row[indices['media_view_index']].lower(
        ) == "null" else row[indices['media_view_index']]
        caption = "" if row[indices['caption_index']].lower(
        ) == "null" else row[indices['caption_index']]
        subjects = ": ".join([mediaview, caption])
        drs_id = "" if row[indices['drs_id']].lower() == "null" else row[
            indices['drs_id']]
        number = "" if row[indices['rendition_number_index']].lower(
        ) == "null" else row[indices['rendition_number_index']]
        department = "" if row[indices['department_index']].lower(
        ) == "null" else row[indices['department_index']]
        date = "" if row[indices['date_index']].lower() == "null" else row[
            indices['date_index']]
        problemsquestions = "" if row[indices['problems_index']].lower(
        ) == "null" else row[indices['problems_index']]
        manifest_id = media_type + '-' + media_id

        metadata = []
        if number:
            metadata.append({'label': 'ID', 'value': number})
        if department:
            metadata.append({'label': 'Department', 'value': department})
        if subjects:
            metadata.append({'label': 'Subjects', 'value': subjects})
        if date:
            metadata.append({'label': 'Date', 'value': date})
        if problemsquestions:
            metadata.append({
                'label': 'Problems/Questions',
                'value': problemsquestions
            })

        if description == "":
            description = caption

        manifest_ob = {
            "manifest_id": manifest_id,
            "drs_id": drs_id,
            "description": description,
            "label": mediaview,
            "metadata": metadata
        }

        ## see if manifest exists to grab the existing resource data so we can avoid checking the CSV file or doing a network call to IDS
        if elasticsearch_connection.item_exists(media_type + '-' + media_id,
                                                'manifest',
                                                ELASTICSEARCH_INDEX):
            existing_manifest = elasticsearch_connection.get_item(
                media_type + '-' + media_id, 'manifest', ELASTICSEARCH_INDEX)
            resource = existing_manifest['manifest']['sequences'][0][
                'canvases'][0]['images'][0]['resource']
            if drs_id in resource['@id']:
                manifest_ob['resource'] = resource

        object = {
            "id": manifest_id,
            "manifest": generate_iiif_manifest(manifest_ob)
        }
        save(object)