Example #1
    def merge(self, results, min_year, do_asr=True):
        ans = Metadata(_('Unknown'))

        # We assume the shortest title has the least cruft in it
        ans.title = self.length_merge('title', results, null_value=ans.title)

        # No harm in having extra authors, maybe something useful like an
        # editor or translator
        ans.authors = self.length_merge('authors', results,
                null_value=ans.authors, shortest=False)

        # We assume the shortest publisher has the least cruft in it
        ans.publisher = self.length_merge('publisher', results,
                null_value=ans.publisher)

        # We assume the smallest set of tags has the least cruft in it
        ans.tags = self.length_merge('tags', results,
                null_value=ans.tags, shortest=msprefs['fewer_tags'])

        # We assume the longest series has the most info in it
        ans.series = self.length_merge('series', results,
                null_value=ans.series, shortest=False)
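        # Take series_index from whichever result supplied the chosen series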
        for r in results:
            if r.series and r.series == ans.series:
                ans.series_index = r.series_index
                break

        # Average the rating over all sources
        ratings = []
        for r in results:
            rating = r.rating
            if rating and rating > 0 and rating <= 5:
                ratings.append(rating)
        if ratings:
            ans.rating = int(round(sum(ratings)/len(ratings)))

        # Smallest language is likely to be valid
        ans.language = self.length_merge('language', results,
                null_value=ans.language)

        # Choose longest comments
        ans.comments = self.length_merge('comments', results,
                null_value=ans.comments, shortest=False)

        # Published date: if a minimum year was requested, force the date into
        # that year; otherwise keep the earliest pubdate from any source
        if min_year:
            for r in results:
                year = getattr(r.pubdate, 'year', None)
                if year == min_year:
                    ans.pubdate = r.pubdate
                    break
            if getattr(ans.pubdate, 'year', None) == min_year:
                min_date = datetime(min_year, ans.pubdate.month, ans.pubdate.day,
                                    tzinfo=utc_tz)
            else:
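                # No result's pubdate fell in min_year; fall back to an
                # arbitrary early date within that year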
                min_date = datetime(min_year, 1, 2, tzinfo=utc_tz)
            ans.pubdate = min_date
        else:
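            # 3001-01-01 is a sentinel; it survives the loop only if no
            # result had a pubdate at all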
            min_date = datetime(3001, 1, 1, tzinfo=utc_tz)
            for r in results:
                if r.pubdate is not None:
                    candidate = as_utc(r.pubdate)
                    if candidate < min_date:
                        min_date = candidate
            if min_date.year < 3000:
                ans.pubdate = min_date

        # Identifiers: merge identifiers from every source (later results win
        # on conflicts)
        for r in results:
            ans.identifiers.update(r.identifiers)

        # Cover URL: the merged record has a cached cover if any source result does
        ans.has_cached_cover_url = any(getattr(r, 'has_cached_cover_url', False)
                                       for r in results)

        # Merge any other fields with no special handling (random merge)
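        # First gather the set of fields the contributing plugins claim to fill in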
        touched_fields = set()
        for r in results:
            if hasattr(r, 'identify_plugin'):
                touched_fields |= r.identify_plugin.touched_fields

        for f in touched_fields:
            if f.startswith('identifier:') or not ans.is_null(f):
                continue
            setattr(ans, f, self.random_merge(f, results,
                null_value=getattr(ans, f)))

        if do_asr:
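            # average source relevance: the mean of this result's relevance
            # rank within each source that returned it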
            avg = [x.relevance_in_source for x in results]
            avg = sum(avg)/len(avg)
            ans.average_source_relevance = avg

        return ans
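
The helpers length_merge and random_merge are not shown in this example. Below is a minimal sketch of what they might look like, written as methods of the same class as merge and assuming that each entry in results is a Metadata-like object whose fields can be read with getattr; the real implementations may differ in detail.

    def length_merge(self, field, results, null_value=None, shortest=True):
        # Collect every non-empty candidate value for this field, skipping
        # entries that still hold the caller's null_value.
        values = [getattr(r, field, None) for r in results]
        values = [v for v in values if v and v != null_value]
        if not values:
            return null_value
        # Shortest candidate by default (assumed to carry the least cruft),
        # longest when shortest=False (assumed to carry the most information).
        values.sort(key=len, reverse=not shortest)
        return values[0]

    def random_merge(self, field, results, null_value=None):
        # "random" only means no source is preferred for this field; any
        # non-empty value will do, so the first one found is used here.
        values = [getattr(r, field, None) for r in results]
        values = [v for v in values if v and v != null_value]
        return values[0] if values else null_value

With helpers shaped like this, merge reduces every field to a single per-field policy: shortest value, longest value, smallest set, or simply the first non-null value seen.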