Python ElasticSearch.flush Examples

Programming Language: Python

Namespace/Package Name: pyelasticsearch

Class/Type: ElasticSearch

Method/Function: flush

Examples at hotexamples.com: 3

Python ElasticSearch.flush - 3 examples found. These are the top-rated real-world Python examples of pyelasticsearch.ElasticSearch.flush, extracted from open-source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

ElasticSearch(30)

search(30)

create_index(22)

delete_index(21)

index(18)

bulk(17)

bulk_index(15)

index_op(15)

refresh(12)

get(11)

put_mapping(9)

update(5)

update_op(3)

delete_op(3)

get_mapping(3)

delete(3)

status(2)

send_request(2)

open_index(2)

update_settings(2)

close_index(2)

count(2)

multi_get(1)

optimize(1)

health(1)

flush(1)

delete_by_query(1)

delete_all_indexes(1)

delete_all(1)

get_settings(1)

Example #1

Show file

File: create_es.py Project: pombredanne/monolith

def feed(index='monolith', type='downloads', es_port=9200):
    """Fill the monthly ``time_2012-MM`` indexes with random download stats.

    Drops and recreates the twelve indexes ``time_2012-01`` .. ``time_2012-12``
    on the server at ``http://0.0.0.0:<es_port>/``, then, for each of 100
    add-ons, bulk-indexes one randomly generated document per day from
    2012-01-01 through 2012-12-31 inclusive.  Progress dots are written to
    stdout, followed by ``Done!``.

    Args:
        index: Unused by this function; kept so existing callers still work.
        type: Document type handed to ``bulk_index``.  The name shadows the
            builtin but is part of the public signature.
        es_port: TCP port used to build the ElasticSearch URL.
    """
    client = ElasticSearch('http://0.0.0.0:%d/' % es_port)
    platforms = ['Mac OS X', 'Windows 8', 'Ubuntu']

    # indexing a year of data (2012)
    first_day = datetime.datetime(2012, 1, 1)
    last_day = datetime.datetime(2012, 12, 31)
    # The difference between the two dates does not count last_day itself,
    # so add one to make the range inclusive of December 31st.
    num_days = (last_day - first_day).days + 1

    for month in range(1, 13):
        name = 'time_2012-%.2d' % month
        try:
            client.delete_index(name)
        except Exception:
            # Deliberate best effort: any failure to delete (for instance
            # on a first run) is ignored and the index is created below.
            pass
        client.create_index(name,
                            settings={
                                'number_of_shards': 1,
                                'number_of_replicas': 0,
                                'analysis': {
                                    'analyzer': {
                                        'default': {
                                            'type': 'custom',
                                            'tokenizer': 'keyword'
                                        }
                                    }
                                },
                                'store': {
                                    'compress': {
                                        'stored': 'true'
                                    }
                                },
                            })

    # indexing 100 apps
    for add_on in range(100):
        # Group this add-on's documents by month so that each monthly index
        # receives a single bulk request.
        docs = defaultdict(list)
        for delta in range(num_days):
            date = first_day + datetime.timedelta(days=delta)
            docs[date.month].append({
                'date': date,
                'os': random.choice(platforms),
                'downloads_count': random.randint(1000, 1500),
                'users_count': random.randint(10000, 15000),
                'add_on': add_on + 1,
            })
        for month, values in docs.items():
            client.bulk_index('time_2012-%.2d' % month, type, values)
            sys.stdout.write('.')
            sys.stdout.flush()

    # Request a merge of every time_* index down to one segment, then flush.
    client.optimize('time_*', max_num_segments=1, wait_for_merge=True)
    client.flush()
    sys.stdout.write('\nDone!\n')

Example #2

Show file

File: create_es.py Project: mozilla/monolith.js

def feed(index='monolith', type='downloads', es_port=9200):
    """Recreate the 2012 monthly indexes and load random sample documents.

    For every month of 2012 the index ``time_2012-MM`` is deleted (errors
    ignored) and created again.  Then 100 add-ons each get one random
    document for every day of 2012, December 31st included, sent with one
    ``bulk_index`` call per month.  A dot is printed to stdout after each
    bulk call and ``Done!`` at the end.

    Args:
        index: Not used in the body; retained for backward compatibility.
        type: Document type passed through to ``bulk_index`` (shadows the
            builtin, but renaming it would break keyword callers).
        es_port: Port inserted into ``http://0.0.0.0:<port>/``.
    """
    client = ElasticSearch('http://0.0.0.0:%d/' % es_port)
    platforms = ['Mac OS X', 'Windows 8', 'Ubuntu']

    # indexing a year of data (2012)
    first_day = datetime.datetime(2012, 1, 1)
    last_day = datetime.datetime(2012, 12, 31)
    # (last_day - first_day).days is 365 and would stop at December 30th;
    # the extra day makes the loop below reach last_day.
    total_days = (last_day - first_day).days + 1

    for month in range(1, 13):
        name = 'time_2012-%.2d' % month
        try:
            client.delete_index(name)
        except Exception:
            # Best effort on purpose: a failed delete must not stop the
            # load; the index is (re)created right after.
            pass
        client.create_index(name, settings={
            'number_of_shards': 1,
            'number_of_replicas': 0,
            'analysis': {'analyzer': {'default': {
                'type': 'custom', 'tokenizer': 'keyword'
            }}},
            'store': {'compress': {'stored': 'true'}},
        })

    # indexing 100 apps
    for add_on in range(100):
        # month number -> documents generated for that month
        docs = defaultdict(list)
        for delta in range(total_days):
            date = first_day + datetime.timedelta(days=delta)
            data = {'date': date,
                    'os': random.choice(platforms),
                    'downloads_count': random.randint(1000, 1500),
                    'users_count': random.randint(10000, 15000),
                    'add_on': add_on + 1}
            docs[date.month].append(data)
        for month, values in docs.items():
            client.bulk_index('time_2012-%.2d' % month, type, values)
            sys.stdout.write('.')
            sys.stdout.flush()

    # Ask for each time_* index to be merged to a single segment, then flush.
    client.optimize('time_*', max_num_segments=1, wait_for_merge=True)
    client.flush()
    sys.stdout.write('\nDone!\n')

Example #3

Show file

File: GOParser.py Project: ENCODE-DCC/encodedES

# For every term: extend its two closure lists, de-duplicate them, add the
# term itself, attach the slim annotations and index the resulting document.
# `terms`, `connection`, `index_name`, `doc_type_name`, `count` and the
# helper functions are defined earlier in the file (not shown here).
for term in terms:

    # Single-argument print(...) produces the same output on Python 2 and 3;
    # the former print statements were a SyntaxError on Python 3.
    print(term)
    words = iterativeChildren(terms[term]['data'])
    terms[term]['closure'].extend(words)

    d = iterativeDev(terms[term]['data_with_develops_from'])
    terms[term]['closure_with_develops_from'].extend(d)

    # Drop duplicates (list order is not preserved by set()), then append
    # the term itself after de-duplication.
    terms[term]['closure'] = list(set(terms[term]['closure']))
    terms[term]['closure'].append(term)

    terms[term]['closure_with_develops_from'] = list(set(terms[term]['closure_with_develops_from']))
    terms[term]['closure_with_develops_from'].append(term)

    terms[term]['systems'] = getSystemSlims(term)
    terms[term]['organs'] = getOrganSlims(term)
    terms[term]['developmental'] = getDevelopmentSlims(term)

    # Indexing the data in ElasticSearch
    connection.index(index_name, doc_type_name, terms[term], id=term)
    if count % 1000 == 0:
        connection.flush(index=index_name)
    # NOTE(review): refresh() runs after every document while flush() runs
    # only when count is a multiple of 1000 -- confirm the per-document
    # refresh is intentional.
    connection.refresh()
    count = count + 1

# print("") emits one blank line on both Python 2 and 3, like the bare
# `print` statement did on Python 2.
print("")
print("Total GO Terms indexed " + str(count))