Example #1
    def recursiveLevenshtein(self, mode, new_fragments,
                             words_to_substitute_in_new, old_list, start_after,
                             end_before):

        if not words_to_substitute_in_new:
            return

        words_to_substitute_in_old = old_list[start_after + 1:end_before]
        if words_to_substitute_in_old:

            distance_matrix = Utils.dtw(words_to_substitute_in_new,
                                        words_to_substitute_in_old)
            index = self.findMostSimilarWordIndex(distance_matrix,
                                                  words_to_substitute_in_new,
                                                  words_to_substitute_in_old)
            index_to_append = start_after + 1 + index[1]
            fragment_to_append = self.getFragmentID(index_to_append)

            if index[0] != 0:  # at least one word remains to the left of the match
                left = words_to_substitute_in_new[:index[0]]
                self.recursiveLevenshtein(False, new_fragments, left, old_list,
                                          start_after, index_to_append)

            if mode:  # append to the right of the fragment's current content
                new_fragments[fragment_to_append] += words_to_substitute_in_new[index[0]] + " "
            else:  # prepend to the left of the fragment's current content
                new_fragments[fragment_to_append] = (words_to_substitute_in_new[index[0]] + " " +
                                                     new_fragments[fragment_to_append])

            if len(words_to_substitute_in_new) - 1 > index[0]:  # at least one word remains to the right of the match
                right = words_to_substitute_in_new[index[0] + 1:]
                self.recursiveLevenshtein(True, new_fragments, right, old_list,
                                          index_to_append, end_before)

        else:  # add the remaining new words
            fragment_to_append = self.getFragmentID(start_after + 1)
            for word in words_to_substitute_in_new:
                new_fragments[fragment_to_append] += word + " "
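
Neither example shows `Utils.dtw` itself; both only assume that it returns a matrix whose rows correspond to the new words and whose columns correspond to the old words, with a word-level Levenshtein distance in each cell (0 marking an exact match). Below is a minimal sketch under that assumption; the helper names `word_levenshtein` and `dtw` are chosen here purely for illustration and are not taken from the original project.

import numpy as np


def word_levenshtein(a, b):
    # classic dynamic-programming edit distance between two words
    previous_row = list(range(len(b) + 1))
    for i, char_a in enumerate(a, 1):
        current_row = [i]
        for j, char_b in enumerate(b, 1):
            current_row.append(min(previous_row[j] + 1,                        # deletion
                                   current_row[j - 1] + 1,                     # insertion
                                   previous_row[j - 1] + (char_a != char_b)))  # substitution
        previous_row = current_row
    return previous_row[-1]


def dtw(new_list, old_list):
    # rows -> new words, columns -> old words, matching the loops in the examples
    matrix = np.zeros((len(new_list), len(old_list)), dtype=int)
    for row, new_word in enumerate(new_list):
        for col, old_word in enumerate(old_list):
            matrix[row, col] = word_levenshtein(new_word, old_word)
    return matrix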
Example #2
    def updateWithDynamicTimeWarping(self, new_paragraph):

        old_paragraph = self.getParagraph()
        if old_paragraph != new_paragraph:  # only update if the paragraph actually changed
            if not self.fragments:  # safety check: inserting into an empty paragraph is not supported
                print("Warning! Inserting into empty paragraphs is not available.")
            elif not new_paragraph:  # empty input, so all fragments must be erased
                self.eraseFragments()
            elif len(self.fragments) == 1:  # only one fragment, so there is no problem (optimal case)
                self.fragments[0] = new_paragraph
            else:  # more than one fragment, so this is where the fun begins

                old_paragraph = self.createSplitableParagraph()
                old_list = old_paragraph.split(" ")  # init word lists
                new_list = new_paragraph.split(" ")
                # run DTW, based on the Levenshtein edit distance
                distance_matrix = Utils.dtw(new_list, old_list)
                self.calculateWordFreqs()

                new_fragments = [""] * len(self.fragments)

                depth_limit = 0  # limit to save time and to avoid false matches caused by repeated words
                actual_fragment = 0  # index of the current fragment, kept for later use
                last_assigned_from_old = -1  # index of the old word handled at the last match

                for col_index in range(len(distance_matrix[0])):  # col_index -> old words
                    for row_index in range(depth_limit, len(distance_matrix)):  # row_index -> new words

                        if distance_matrix[row_index, col_index] == 0:  # a Levenshtein distance of 0 means the words are identical

                            # get the original fragment of the matched word
                            actual_fragment = self.getFragmentID(col_index)
                            # add the new words that precede the match
                            self.alignAddedWords(new_fragments, new_list, old_list,
                                                 actual_fragment, last_assigned_from_old,
                                                 col_index, depth_limit, row_index)

                            new_fragments[actual_fragment] += old_list[col_index] + " "  # add the matched word

                            last_assigned_from_old = col_index
                            depth_limit = row_index + 1  # new row limit: rows before it could only yield "fake" matches caused by repeated words
                            break

                self.alignAddedWords(new_fragments, new_list, old_list,
                                     actual_fragment, last_assigned_from_old,
                                     col_index, depth_limit,
                                     len(new_list))  # add the remaining new words

                self.removeUnwantedSpaces(new_fragments)
                self.fragments = new_fragments
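
To make the matching loop in Example #2 concrete, here is a small, self-contained trace with made-up word lists. It reuses the hypothetical `dtw` helper sketched after Example #1: exact matches (distance 0) anchor old words to positions in the new text, and `depth_limit` only moves forward, so a repeated word cannot be matched out of order.

old_list = ["the", "cat", "sat", "on", "the", "mat"]
new_list = ["the", "big", "cat", "sat", "on", "the", "mat"]
distance_matrix = dtw(new_list, old_list)  # hypothetical helper sketched above

depth_limit = 0
for col_index in range(len(distance_matrix[0])):                 # old words
    for row_index in range(depth_limit, len(distance_matrix)):   # new words
        if distance_matrix[row_index, col_index] == 0:
            print(f"old[{col_index}]={old_list[col_index]!r} matched new[{row_index}]")
            depth_limit = row_index + 1  # never look behind an earlier match again
            break
# The second "the" (old index 4) is matched to new index 5, not back to new index 0,
# because depth_limit has already advanced past the first match; the unmatched new
# word "big" is what alignAddedWords would merge into the surrounding fragments.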