def test_rolling_similarity(self):
        """Should compute similarity between the sequence of vectors defined by the given columns, and given
        similarity function"""
        test_df = pd.DataFrame({"dx_dt": [1, 1, 1], "dy_dt": [1, 1, -1]})

        transform_result = streams.rolling_similarity(test_df, cosine_similarity, "dx_dt", "dy_dt")

        self.assertEqual(list(transform_result.columns.values), ["dx_dt", "dy_dt", "cosine_similarity_dx_dt_dy_dt"])
        self.assertTrue(np.isnan(transform_result.cosine_similarity_dx_dt_dy_dt[0]))
        self.assertAlmostEqual(transform_result.cosine_similarity_dx_dt_dy_dt[1], 1.0, 9)
        self.assertAlmostEqual(transform_result.cosine_similarity_dx_dt_dy_dt[2], 0, 9)
示例#2
0
    def __total_deviation(self, activity_id):
        stream_df = load_stream(self.database_driver, activity_id, 'latlng')

        if stream_df is not None:
            stream_df = lat_long_to_x_y(stream_df)
            stream_df = smooth(stream_df, smooth_colname='x')
            stream_df = smooth(stream_df, smooth_colname='y')
            stream_df = derivative(stream_df, derivative_colname='x_smooth')
            stream_df = derivative(stream_df, derivative_colname='y_smooth')
            stream_df = rolling_similarity(stream_df, cosine_similarity, 'dx_smooth_dt', 'dy_smooth_dt')

            try:
                return np.nansum([cosine_to_deviation(cos)
                                  for cos in stream_df.cosine_similarity_dx_smooth_dt_dy_smooth_dt])
            except ValueError:
                logging.warning('Failed to compute route deviation for activity %d, returning NaN' % activity_id)
                return np.nan
        else:
            logging.warning('No gps stream available for activity %d, returning NaN' % activity_id)
            return np.nan