def test_config_with_custom_name(self): layer = categorical_crossing.CategoryCrossing(depth=2, name='hashing') config = layer.get_config() layer_1 = categorical_crossing.CategoryCrossing.from_config(config) self.assertEqual(layer_1.name, layer.name) layer = categorical_crossing.CategoryCrossing(name='hashing') config = layer.get_config() layer_1 = categorical_crossing.CategoryCrossing.from_config(config) self.assertEqual(layer_1.name, layer.name)
def test_crossing_sparse_inputs_depth_tuple(self): layer = categorical_crossing.CategoryCrossing(depth=(2, 3)) inputs_0 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [2, 0]], values=['a', 'b', 'c'], dense_shape=[3, 1]) inputs_1 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [2, 0]], values=['d', 'e', 'f'], dense_shape=[3, 1]) inputs_2 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [2, 0]], values=['g', 'h', 'i'], dense_shape=[3, 1]) inp_0_t = input_layer.Input(shape=(1, ), sparse=True, dtype=dtypes.string) inp_1_t = input_layer.Input(shape=(1, ), sparse=True, dtype=dtypes.string) inp_2_t = input_layer.Input(shape=(1, ), sparse=True, dtype=dtypes.string) out_t = layer([inp_0_t, inp_1_t, inp_2_t]) model = training.Model([inp_0_t, inp_1_t, inp_2_t], out_t) output = model.predict([inputs_0, inputs_1, inputs_2]) self.assertIsInstance(output, sparse_tensor.SparseTensor) output = sparse_ops.sparse_tensor_to_dense(output) expected_outputs_0 = [[b'a_X_d', b'a_X_g', b'd_X_g', b'a_X_d_X_g']] expected_outputs_1 = [[b'b_X_e', b'b_X_h', b'e_X_h', b'b_X_e_X_h']] expected_outputs_2 = [[b'c_X_f', b'c_X_i', b'f_X_i', b'c_X_f_X_i']] expected_out = array_ops.concat( [expected_outputs_0, expected_outputs_1, expected_outputs_2], axis=0) self.assertAllEqual(expected_out, output)
def test_crossing_dense_inputs_depth_int(self): layer = categorical_crossing.CategoryCrossing(depth=1) inputs_0 = constant_op.constant([['a'], ['b'], ['c']]) inputs_1 = constant_op.constant([['d'], ['e'], ['f']]) output = layer([inputs_0, inputs_1]) expected_output = [[b'a', b'd'], [b'b', b'e'], [b'c', b'f']] self.assertAllEqual(expected_output, output) layer = categorical_crossing.CategoryCrossing(depth=2) inp_0_t = input_layer.Input(shape=(1,), dtype=dtypes.string) inp_1_t = input_layer.Input(shape=(1,), dtype=dtypes.string) out_t = layer([inp_0_t, inp_1_t]) model = training.Model([inp_0_t, inp_1_t], out_t) crossed_output = [[b'a_X_d'], [b'b_X_e'], [b'c_X_f']] expected_output = array_ops.concat([expected_output, crossed_output], axis=1) self.assertAllEqual(expected_output, model.predict([inputs_0, inputs_1]))
def test_crossing_ragged_inputs_depth_int(self): layer = categorical_crossing.CategoryCrossing(depth=1) inputs_0 = ragged_factory_ops.constant([['a'], ['b'], ['c']]) inputs_1 = ragged_factory_ops.constant([['d'], ['e'], ['f']]) output = layer([inputs_0, inputs_1]) expected_output = [[b'a', b'd'], [b'b', b'e'], [b'c', b'f']] self.assertIsInstance(output, ragged_tensor.RaggedTensor) self.assertAllEqual(expected_output, output) layer = categorical_crossing.CategoryCrossing(depth=2) inp_0_t = input_layer.Input(shape=(None,), ragged=True, dtype=dtypes.string) inp_1_t = input_layer.Input(shape=(None,), ragged=True, dtype=dtypes.string) out_t = layer([inp_0_t, inp_1_t]) model = training.Model([inp_0_t, inp_1_t], out_t) expected_output = [[b'a', b'd', b'a_X_d'], [b'b', b'e', b'b_X_e'], [b'c', b'f', b'c_X_f']] self.assertAllEqual(expected_output, model.predict([inputs_0, inputs_1]))
def test_crossing_compute_output_signature(self): input_shapes = [ tensor_shape.TensorShape([2, 2]), tensor_shape.TensorShape([2, 3]) ] input_specs = [ tensor_spec.TensorSpec(input_shape, dtypes.string) for input_shape in input_shapes ] layer = categorical_crossing.CategoryCrossing() output_spec = layer.compute_output_signature(input_specs) self.assertEqual(output_spec.shape.dims[0], input_shapes[0].dims[0]) self.assertEqual(output_spec.dtype, dtypes.string) layer = categorical_crossing.CategoryCrossing(num_bins=2) output_spec = layer.compute_output_signature(input_specs) self.assertEqual(output_spec.shape.dims[0], input_shapes[0].dims[0]) self.assertEqual(output_spec.dtype, dtypes.int64)
def test_invalid_mixed_sparse_and_ragged_input(self): with self.assertRaises(ValueError): layer = categorical_crossing.CategoryCrossing(num_bins=2) inputs_0 = ragged_factory_ops.constant( [['omar'], ['marlo']], dtype=dtypes.string) inputs_1 = sparse_tensor.SparseTensor( indices=[[0, 1], [1, 2]], values=['d', 'e'], dense_shape=[2, 3]) layer([inputs_0, inputs_1])
def test_crossing_hashed_basic(self): layer = categorical_crossing.CategoryCrossing(num_bins=1) inputs_0 = sparse_tensor.SparseTensor( indices=[[0, 0], [1, 0], [1, 1]], values=['a', 'b', 'c'], dense_shape=[2, 2]) inputs_1 = sparse_tensor.SparseTensor( indices=[[0, 1], [1, 2]], values=['d', 'e'], dense_shape=[2, 3]) output = layer([inputs_0, inputs_1]) self.assertAllClose(np.asarray([[0, 0], [1, 0], [1, 1]]), output.indices) self.assertAllClose([0, 0, 0], output.values)
def test_crossing_sparse_inputs(self): layer = categorical_crossing.CategoryCrossing() inputs_0 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [1, 1]], values=['a', 'b', 'c'], dense_shape=[2, 2]) inputs_1 = sparse_tensor.SparseTensor(indices=[[0, 1], [1, 2]], values=['d', 'e'], dense_shape=[2, 3]) output = layer([inputs_0, inputs_1]) self.assertAllClose(np.asarray([[0, 0], [1, 0], [1, 1]]), output.indices) self.assertAllEqual([b'a_X_d', b'b_X_e', b'c_X_e'], output.values)
def test_crossing_sparse_inputs_depth_int(self): layer = categorical_crossing.CategoryCrossing(depth=1) inputs_0 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [2, 0]], values=['a', 'b', 'c'], dense_shape=[3, 1]) inputs_1 = sparse_tensor.SparseTensor(indices=[[0, 0], [1, 0], [2, 0]], values=['d', 'e', 'f'], dense_shape=[3, 1]) output = layer([inputs_0, inputs_1]) self.assertIsInstance(output, sparse_tensor.SparseTensor) output = sparse_ops.sparse_tensor_to_dense(output) expected_out = [[b'a', b'd'], [b'b', b'e'], [b'c', b'f']] self.assertAllEqual(expected_out, output)
def test_crossing_hashed_ragged_inputs(self): layer = categorical_crossing.CategoryCrossing(num_bins=2) inputs_0 = ragged_factory_ops.constant( [['omar', 'skywalker'], ['marlo']], dtype=dtypes.string) inputs_1 = ragged_factory_ops.constant( [['a'], ['b']], dtype=dtypes.string) out_data = layer([inputs_0, inputs_1]) expected_output = [[0, 0], [0]] self.assertAllClose(expected_output, out_data) inp_0_t = input_layer.Input(shape=(None,), ragged=True, dtype=dtypes.string) inp_1_t = input_layer.Input(shape=(None,), ragged=True, dtype=dtypes.string) out_t = layer([inp_0_t, inp_1_t]) model = training.Model(inputs=[inp_0_t, inp_1_t], outputs=out_t) self.assertAllClose(expected_output, model.predict([inputs_0, inputs_1])) non_hashed_layer = categorical_crossing.CategoryCrossing() out_t = non_hashed_layer([inp_0_t, inp_1_t]) model = training.Model(inputs=[inp_0_t, inp_1_t], outputs=out_t) expected_output = [[b'omar_X_a', b'skywalker_X_a'], [b'marlo_X_b']] self.assertAllEqual(expected_output, model.predict([inputs_0, inputs_1]))
def test_crossing_dense_inputs_depth_tuple(self): layer = categorical_crossing.CategoryCrossing(depth=[2, 3]) inputs_0 = constant_op.constant([['a'], ['b'], ['c']]) inputs_1 = constant_op.constant([['d'], ['e'], ['f']]) inputs_2 = constant_op.constant([['g'], ['h'], ['i']]) inp_0_t = input_layer.Input(shape=(1,), dtype=dtypes.string) inp_1_t = input_layer.Input(shape=(1,), dtype=dtypes.string) inp_2_t = input_layer.Input(shape=(1,), dtype=dtypes.string) out_t = layer([inp_0_t, inp_1_t, inp_2_t]) model = training.Model([inp_0_t, inp_1_t, inp_2_t], out_t) expected_outputs_0 = [[b'a_X_d', b'a_X_g', b'd_X_g', b'a_X_d_X_g']] expected_outputs_1 = [[b'b_X_e', b'b_X_h', b'e_X_h', b'b_X_e_X_h']] expected_outputs_2 = [[b'c_X_f', b'c_X_i', b'f_X_i', b'c_X_f_X_i']] expected_output = array_ops.concat( [expected_outputs_0, expected_outputs_1, expected_outputs_2], axis=0) self.assertAllEqual(expected_output, model.predict([inputs_0, inputs_1, inputs_2]))
def test_distribution(self, distribution): input_array_1 = np.array([['a', 'b'], ['c', 'd']]) input_array_2 = np.array([['e', 'f'], ['g', 'h']]) # pyformat: disable expected_output = [[b'a_X_e', b'a_X_f', b'b_X_e', b'b_X_f'], [b'c_X_g', b'c_X_h', b'd_X_g', b'd_X_h']] config.set_soft_device_placement(True) with distribution.scope(): input_data_1 = keras.Input(shape=(2, ), dtype=dtypes.string) input_data_2 = keras.Input(shape=(2, ), dtype=dtypes.string) input_data = [input_data_1, input_data_2] layer = categorical_crossing.CategoryCrossing() int_data = layer(input_data) model = keras.Model(inputs=input_data, outputs=int_data) output_dataset = model.predict([input_array_1, input_array_2]) self.assertAllEqual(expected_output, output_dataset)
def bm_layer_implementation(self, batch_size): input_1 = keras.Input(shape=(1, ), dtype=dtypes.int64, name="word") input_2 = keras.Input(shape=(1, ), dtype=dtypes.int64, name="int") layer = categorical_crossing.CategoryCrossing() _ = layer([input_1, input_2]) num_repeats = 5 starts = [] ends = [] for _ in range(num_repeats): ds = dataset_ops.Dataset.from_generator( int_gen, (dtypes.int64, dtypes.int64), (tensor_shape.TensorShape([1]), tensor_shape.TensorShape([1]))) ds = ds.shuffle(batch_size * 100) ds = ds.batch(batch_size) num_batches = 5 ds = ds.take(num_batches) ds = ds.prefetch(num_batches) starts.append(time.time()) # Benchmarked code begins here. for i in ds: _ = layer([i[0], i[1]]) # Benchmarked code ends here. ends.append(time.time()) avg_time = np.mean(np.array(ends) - np.array(starts)) / num_batches name = "categorical_crossing|batch_%s" % batch_size baseline = self.run_dataset_implementation(batch_size) extras = { "dataset implementation baseline": baseline, "delta seconds": (baseline - avg_time), "delta percent": ((baseline - avg_time) / baseline) * 100 } self.report_benchmark(iters=num_repeats, wall_time=avg_time, extras=extras, name=name)
def test_crossing_with_dense_inputs(self): layer = categorical_crossing.CategoryCrossing() inputs_0 = np.asarray([[1, 2]]) inputs_1 = np.asarray([[1, 3]]) output = layer([inputs_0, inputs_1]) self.assertAllEqual([[b'1_X_1', b'1_X_3', b'2_X_1', b'2_X_3']], output)
def test_crossing_hashed_with_dense_inputs(self): layer = categorical_crossing.CategoryCrossing(num_bins=2) inputs_0 = np.asarray([[1, 2]]) inputs_1 = np.asarray([[1, 3]]) output = layer([inputs_0, inputs_1]) self.assertAllClose([[1, 1, 0, 0]], output)