Exemplo n.º 1
0
    def __init__(self, prefix, pretrained_text=False):
        """Set up tokenizer state, the raw-text lookup and feature paths.

        Args:
            prefix: Name selecting which data files to use. It is
                interpolated into ``kinetics_{prefix}.pickle`` and passed
                on to ``get_npy_paths``.
            pretrained_text: Stored on the instance and forwarded unchanged
                to ``get_npy_paths``.

        Relies on ``sp_vocab_size``, ``sp_model_path`` and ``raw_text_dir``
        being defined outside this method (they are not visible here).
        """
        self.prefix = prefix
        self.pretrained_text = pretrained_text
        self.context_length = 128
        self.num_classes = 700
        self.vocab_size = sp_vocab_size
        self.sp_model_path = sp_model_path
        self.sp_model = load_sp_model(sp_model_path)
        self.sp_id_generator = sentencepiece_numericalizer(self.sp_model)
        # Numericalize the two marker strings once and keep the results.
        self.start_token, self.end_token = self.sp_id_generator(
            ["<|startoftext|>", "<|endoftext|>"])

        # Open the pickle inside a context manager so the file handle is
        # closed as soon as loading finishes (or fails).
        # NOTE: unpickling can execute arbitrary code; only load trusted files.
        with open(f"{raw_text_dir}/kinetics_{prefix}.pickle", "rb") as text_file:
            self.text_dict = pickle.load(text_file)

        # Fetch paths to audio, video, text features for samples
        self.a_paths, self.v_paths, self.t_paths = get_npy_paths(
            prefix, pretrained_text=pretrained_text)
        print(len(self.t_paths))

        self.tags = []
Exemplo n.º 2
0
    def __init__(self, prefix):
        """Store the prefix and collect the video paths that belong to it.

        Args:
            prefix: Name passed on to ``get_npy_paths`` to select the data.
        """
        self.prefix = prefix
        self.num_classes = 700

        # get_npy_paths yields three items; only the middle one is kept.
        _unused_first, video_paths, _unused_last = get_npy_paths(
            prefix, pretrained_text=False)
        self.v_paths = video_paths

        print(len(self.v_paths))
Exemplo n.º 3
0
    def __init__(self,
                 prefix,
                 num_classes=700,
                 zero_shot=False,
                 pretrained_text=False):
        """Set up tokenizer state, raw text, feature paths and labels.

        Args:
            prefix: Name selecting which data files to use. It is
                interpolated into ``kinetics_{prefix}.pickle`` and
                ``{prefix}.pickle`` and passed on to ``get_npy_paths``.
            num_classes: Stored on the instance as ``num_classes``.
            zero_shot: Stored on the instance as ``zero_shot``.
            pretrained_text: Stored on the instance and forwarded unchanged
                to ``get_npy_paths``.

        Relies on ``sp_model_path``, ``raw_text_dir`` and ``pickle_root_dir``
        being defined outside this method (they are not visible here).
        """
        self.prefix = prefix
        self.num_classes = num_classes
        self.zero_shot = zero_shot
        self.pretrained_text = pretrained_text

        self.context_length = 128
        self.vocab_size = 20000
        self.sp_model_path = sp_model_path
        self.sp_model = load_sp_model(sp_model_path)
        self.sp_id_generator = sentencepiece_numericalizer(self.sp_model)
        # Numericalize the two marker strings once and keep the results.
        self.start_token, self.end_token = self.sp_id_generator(
            ["<|startoftext|>", "<|endoftext|>"])

        # Context managers guarantee both pickle files are closed once read.
        # NOTE: unpickling can execute arbitrary code; only load trusted files.
        with open(f"{raw_text_dir}/kinetics_{prefix}.pickle", "rb") as text_file:
            self.text_dict = pickle.load(text_file)

        # Fetch paths to audio, video, text features for samples
        self.a_paths, self.v_paths, self.t_paths = get_npy_paths(
            prefix, pretrained_text=pretrained_text)

        with open(f"{pickle_root_dir}/{prefix}.pickle", "rb") as labels_file:
            self.labels = pickle.load(labels_file)
Exemplo n.º 4
0
    def __init__(
        self,
        prefix,
        num_classes=700,
    ):
        """Store configuration, collect video paths and load the labels.

        Args:
            prefix: Name selecting which data files to use. It is passed to
                ``get_npy_paths`` and interpolated into ``{prefix}.pickle``.
                ``self.eval`` is set to True exactly when it equals "val".
            num_classes: Stored on the instance as ``num_classes``.

        Relies on ``pickle_root_dir`` being defined outside this method
        (it is not visible here).
        """
        self.prefix = prefix
        self.eval = prefix == "val"
        self.num_classes = num_classes

        # get_npy_paths yields three items; only the middle one is kept.
        _, self.v_paths, _ = get_npy_paths(prefix, pretrained_text=False)
        print(self.v_paths[0])

        # A context manager guarantees the pickle file is closed once read.
        # NOTE: unpickling can execute arbitrary code; only load trusted files.
        with open(f"{pickle_root_dir}/{prefix}.pickle", "rb") as labels_file:
            self.labels = pickle.load(labels_file)