import datetime
import pickle

from sklearn.datasets.base import Bunch

# Load the training corpus
data_set = {}
# Path to the pickled training corpus
train_path = 'text_corpus1_wordbag/train_set.data'
file_obj = open(train_path, 'rb')

# Read back the persisted object
data_set = pickle.load(file_obj)
file_obj.close()

# Define the bag-of-words data structure
wordbag = Bunch(target_name=[], label=[], filenames=[], tdm=[], vocabulary={})
wordbag.target_name = data_set.target_name
wordbag.label = data_set.label
wordbag.filenames = data_set.filenames

# Build the corpus
corpus = data_set.contents

# Load the stop-word list from file
stpwrdpath = 'extra_dict/hlt_stop_words.txt'
stpwrd_dic = open(stpwrdpath, 'r', encoding='utf-8')  # assumes the stop-word file is UTF-8 encoded
stpwrd_content = stpwrd_dic.read()

# Convert the stop words to a list
stpwrdlst = stpwrd_content.splitlines()
stpwrd_dic.close()

# Time the bag-of-words construction: record the start time
start = datetime.datetime.now()
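
# A minimal sketch of the vectorization step this setup leads up to: fill
# wordbag.tdm and wordbag.vocabulary with a TF-IDF weighted term-document
# matrix, report the elapsed time, and persist the result. The TfidfVectorizer
# parameters and the output path 'text_corpus1_wordbag/tfidf_set.data' are
# assumptions, not taken from the original code.
from sklearn.feature_extraction.text import TfidfVectorizer

vectorizer = TfidfVectorizer(stop_words=stpwrdlst, sublinear_tf=True, max_df=0.5)
wordbag.tdm = vectorizer.fit_transform(corpus)  # sparse term-document matrix
wordbag.vocabulary = vectorizer.vocabulary_     # term -> column index mapping

# Elapsed time since `start`
print('wordbag built in', datetime.datetime.now() - start)

# Persist the bag-of-words object (hypothetical output path)
with open('text_corpus1_wordbag/tfidf_set.data', 'wb') as out_obj:
    pickle.dump(wordbag, out_obj)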
                            bunch.lable.append(list[0])
                elif children.tag == 'contenttitle':
                    contenttitle = children.text
                elif children.tag == 'content':
                    content = str(contenttitle)+' '+str(children.text)
                    if (len(content) > 0):
                        seg = jieba.cut(content, cut_all=False)
                        bunch.contents.append(' '.join(seg))
                    else:
                        bunch.contents.append('null')
        print('finish train file:', filePath)
fileutils.saveBatchObj(trainRawPath, bunch)
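
# fileutils.saveBatchObj is a project-local helper that is not shown in this
# snippet. A plausible pickle-based stand-in, given purely as an assumption
# about what it does (serialize the Bunch to disk):
import pickle

def save_batch_obj(path, obj):
    # illustrative stand-in for fileutils.saveBatchObj
    with open(path, 'wb') as f:
        pickle.dump(obj, f)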

# parse all the test data and save it into the bunch
bunch.lable = []
bunch.filenames = []
bunch.contents = []
contenttitle = ''
for file in os.listdir(testDataPath):
    filePath = testDataPath + os.sep + file
    if os.path.isdir(filePath):
        print(file, 'is a directory, skipping')
        continue
    with open(filePath, 'r') as file:
        text = file.read()
        text = re.sub(u"[\x00-\x08\x0b-\x0c\x0e-\x1f|&]+", u"", text)
        root = ET.fromstring(text)
        for child in root:
            # second-level node: tag name and attributes; walk the third level of the XML document
            for children in child:
                # third-level node: tag name and attributes
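                # A hedged sketch of the rest of this branch, mirroring the
                # train-data branch above; the 'url' handling and testRawPath
                # are assumptions, not taken from the original code.
                if children.tag == 'url':
                    # assumed: extract the class label from the URL, as the
                    # train loop does with bunch.lable.append(...)
                    pass
                elif children.tag == 'contenttitle':
                    contenttitle = children.text
                elif children.tag == 'content':
                    content = str(contenttitle) + ' ' + str(children.text)
                    if len(content) > 0:
                        seg = jieba.cut(content, cut_all=False)
                        bunch.contents.append(' '.join(seg))
                    else:
                        bunch.contents.append('null')
        print('finish test file:', filePath)
fileutils.saveBatchObj(testRawPath, bunch)  # testRawPath: assumed counterpart of trainRawPath
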
import gzip
import pickle

import numpy as np
from skimage import io
from sklearn.datasets.base import Bunch

from dip.load_data import load_image_files, load_mask_images
from dip.mask import bounding_rect_of_mask


datasets = load_mask_images()

data = []
for f, mask in zip(
        datasets.filenames,
        load_image_files(datasets.filenames),
        ):
    # rect: (min_x, min_y, max_x, max_y)
    rect = bounding_rect_of_mask(mask, negative=True)
    data.append(list(rect))
    print('{0}: {1}'.format(f, rect))
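
# bounding_rect_of_mask comes from the project-local dip.mask module and its
# implementation is not shown here. Purely as an illustration of the idea (an
# assumption, not the project's code): the bounding rectangle of a 2D mask can
# be read off the row/column indices of its foreground pixels.
def bounding_rect_sketch(mask_array):
    # returns (min_x, min_y, max_x, max_y) of the nonzero pixels
    ys, xs = np.nonzero(mask_array)
    return int(xs.min()), int(ys.min()), int(xs.max()), int(ys.max())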

bunch = Bunch(name='mask rects')
bunch.data = np.array(data)
bunch.filenames = datasets.filenames
bunch.target = datasets.target
bunch.target_names = datasets.target_names
bunch.description = 'mask rects: (min_x, min_y, max_x, max_y)'

with gzip.open('rects.pkl.gz', 'wb') as f:
    pickle.dump(bunch, f)
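
# A minimal sketch of reading the persisted Bunch back for later use, assuming
# the same 'rects.pkl.gz' path written above.
with gzip.open('rects.pkl.gz', 'rb') as f:
    rects = pickle.load(f)
print(rects.description)
print(rects.data.shape, len(rects.filenames))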