class BedReader(object):
    """Out-of-core reader over a PLINK .bed file with an explicit ploidy axis.

    Presents the dataset as a 3D array of shape (n_variants, n_samples, 2),
    where the trailing axis encodes the two allele calls per genotype:
    allele counts 0/1/2 map to (0, 0), (1, 0), (1, 1) and missing calls
    map to (-1, -1).
    """

    def __init__(self, path, shape, dtype=np.int8, count_A1=True):
        """
        Parameters
        ----------
        path : path-like
            Path to the PLINK .bed file; passed to pysnptools as ``str(path)``.
        shape : tuple
            ``(n_variants, n_samples)`` of the dataset.
        dtype : numpy dtype, optional
            Integer dtype of the returned genotype calls (default ``np.int8``).
        count_A1 : bool, optional
            Forwarded to pysnptools ``Bed``; controls which allele is counted.
        """
        # Imported locally for consistency with the sibling 2D reader and so
        # pysnptools is only required when a reader is actually constructed.
        from pysnptools.snpreader import Bed

        # n variants (sid = SNP id), n samples (iid = Individual id)
        n_sid, n_iid = shape
        # Initialize Bed with empty arrays for axis data, otherwise it will
        # load the bim/map/fam files entirely into memory (it does not do
        # out-of-core for those)
        self.bed = Bed(
            str(path),
            count_A1=count_A1,
            # Array (n_sample, 2) w/ FID and IID
            iid=np.empty((n_iid, 2), dtype="str"),
            # SNP id array (n_variants)
            sid=np.empty((n_sid, ), dtype="str"),
            # Contig and positions array (n_variants, 3)
            pos=np.empty((n_sid, 3), dtype="int"),
        )
        self.shape = (n_sid, n_iid, 2)
        self.dtype = dtype
        self.ndim = 3

    def __getitem__(self, idx):
        """Read a (variant, sample, ploidy) selection as an integer array.

        ``idx`` must be a 3-tuple of slices; missing genotypes come back
        as -1 on both alleles.
        """
        if not isinstance(idx, tuple):
            raise IndexError(  # pragma: no cover
                f"Indexer must be tuple (received {type(idx)})")
        if len(idx) != self.ndim:
            # ndim is 3 for this reader, so the message must say "three-item"
            # (the previous text incorrectly said "two-item").
            raise IndexError(  # pragma: no cover
                f"Indexer must be three-item tuple (received {len(idx)} slices)")
        # Slice using reversal of first two slices --
        # pysnptools uses sample x variant orientation
        arr = self.bed[idx[1::-1]].read(dtype=np.float32, view_ok=False).val.T
        # Convert missing calls (NaN) to -1 before the integer cast
        arr = np.nan_to_num(arr, nan=-1.0)
        arr = arr.astype(self.dtype)
        # Add a ploidy dimension, so allele counts of 0, 1, 2 correspond
        # to 00, 10, 11 (missing stays (-1, -1))
        arr = np.stack(
            [
                np.where(arr < 0, -1, np.where(arr == 0, 0, 1)),
                np.where(arr < 0, -1, np.where(arr == 2, 1, 0)),
            ],
            axis=-1,
        )
        # Apply final slice to 3D result
        return arr[:, :, idx[-1]]

    def close(self):
        """Release the underlying .bed file handle.

        Not strictly crucial: a Bed instance with no in-memory bim/map/fam
        data is essentially just a file pointer, but leaving it open is
        still problematic if an array is created from the same PLINK
        dataset many times.
        """
        self.bed._close_bed()  # pragma: no cover
class BedReader(object):
    """Two-dimensional (variant x sample) out-of-core reader for PLINK .bed data.

    Returns allele counts as a masked integer array, with missing genotype
    calls masked rather than filled with a sentinel.
    """

    def __init__(self, path, shape, dtype=np.int8, count_A1=True):
        from pysnptools.snpreader import Bed
        # Unpack as (variant count, sample count); sid = SNP id,
        # iid = individual id in pysnptools terminology.
        n_variants, n_samples = shape
        # Supplying pre-built (empty) axis arrays stops Bed from eagerly
        # reading the bim/map/fam metadata files fully into memory -- it has
        # no out-of-core support for that metadata.
        self.bed = Bed(
            str(path),
            count_A1=count_A1,
            # (n_samples, 2) placeholder for FID/IID pairs
            iid=np.empty((n_samples, 2), dtype='str'),
            # (n_variants,) placeholder for SNP ids
            sid=np.empty((n_variants, ), dtype='str'),
            # (n_variants, 3) placeholder for contig and positions
            pos=np.empty((n_variants, 3), dtype='int'))
        self.shape = (n_variants, n_samples)
        self.dtype = dtype
        self.ndim = 2

    @staticmethod
    def _is_empty_slice(s):
        # A slice selects nothing when its endpoints coincide.
        return s.start == s.stop

    def __getitem__(self, idx):
        if not isinstance(idx, tuple):
            raise IndexError(f'Indexer must be tuple (received {type(idx)})')
        if len(idx) != self.ndim:
            raise IndexError(
                f'Indexer must be two-item tuple (received {len(idx)} slices)')
        # NOTE: dask probes with empty slices before reading any real chunks;
        # should pysnptools prove slow on those, short-circuit here via
        # _is_empty_slice and return an empty (0, 0) array of self.dtype.
        # pysnptools stores data sample-major, so flip the indexer for the
        # read and transpose back to (variant, sample) orientation.
        reversed_idx = idx[::-1]
        raw = self.bed[reversed_idx].read(dtype=np.float32, view_ok=False).val
        calls = np.ma.masked_invalid(raw.T)
        return calls.astype(self.dtype)

    def close(self):
        # Not strictly crucial: with no in-memory bim/map/fam data a Bed
        # instance is essentially just a file pointer. Still worthwhile when
        # many arrays are created from the same PLINK dataset.
        self.bed._close_bed()