Python get_data примеры, camparitraj.get_data Python примеры использования

Пример #1

0

Показать файл

def test_get_interchain_distance_failing_atom():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    mode = 'atom'
    atoms1 = ['X', 'CA']
    atoms2 = atoms1[::-1]
    for protein_group in itertools.combinations(range(len(protein_groups)),
                                                r=2):
        protein_a, protein_b = protein_group

        # There appears to be an issue where R1 > R2 - the calculation crashes for sidechain-heavy.
        # See `test_get_interchain_distance`
        R1 = 0  #random.choice(range(len(protein_groups[protein_a])))
        R2 = 1  #random.choice(range(len(protein_groups[protein_b])))

        for A1, A2 in zip(atoms1, atoms2):
            with pytest.raises(CTException):
                trajectory.get_interchain_distance(protein_a, protein_b, R1,
                                                   R2, A1, A2, mode)

Пример #2

0

Показать файл

def test_read_in_compare_trajectories(GS6_CO):
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.xtc')
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename)

    assert np.allclose(trajectory.traj.xyz, GS6_CO.traj.xyz)

Пример #3

0

Показать файл

def test_intrachain_inter_residue_atomic_distance():

    # A custom version of NTL9 is needed, since we want to have multiple protein chains
    protein_groups_residues = [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9],
                               [10, 11, 12, 13, 14, 15, 16, 17, 18, 19],
                               [20, 21, 22, 23, 24, 25, 26, 27, 28, 29],
                               [30, 31, 32, 33, 34, 35, 36, 37, 38, 39],
                               [40, 41, 42, 43, 44, 45, 46, 47, 48, 49]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(
        trajectory_filename=traj_filename,
        pdb_filename=pdb_filename,
        protein_grouping=protein_groups_residues)

    for protein_group in itertools.combinations(range(
            len(protein_groups_residues)),
                                                r=2):
        protein_a, protein_b = protein_group
        a_residues = protein_groups_residues[protein_a]
        b_residues = protein_groups_residues[protein_b]

        residue_a = random.randint(0, len(a_residues) - 1)
        residue_b = random.randint(0, len(b_residues) - 1)

        distances = trajectory.get_interchain_distance(protein_a, protein_b,
                                                       residue_a, residue_b)
        assert len(distances) == len(a_residues)

Пример #4

0

Показать файл

def test_read_in_trajectory_pdblead(GS6_CO):
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.xtc')
    traj = cttrajectory.CTTrajectory(pdb_filename=pdb_filename,
                                     trajectory_filename=traj_filename,
                                     pdblead=True)

    # Since we're using the PDB as an initial frame, the number of frames should have increased by 1.
    assert len(traj) == len(GS6_CO) + 1

Пример #5

0

Показать файл

def test_read_in_protein_grouping_simple():
    protein_groups = [[0]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.xtc')
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    # verify that we have loaded the number of proteins expected
    assert trajectory.num_proteins == len(protein_groups)

Пример #6

0

Показать файл

def test_read_in_protein_grouping_multiple():
    protein_groups = [[0, 1, 2], [3, 4, 5], [6, 7, 8]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    # verify that we have loaded the number of proteins expected
    assert trajectory.num_proteins == len(protein_groups)

Пример #7

0

Показать файл

def test_read_in_protein_grouping_multiple_mixed_order():
    # TODO: This test passes - it shouldn't. Look into this further.
    protein_groups = [[1, 2, 0], [10, 3, 7], [11, 1, 3]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    # verify that we have loaded the number of proteins expected
    assert trajectory.num_proteins == len(protein_groups)

Пример #8

0

Показать файл

def test_read_in_protein_grouping_invalid_residues():
    protein_groups = [[1000, 1001, 1002], [1003, 1004, 1005],
                      [1006, 1007, 1008]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    # Since this is a failing but non-disruptive test (i.e. no Exceptions), we
    # check the number of proteins which should be 0.
    assert trajectory.num_proteins == 0

Пример #9

0

Показать файл

def test_export_intra_chain_distance_map_protein_groups_with_residue_indices():
    # Note that the residues for the resID1 and resID2 indices are with respect to the residues of the protein chain
    # and not the full protein itself.
    protein_groups_residues = [[0, 1, 2, 3, 4, 5, 6, 7, 8, 9],
                               [10, 11, 12, 13, 14, 15, 16, 17, 18, 19],
                               [20, 21, 22, 23, 24, 25, 26, 27, 28, 29],
                               [30, 31, 32, 33, 34, 35, 36, 37, 38, 39],
                               [40, 41, 42, 43, 44, 45, 46, 47, 48, 49]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(
        trajectory_filename=traj_filename,
        pdb_filename=pdb_filename,
        protein_grouping=protein_groups_residues)

    # select pairwise protein ids (no repetitions).
    for protein_index, protein_group in enumerate(
            itertools.combinations(range(len(protein_groups_residues)), r=2)):
        protein_a, protein_b = protein_group

        # now, let's randomly choose a set of residues to select for `protein_a` and `protein_b`
        num_residues_a = random.randint(
            1, len(protein_groups_residues[protein_a]))
        num_residues_b = random.randint(
            1, len(protein_groups_residues[protein_b]))

        protein_a_residues = protein_groups_residues[protein_a]
        a_residues = list(
            sorted(random.sample(protein_a_residues, num_residues_a)))
        a_residues = [(r - protein_a_residues[0]) for r in a_residues
                      ]  # offset by the starting residue number

        protein_b_residues = protein_groups_residues[protein_b]
        b_residues = list(
            sorted(random.sample(protein_b_residues, num_residues_b)))
        b_residues = [(r - protein_b_residues[0]) for r in b_residues
                      ]  # offset by the starting residue number

        distance_map, stddev_map = trajectory.get_interchain_distance_map(
            protein_a, protein_b)
        assert distance_map.shape == stddev_map.shape

        temp_save_filepath = os.path.join(
            TMP_DIR, 'gs6_map_{index}_{protein}'.format(index=protein_index,
                                                        protein=protein_index))
        temp_filename = '{filename}.csv'.format(filename=temp_save_filepath)

Пример #10

0

Показать файл

def test_get_intra_chain_distance_map_protein_groups():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    for protein_group in itertools.combinations(range(len(protein_groups)),
                                                r=2):
        protein_a, protein_b = protein_group
        distance_map, stddev_map = trajectory.get_interchain_distance_map(
            protein_a, protein_b)
        assert distance_map.shape == stddev_map.shape
        assert np.count_nonzero(distance_map) == len(
            distance_map.flatten())  # since the residue indices are unique

Пример #11

0

Показать файл

Файл: test_numbering.py Проект: jaredl7/camparitraj

def test_cap_DSSP():
    """
    Tests DSSP (and hence R1/R2 selection) works
    """

    test_data_dir = camparitraj.get_data('test_data')
    pdb_files = ['ACE_NME_multichain', 'ACE_NME_start_at_5']
    for cap_name in pdb_files:
        cap_path = os.path.join(test_data_dir, 'cap_tests', '{}.pdb'.format(cap_name))
        cap_trajectory = cttrajectory.CTTrajectory(cap_path, cap_path)

Пример #12

0

Показать файл

def test_get_interchain_distance_invalid_protein_ids():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    R1 = 0
    R2 = 1
    A1 = 'CA'
    A2 = 'CA'
    modes = 'atom,ca,closest,closest-heavy,sidechain,sidechain-heavy'.split(
        ',')

    protein_a = 100
    protein_b = 101
    for mode in modes:
        with pytest.raises(CTException):
            trajectory.get_interchain_distance(protein_a, protein_b, R1, R2,
                                               A1, A2, mode)

Пример #13

0

Показать файл

def test_get_interchain_distance_invalid_mode():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    mode = 'unknown'
    for protein_group in itertools.combinations(range(len(protein_groups)),
                                                r=2):
        protein_a, protein_b = protein_group

        # There appears to be an issue where R1 > R2 - the calculation crashes for sidechain-heavy.
        R1 = 0  #random.choice(range(len(protein_groups[protein_a])))
        R2 = 1  #random.choice(range(len(protein_groups[protein_b])))
        A1 = 'CA'
        A2 = 'CA'

        with pytest.raises(CTException):
            trajectory.get_interchain_distance(protein_a, protein_b, R1, R2,
                                               A1, A2, mode)

Пример #14

0

Показать файл

def test_get_interchain_distance():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    for protein_group in itertools.combinations(range(len(protein_groups)),
                                                r=2):
        protein_a, protein_b = protein_group

        # There appears to be an issue where R1 > R2 - the calculation crashes for sidechain-heavy.
        R1 = 0  #random.choice(range(len(protein_groups[protein_a])))
        R2 = 1  #random.choice(range(len(protein_groups[protein_b])))
        A1 = 'CA'
        A2 = 'CA'
        modes = 'atom,ca,closest,closest-heavy,sidechain,sidechain-heavy'.split(
            ',')
        for mode in modes:
            distances = trajectory.get_interchain_distance(
                protein_a, protein_b, R1, R2, A1, A2, mode)
            assert len(distances) > 0

Пример #15

0

Показать файл

def test_get_interchain_distance_failing_residues():
    protein_groups = [[0, 1, 2, 3, 4], [5, 6, 7, 8, 9], [10, 11, 12, 13, 14]]
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'ntl9.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'),
                                 'ntl9.xtc')  # ntl9 has 56 residues
    trajectory = cttrajectory.CTTrajectory(trajectory_filename=traj_filename,
                                           pdb_filename=pdb_filename,
                                           protein_grouping=protein_groups)

    residues1 = [0, 100]
    residues2 = residues1[::-1]
    A1 = 'CA'
    A2 = 'CA'
    modes = 'atom,ca,closest,closest-heavy,sidechain,sidechain-heavy'.split(
        ',')

    for protein_group in itertools.combinations(range(len(protein_groups)),
                                                r=2):
        protein_a, protein_b = protein_group
        for mode in modes:
            for R1, R2 in zip(residues1, residues2):
                with pytest.raises(CTException):
                    trajectory.get_interchain_distance(protein_a, protein_b,
                                                       R1, R2, A1, A2, mode)

Пример #16

0

Показать файл

def test_phi_psi_bbseg(NTL9_CP):
    """
    Test that ensures our representation of the BBSEG2 matrix
    reproduces the version from CAMPARI

    """

    # read in BBSEG file
    bbseg_file = camparitraj.get_data('bbseg2.dat')
    with open(bbseg_file, 'r') as fh:
        content = fh.readlines()

    idx = 0
    for psi in range(179, -180, -10):

        local = ''
        for phi in range(-179, 180, 10):
            local = local + '%i ' % (NTL9_CP._CTProtein__phi_psi_bbseg(
                [phi], [psi])[0])

        assert (content[idx].strip() == local.strip())
        idx = idx + 1

Пример #17

0

Показать файл

Файл: test_caps.py Проект: jaredl7/camparitraj

import camparitraj
from camparitraj import cttrajectory
import pytest
import sys

test_data_dir = camparitraj.get_data('test_data')

CAPNAMES = [
    'ACE_NH2', 'ACE_NME', 'ACE_UCAP', 'FOR_NH2', 'FOR_NME', 'FOR_UCAP',
    'UCAP_NH2', 'UCAP_NME', 'UCAP_UCAP', 'ACE_NME_start_at_5',
    'ACE_NME_multichain'
]

#CAPNAMES = ['ACE_NME_multichain']

CCAP = [
    'ACE_NH2', 'ACE_NME', 'FOR_NH2', 'FOR_NME', 'UCAP_NH2', 'UCAP_NME',
    'ACE_NME_start_at_5', 'ACE_NME_multichain'
]
NCAP = [
    'ACE_NH2', 'ACE_NME', 'ACE_UCAP', 'FOR_NH2', 'FOR_NME', 'FOR_UCAP',
    'ACE_NME_start_at_5', 'ACE_NME_multichain'
]


def test_cap_DSSP():
    """
    Tests DSSP (and hence R1/R2 selection) works
    """

    for CN in CAPNAMES:

Пример #18

0

Показать файл

def test_read_in_no_trajectory():
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.pdb')
    with pytest.raises(CTException):
        cttrajectory.CTTrajectory(pdb_filename=pdb_filename)

Пример #19

0

Показать файл

def test_trajectory_initialization_debug():
    pdb_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.pdb')
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.xtc')
    cttrajectory.CTTrajectory(pdb_filename=pdb_filename,
                              trajectory_filename=traj_filename,
                              debug=True)

Пример #20

0

Показать файл

def test_read_in_no_topology_dcd():
    """The `CTTrajectory.__init__` references that `.dcd` files are supported too."""
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.dcd')
    with pytest.raises(CTException):
        cttrajectory.CTTrajectory(trajectory_filename=traj_filename)

Пример #21

0

Показать файл

def test_read_in_no_topology_xtc():
    traj_filename = os.path.join(camparitraj.get_data('test_data'), 'gs6.xtc')
    with pytest.raises(CTException):
        cttrajectory.CTTrajectory(trajectory_filename=traj_filename)

Python get_data примеры использования