# Example #1
# 0
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np
import pandas as pd
import Bio.Cluster as bc

# Cluster the "mcc" / "q_value" columns of a summary table with Bio.Cluster
# and save a scatter plot of all pairwise distances.

# Input CSV and output figure path.
f = "/data/Lei_student/Hussain/ML/dm6/peakerror/summary.csv"
o = "/data/Lei_student/Hussain/ML/dm6/peakerror/cluster_out.png"

df = pd.read_csv(f)
data = df[["mcc", "q_value"]]

# Convert once to a plain 2-D float array (one row per CSV record, one column
# per selected field) so the Bio.Cluster calls below do not depend on how the
# library coerces a DataFrame.
values = data.to_numpy(dtype=float)

# Pairwise distances between rows. Bio.Cluster returns the lower triangle as
# a list of 1-D arrays: row i holds the i distances to rows 0..i-1, so the
# rows have different lengths and the first one is empty.
matrix = bc.distancematrix(values)

# NOTE(review): the four results below are not used anywhere in the visible
# part of this script; they are kept in case later code reads them.
# With no cluster assignment given, these calls rely on Bio.Cluster's
# defaults for `clusterid` / `index1` / `index2` -- confirm this is intended.
cdata, cmask = bc.clustercentroids(values)
distance = bc.clusterdistance(values)
tree = bc.treecluster(values)

print(matrix)

# Flatten the ragged triangle into one vector of n*(n-1)/2 distances so it can
# be plotted; the x axis is simply the running index of each pair. Deriving
# the length from the data replaces the previous hard-coded 45000, which
# could not match the size of the distance matrix.
flat_distances = np.concatenate(matrix) if len(matrix) > 0 else np.empty(0)
pair_index = np.arange(flat_distances.size)

fig = plt.figure(figsize=(10, 8))
ax = fig.add_subplot(111)
ax.set_title("MCC distance matrix")
ax.scatter(pair_index, flat_distances)
fig.savefig(o)