-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy path37_2.py
90 lines (80 loc) · 3.24 KB
/
37_2.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
import torch
import numpy as np
import operator
from torch.utils.data import dataloader
import torchvision.datasets as dsets
import torchvision.transforms as transforms
import matplotlib.pyplot as plt
batch_size=100
def KNN_classify(k,dis,X_train,x_train,Y_test):
assert dis=='E' or dis=='M'
num_test = Y_test.shape[0]
labellist=[]
if (dis=='E'):
for i in range(num_test):
distances=np.sqrt(np.sum(((X_train-np.tile(Y_test[i],(X_train.shape[0],1)))**2),axis=1))
print(distances)
nearest_k=np.argsort(distances)
topK=nearest_k[:k]
classCount={}
print(x_train[i])
for i in topK:
print(x_train[i])
classCount[x_train[i]]=classCount.get(x_train[i],0)+1
print(classCount)
sortedClassCount=sorted(classCount.items(),key=operator.itemgetter(1),reverse=True)
print(sortedClassCount)
labellist.append(sortedClassCount[0][0])
return np.array(labellist)
elif (dis=='M'):
for i in range(num_test):
distances=np.sqrt(np.sum((np.fabs(X_train-np.tile(Y_test[i],(X_train.shape[0],1)))),axis=1))
print(distances)
nearest_k=np.argsort(distances)
topK=nearest_k[:k]
classCount={}
print(x_train[i])
for i in topK:
print(x_train[i])
classCount[x_train[i]]=classCount.get(x_train[i],0)+1
print(classCount)
sortedClassCount=sorted(classCount.items(),key=operator.itemgetter(1),reverse=True)
print(sortedClassCount)
labellist.append(sortedClassCount[0][0])
return np.array(labellist)
def getXmean(x_train):
x_train=np.reshape(x_train,(x_train.shape[0],-1))
mean_image=np.mean(x_train,axis=0)
return mean_image
def centralized(x_test,mean_image):
x_test = np.reshape(x_test,(x_test.shape[0],-1))
x_test = x_test.astype(np.float)
x_test -= mean_image
return x_test
train_dataset=dsets.MNIST(root='m1/pymnist',train=True,transform=None,download=True)
test_dataset=dsets.MNIST(root='m1/pymnist',train=False,transform=None,download=True)
#加载数据
train_loader=torch.utils.data.DataLoader(dataset=train_dataset,batch_size=batch_size,shuffle=True)
test_loader=torch.utils.data.DataLoader(dataset=test_dataset,batch_size=batch_size,shuffle=True)
print("train_data:",train_dataset.data.size())
print("train_labels:",train_dataset.targets.size())
print("test_dataset:",test_dataset.data.size())
print("test_labels:",test_dataset.targets.size())
'''digit=train_loader.dataset.train_data[0]
plt.imshow(digit,cmap=plt.cm.binary)
plt.show()
print(train_loader.dataset.targets[0])'''
x_train = train_loader.dataset.data.numpy()
x_train = x_train.reshape(x_train.shape[0],28*28)
y_train=train_loader.dataset.targets.numpy()
X_test=test_loader.dataset.data[:1000].numpy()
X_test=X_test.reshape(X_test.shape[0],28*28)
y_test=test_loader.dataset.targets[:1000].numpy()
num_test=y_test.shape[0]
mean_image=getXmean(x_train)
cdata=centralized(test_loader.dataset.data.numpy(),mean_image)
cdata=cdata.reshape(cdata.shape[0],28,28)
print("---------------")
plt.imshow(cdata[0],cmap=plt.cm.binary)
plt.show()
print(cdata.dataset.targets[0])