import pandas as pd
import numpy as np
# Load the spreadsheet without treating any row as a header or any column as
# an index, then work on it as a plain 2-D NumPy array.
data = pd.read_excel(r'E:\dataset\clusterData\didi_1.xls', header=None, index_col=None)
data = np.array(data)
print(data.shape)

# The last column holds the value that is bucketed into a class label.
y = data[:, -1]
n = len(y)

# Compare on a float view so the masks are plain boolean arrays even when the
# sheet was loaded with object dtype.
values = y.astype(float)

# Bucket boundaries (right-inclusive):
#   value <= 5        -> -1
#   5  < value <= 12  ->  0
#   12 < value <= 20  ->  1
#   value > 20        ->  3
# Rows matching no bucket (NaN) keep the initial label 0.
# NOTE(review): the top bucket is labelled 3 rather than 2 -- kept as in the
# original; confirm whether the gap is intentional.
labels = np.zeros(n)
labels[values <= 5] = -1
labels[(values > 12) & (values <= 20)] = 1
labels[values > 20] = 3

# Turn the labels into an (n, 1) column and append it as the last column.
labels = labels.reshape(-1, 1)
Data = np.hstack((data, labels))
print(Data.shape)

# Write the augmented table as CSV with no header row and no index column.
Data = pd.DataFrame(Data)
Data.to_csv(r'E:\dataset\clusterData\didi_1.csv', header=False, index=False)