13 lines
386 B
Python
13 lines
386 B
Python
import pandas as pd
|
|
import numpy as np
|
|
from sklearn.datasets import dump_svmlight_file
|
|
|
|
df1 = pd.read_csv("./dataset/input_label.csv")
|
|
df2 = pd.read_csv("./dataset/input.csv")
|
|
res = pd.merge(df1, df2, how='left', left_on='id', right_on='id')
|
|
|
|
X = res[np.setdiff1d(res.columns,['label','id'])]
|
|
y = res.label
|
|
|
|
dump_svmlight_file(X,y,'/host/smvlight.dat',zero_based=True,multilabel=False)
|