Created
May 28, 2017 18:02
-
-
Save anonymous/d27e448edbea145dbe4db3362bbf75f2 to your computer and use it in GitHub Desktop.
Revisions
-
There are no files selected for viewing
# NOTE: the hosting page flagged this file as containing hidden or
# bidirectional Unicode text that may be interpreted differently than it
# appears; open it in an editor that reveals such characters when reviewing.
import numpy as np
import pandas as pd
from sklearn.decomposition import PCA
from sklearn.cluster import KMeans
import matplotlib.pyplot as plt
import seaborn as sb

# Silence NumPy's divide-by-zero and invalid-operation floating-point warnings.
np.seterr(divide='ignore', invalid='ignore')

# Quick way to test just a few column features
# stocks = pd.read_csv('supercolumns-elements-nasdaq-nyse-otcbb-general-UPDATE-2017-03-01.csv', usecols=range(1,16))
stocks = pd.read_csv('supercolumns-elements-nasdaq-nyse-otcbb-general-UPDATE-2017-03-01.csv')
print(stocks.head())

# Collect the names of the non-numeric (text) columns.
# The column dtype is inspected instead of sampling a single cell, so a text
# column whose second row happens to be missing is still recognised, and a
# frame with fewer than two rows no longer raises.
# DataFrame.items() replaces iteritems(), which was removed in pandas 2.0.
str_list = [
    colname
    for colname, colvalue in stocks.items()
    if not pd.api.types.is_numeric_dtype(colvalue)
]

# Get to the numeric columns by inversion
# (Index.difference returns the remaining labels sorted when possible, so
# the column order of stocks_num may differ from the order in the CSV.)
num_list = stocks.columns.difference(str_list)
stocks_num = stocks[num_list]
print(stocks_num.head())