%%capture
# Notebook setup cell. `%%capture` has to remain the first line of the cell;
# it suppresses the output this cell would otherwise display.
# Render inline matplotlib figures as SVG.
%config InlineBackend.figure_format = 'svg'
%matplotlib inline
import scipy as sc, pandas as pd, seaborn as sns
import gpflow as gp
import numpy as np
import matplotlib.pyplot as plt
# Apply seaborn's default theme to the figures created below.
sns.set()
The following visualizations and tables are based on the data gathered in the March survey here. The raw data can be accessed here in the form of a .csv file.
The plots were made by mapping ranks to integers: kyu ranks become negative integers and dan ranks are shifted down by one, so that 1d corresponds to 0 (e.g. 2k -> -2, 1k -> -1, 1d -> 0, 2d -> 1). The tables are based on OGS ranks. They range from 15k to 7d, as that is where almost all of the responses lie.
# Load the survey responses; the relative path means the CSV is looked up in
# the current working directory.
data = pd.read_csv('Go Rank Survey March 2018.csv')
# Preview the first rows (only rendered when this is the last expression of a
# notebook cell).
data.head()
# Print a summary of the columns: names, dtypes and non-null counts.
data.info()
def mapping(x):
    """Convert a Go rank string to an integer on one contiguous scale.

    Kyu ranks become negative integers and every other rank is shifted down
    by one, so that the scale has no gap around zero::

        '2k' -> -2,  '1k' -> -1,  '1d' -> 0,  '2d' -> 1

    Parameters
    ----------
    x : object
        A single cell value. Strings are read as ``<number><suffix>``: a
        trailing ``'k'`` marks a kyu rank, any other final character is
        treated like a dan rank.

    Returns
    -------
    int or object
        The integer rank, or ``x`` unchanged when it has no last character
        (e.g. NaN, ``None``, numbers, the empty string).

    Raises
    ------
    ValueError
        If the text before the final character is not an integer.
    """
    try:
        suffix = x[-1]
    except (TypeError, IndexError):
        # Non-subscriptable values (NaN, None, numbers) raise TypeError;
        # empty strings and numpy scalars raise IndexError. These are passed
        # through untouched so missing answers stay missing. Anything else
        # (e.g. KeyboardInterrupt) is deliberately not swallowed.
        return x
    if suffix == 'k':
        return -int(x[:-1])
    # Shift by one so that 1d lands on 0, directly above 1k at -1.
    return int(x[:-1]) - 1
# Work on every column except the first one, converting each rank string to
# its integer scale value. The slice is copied so `data` itself is never
# modified.
# NOTE(review): `DataFrame.applymap` is deprecated in pandas >= 2.1 in favour
# of `DataFrame.map`; kept here for compatibility with older pandas.
X = data.iloc[:, 1:].copy().applymap(mapping)
# Keep only the columns that have more than 5 non-missing answers.
X = X.loc[:, X.count() > 5]
# Shape of the table restricted to rows with no missing value at all.
X.dropna().shape
# outliers
X = X.drop(index=[164, 95])
%%capture --no-display
sns.pairplot(X.iloc[:,((X.shape[0]-X.isna().sum())>5*3).values], diag_kind='kde', kind='reg');