-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathgetPlots.py
More file actions
37 lines (30 loc) · 1.08 KB
/
getPlots.py
File metadata and controls
37 lines (30 loc) · 1.08 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
from getModels import getData
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
def rand_jitter(arr):
    """Return ``arr`` with a small amount of Gaussian noise added to each entry.

    The noise standard deviation is 1% of the range (max - min) of the
    finite values in ``arr``, so the jitter scales with the data.

    Args:
        arr: Numeric sequence (list, NumPy array or pandas Series).

    Returns:
        ``arr + noise``. For a pandas Series this is a Series; for a list or
        array it is a NumPy array. Empty input yields an empty result.
    """
    values = np.asarray(arr, dtype=float)
    # Only finite entries define the spread: a NaN or +/-inf in the input
    # would otherwise turn the scale (and therefore every output) into
    # NaN/inf. Non-finite entries simply stay non-finite in the result.
    finite = values[np.isfinite(values)]
    # No finite values (including empty input) means there is no range to
    # scale by, so fall back to zero jitter instead of raising.
    spread = finite.max() - finite.min() if finite.size else 0.0
    stdev = 0.01 * spread
    return arr + np.random.randn(len(arr)) * stdev
def printDistribution(data, naics=None, col=None):
    """Show a distribution plot for one slice of ``data``.

    Exactly one view is drawn; ``naics`` takes precedence over ``col``:

    * ``naics`` given: plot ``osmCompleteness`` for rows whose ``naics``
      equals the given code and whose ``countStatcan`` is positive.
    * ``col`` given: plot the values of column ``col`` after discarding
      infinite and missing entries.

    If neither argument is given, nothing is drawn by this function before
    ``plt.show()`` is called.

    Args:
        data: DataFrame with at least the columns used by the chosen view.
        naics: NAICS code to filter on, or ``None``.
        col: Name of the column to plot, or ``None``.
    """
    # NOTE(review): sns.distplot is deprecated in recent seaborn releases
    # (histplot/displot are the replacements) - confirm the seaborn version
    # this project pins before upgrading.
    if naics is not None:
        subset = data[(data["naics"] == naics) & (data["countStatcan"] > 0)]
        sns.distplot(subset["osmCompleteness"])
    elif col is not None:
        # Non-in-place replace: works on a new Series so the caller's
        # DataFrame is never modified and no chained-assignment warning
        # is raised.
        values = data[col].replace([np.inf, -np.inf], np.nan).dropna()
        sns.distplot(values)
    plt.show()
def printScatter(data, naics, col):
    """Show a scatter plot of ``col`` against jittered ``osmCompleteness``.

    Only rows whose ``naics`` equals the given code and whose
    ``countStatcan`` is positive are plotted. Marker size encodes
    ``countStatcan``.

    Args:
        data: DataFrame containing ``naics``, ``countStatcan``,
            ``osmCompleteness`` and the column named by ``col``.
        naics: NAICS code to filter on.
        col: Name of the column to put on the x axis.
    """
    mask = (data["naics"] == naics) & (data["countStatcan"] > 0)
    # Explicit copy: the jittered column is written to a private frame, so
    # the caller's DataFrame is untouched and pandas does not emit a
    # SettingWithCopyWarning.
    subset = data[mask].copy()
    subset["osmCompleteness"] = rand_jitter(subset["osmCompleteness"])
    # x/y are passed by keyword; newer seaborn releases reject them as
    # positional arguments, while keywords work on old and new versions.
    sns.relplot(
        x=col,
        y="osmCompleteness",
        size="countStatcan",
        data=subset,
        alpha=0.5,
    )
    plt.show()
def main():
    """Load the data set via ``getData`` and show the scatter plot.

    The plot is drawn for NAICS code 44511 with ``COL6`` on the x axis.
    """
    frame = getData()
    # Other available views (disabled):
    #   printDistribution(frame, naics=44511)
    #   printDistribution(frame, col="COL1")
    printScatter(frame, naics=44511, col="COL6")


# Run the plot only when executed as a script, not when imported.
if __name__ == "__main__":
    main()