diff --git a/engineers-employability/data/.~lock.data.csv# b/engineers-employability/data/.~lock.data.csv#
new file mode 100644
index 0000000..db852a0
--- /dev/null
+++ b/engineers-employability/data/.~lock.data.csv#
@@ -0,0 +1 @@
+,thrishik,thrishik-Aspire-E5-573,16.11.2019 20:27,file:///home/thrishik/.config/libreoffice/4;
\ No newline at end of file
diff --git a/engineers-employability/plots/salary vs frequency.png b/engineers-employability/plots/salary vs frequency.png
new file mode 100644
index 0000000..66eff85
Binary files /dev/null and b/engineers-employability/plots/salary vs frequency.png differ
diff --git a/engineers-employability/scripts/salary.py b/engineers-employability/scripts/salary.py
new file mode 100644
index 0000000..002d8f5
--- /dev/null
+++ b/engineers-employability/scripts/salary.py
@@ -0,0 +1,31 @@
+"""Print summary statistics for the dataset and plot a histogram of salaries."""
+
+import pandas as pd
+
+import matplotlib.pyplot as plt
+
+
+# Load dataset (path is relative to the current working directory)
+data = pd.read_csv("../data/data.csv")
+
+
+# Summary statistics
+print(data.describe())
+
+# Series.max() skips NaN; the builtin max() gives order-dependent results
+# when the column contains missing values.
+max_salary = data['Salary'].max()
+
+# Histogram of the Salary column only, 10 equal-width bins over [0, max]
+salary_range = (0, max_salary)
+bins = 10
+
+# Plot the histogram; bins/range are passed by keyword so they cannot be
+# confused with other positional parameters of plt.hist.
+plt.hist(data['Salary'], bins=bins, range=salary_range, color='green',
+         histtype='bar', rwidth=0.8)
+plt.xlabel('Salary')
+plt.ylabel('frequency')
+plt.xticks(fontsize=8)
+plt.tight_layout()
+plt.show()