#!/usr/bin/python3
# -*- coding: utf-8 -*-

# %% pandas
# Many statistics are available directly as methods of a pandas DataFrame.

import numpy as np
import pandas as pd

# Print the built-in documentation of the DataFrame class.
help(pd.DataFrame)

# Load the example data; the path is relative to the working directory.
df = pd.read_csv("employee_birthday.csv")

# Add two demo columns numbered 1..N. The values are sized from the frame
# itself: assigning a fixed 9-element array fails with a length-mismatch
# ValueError whenever the CSV does not contain exactly 9 rows.
df["eid"] = np.arange(1, len(df) + 1)
df["salary"] = np.arange(1, len(df) + 1)

# Summary statistics of the frame, then the mean of a single column.
# These are bare expressions: their results are only echoed when the code is
# run interactively (e.g. as a "# %%" cell), not when run as a plain script.
df.describe()
df["eid"].mean()

# Plot one column as a line and as a box plot, then plot the whole frame.
# NOTE(review): no explicit "show" call is made here, so whether a figure
# window appears presumably depends on the environment -- confirm.
df["eid"].plot()
df["eid"].plot.box()
df.plot()

# see: https://pandas.pydata.org/pandas-docs/stable/getting_started/intro_tutorials/index.html