Esempio n. 1
0
    def process(self):
        claimsDf = pd.read_csv(r("claims.csv"))

        d1 = claimsDf.groupby(["month", "airline"]).count()

        flightsDf = pd.read_csv(r("flights.csv"))
        d2 = flightsDf.groupby(["month", "airline"]).agg({
            "delay": np.sum,
            "cancelled": np.sum
        })

        print(pd.concat([d1, d2]))
        pd.concat([
            d1.filter(["month", "airline", "Item"], axis=1),
            d2.filter(["month", "airline", "delay"], axis=1)
        ]).to_csv(t("all.csv"))
Esempio n. 2
0
def reply(update, context):
    try:
        update.effective_message.reply_text(
            r(
                update.effective_message.text
            )
        )
    except:
        pass
Esempio n. 3
0
 def process(self):
     df = pd.read_csv(r("flights.csv"))
     # df['delay'] = df.apply(lambda x: x['late_aircraft_delay'] + x['carrier_delay'], axis=1)
     df.groupby(["date", "airline"]).agg({
         "delay": np.sum,
         "cancelled": np.sum
     }).to_csv(t("airline_delays.csv"))
     df.groupby(["date",
                 "airline"]).count().to_csv(t("airline_delay_count.csv"))
Esempio n. 4
0
 def process(self):
     df = pd.read_csv(r("claims.csv"))
     df.groupby(["date", "airline"]).count().to_csv(t("claims_count.csv"))
Esempio n. 5
0
def reply(update, context):
    try:
        context.bot.send_chat_action(update.effective_chat.id, "typing")
        update.effective_message.reply_text(r(update.effective_message.text))
    except:
        pass
Esempio n. 6
0
import datetime

from helpers import processedPath as r, tidyPath as t
import pandas as pd
import numpy as np
import sys
import matplotlib
import matplotlib.pyplot as plt

claimsDf = pd.read_csv(r("claims.csv"))
flightsDf = pd.read_csv(r("flights.csv"))

# mostDelayedAirline = flightsDf.groupby(["airline"]).agg({"delay":np.sum})["delay"].sort_values().nlargest(10).index.values
# d = flightsDf[((flightsDf["airline"].isin(mostDelayedAirline)))]
# print(d)
# print(d.groupby(["month","airline"]).agg({"delay":np.sum}))
# sys.exit()

d1 = claimsDf.groupby(["month", "airline"]).count()
d2 = flightsDf.groupby(["month", "airline"]).agg({
    "delay": np.sum,
    "cancelled": np.sum
})

e = lambda x: "../figures/exploratory/" + x
f = lambda x: "../figures/final/" + x
# 1. number of claims
plt.figure()
ax = claimsDf.groupby(["month"])["item"].count().plot()
plt.tight_layout(pad=7)
ax.get_figure().savefig(e("1"))