def testRFC822(self):
        # rfc822 conversion
        dt = DateTime('2002-05-02T08:00:00+00:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 +0000')

        dt = DateTime('2002-05-02T08:00:00+02:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 +0200')

        dt = DateTime('2002-05-02T08:00:00-02:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 -0200')

        # Checking that conversion from local time is working.
        dt = DateTime()
        dts = dt.rfc822().split(' ')
        times = dts[4].split(':')
        _isDST = time.localtime(time.time())[8]
        if _isDST:
            offset = time.altzone
        else:
            offset = time.timezone
        self.assertEqual(dts[0], dt.aDay() + ',')
        self.assertEqual(int(dts[1]), dt.day())
        self.assertEqual(dts[2], dt.aMonth())
        self.assertEqual(int(dts[3]), dt.year())
        self.assertEqual(int(times[0]), dt.h_24())
        self.assertEqual(int(times[1]), dt.minute())
        self.assertEqual(int(times[2]), int(dt.second()))
        self.assertEqual(dts[5], "%+03d%02d" % divmod((-offset / 60), 60))
    def testRFC822(self):
        # rfc822 conversion
        dt = DateTime('2002-05-02T08:00:00+00:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 +0000')

        dt = DateTime('2002-05-02T08:00:00+02:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 +0200')

        dt = DateTime('2002-05-02T08:00:00-02:00')
        self.assertEqual(dt.rfc822(), 'Thu, 02 May 2002 08:00:00 -0200')

        # Checking that conversion from local time is working.
        dt = DateTime()
        dts = dt.rfc822().split(' ')
        times = dts[4].split(':')
        _isDST = time.localtime(time.time())[8]
        if _isDST:
            offset = time.altzone
        else:
            offset = time.timezone
        self.assertEqual(dts[0], dt.aDay() + ',')
        self.assertEqual(int(dts[1]), dt.day())
        self.assertEqual(dts[2], dt.aMonth())
        self.assertEqual(int(dts[3]), dt.year())
        self.assertEqual(int(times[0]), dt.h_24())
        self.assertEqual(int(times[1]), dt.minute())
        self.assertEqual(int(times[2]), int(dt.second()))
        self.assertEqual(dts[5], "%+03d%02d" % divmod((-offset / 60), 60))
Esempio n. 3
0
 def len_month(self, date):
     """ fetches a monthname and returns translation plus lenght """
     if type(date)== StringType:
         date = DateTime(date)
     month = date.aMonth().lower()
     label = 'month_'+month
     tmonth = pmf(label)
     return (tmonth, len(tmonth))
     
Esempio n. 4
0
    def get_time(self):
        """ Get timestamp at the initiation of task

        Returns:
            [string]: [time at task initiation]
        """
        current_time = DateTime(time.time(), "US/Eastern")
        self.timestamp = (str(current_time.year()) +
                          str(current_time.aMonth()) +
                          str(current_time.day()) + str(current_time.h_24()) +
                          str(current_time.minute()) + str(time.time())[:2])
Esempio n. 5
0
def init(dirt,
         task,
         runlist,
         timelist,
         foldlist,
         rep,
         task_token,
         fitmetrics=False):
    current_time = DateTime(time.time(), "US/Eastern")
    if task == "bt":
        taskname = 'binaryTarget'
        if not fitmetrics:
            fitmetrics = autosklearn.metrics.log_loss
    elif task == "bre":
        taskname = 'binaryRareEvent'
        if not fitmetrics:
            fitmetrics = autosklearn.metrics.log_loss
    elif task == "it":
        taskname = 'intervalTarget'
        if not fitmetrics:
            fitmetrics = autosklearn.metrics.mean_squared_error
    sasdatalist = sorted(glob.glob(dirt + taskname + "/*sas7bdat"),
                         key=os.path.getsize)
    print(sasdatalist)
    sasdatalist = remove_dirt(sasdatalist, dirt + "/" + taskname + "/")
    print(sasdatalist)
    sasdatalist = [i[:-9] for i in sasdatalist]
    print("sas datalist\n", sasdatalist)
    #sasdatalist = sorted(sasdatalist)

    csvdatalist = sorted(glob.glob(dirt + taskname + "/*.csv"),
                         key=os.path.getsize)
    csvdatalist = remove_dirt(csvdatalist, dirt + "/" + taskname + "/")
    csvdatalist = [i[:-4] for i in csvdatalist]
    print("csv datalist\n", csvdatalist)
    #csvdatalist = sorted(csvdatalist)

    #glob.glob(dirt + taskname+"/*sas7bdat")
    metalist = glob.glob(dirt + "/tmp_metadata/*meta.csv")
    metalist = remove_dirt(metalist, dirt + "/tmp_metadata/")
    metalist = [i[:-9] for i in metalist]
    print("working dirt\t", dirt)
    print("metadatalit\n", metalist)
    #metalist = sorted(metalist)
    timestamp = (str(current_time.year()) + str(current_time.aMonth()) +
                 str(current_time.day()) + str(current_time.h_24()) +
                 str(current_time.minute()) + str(time.time())[:2])
    logfile = open(
        "results/log_" + str(len(runlist)) + "dataset_" + str(timelist[0]) +
        "s_" + str(foldlist[0]) + "f_rep" + str(rep) + "_task_" +
        str(task_token) + ".txt",
        "w",
    )
    return dirt, taskname, logfile, csvdatalist, sasdatalist, metalist, timestamp, fitmetrics,
Esempio n. 6
0
    def fromLineFrom(self,email,date):
        """
        Generate a conformant mbox From line from email and date strings.

        (unless date is unparseable, in which case we omit that part)
        """
        # "email" is in fact a real name or zwiki username - adapt it
        email = re.sub(r'\s','',email) or 'unknown'
        try:
            d = DateTime(date)
            return 'From %s %s %s %d %02d:%02d:%02d %s %d\n' % (
                email,d.aDay(),d.aMonth(),d.day(),d.hour(),
                d.minute(),d.second(),d.timezone(),d.year())
        except (DateTimeSyntaxError,AttributeError,IndexError):
            return 'From %s\n' % email
Esempio n. 7
0
    warnings.simplefilter("ignore")
current_time = DateTime(time.time(), 'US/Eastern')
###################################################################
# Use sklearn to holdout, read in original data
#######################################################################

framework = 'autosklearn'
datasetn = 'bankmarketing'
foldn = 3
timeforjob = foldn * 2 * 1800
prepart = True
ncore = 4
dirt = '/root/data/'
############################################################################################################
resultfile = str(datasetn)+str(foldn) +"fold"+ str(timeforjob) + "seconds" + str(ncore)+"core"+\
str(current_time.year()) + str(current_time.aMonth())+ str(current_time.day()) + \
str(current_time.h_24()) + str(current_time.minute())  + str(time.time())[:2] + str(framework)+'prepart.txt'
dataset = "uci_bank_marketing_pd"
numeric_features = []
categorical_features = []


def prep(dataset,
         dirt,
         numeric_features,
         categorical_features,
         delim=',',
         indexdrop=False):
    index_features = ['_dmIndex_', '_PartInd_']
    data = pd.read_csv(dirt + dataset + '.csv',
                       delimiter=delim)  # panda.DataFrame