Python Datasets.ZooplaMatchedDaily Beispiele

Programmiersprache: Python

Klasse / Typ: Datasets

Methode / Funktion: ZooplaMatchedDaily

Beispiele auf hotexamples.com: 3

Python Datasets.ZooplaMatchedDaily – 3 Beispiele gefunden. Dies sind die am besten bewerteten Python-Beispiele für Datasets.ZooplaMatchedDaily aus dem Paket modeldb, die aus Open-Source-Projekten extrahiert wurden. Sie können die Beispiele bewerten und so dazu beitragen, ihre Qualität zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

Datasets(9)

EHSinterview(5)

Dataset(3)

ZooplaMatchedDaily(3)

FastDepthDataset(3)

SpeechYoloDataSet(3)

ImbalancedDatasetSampler(2)

KittiDataset(2)

PrepareCrossFold(2)

ZooplaRawCollated(2)

CelebA(2)

PSCDataset(2)

NYUDataset(2)

ZooplaMatchedCollated(2)

SLDataPreprocess(2)

SLdatasetbyCity(1)

PaintingsDataset(1)

Solar(1)

SLdatasetbyDate(1)

SVHNdel(1)

Shakespeare(1)

Market1501EvaluateDataset(1)

Traffic(1)

TrainingDataset(1)

TumorSim(1)

ZooplaMatchedAggregated(1)

MultiDataset(1)

ApplesOranges(1)

MRBrainS18(1)

ExchangeRate(1)

BrainWeb(1)

CIFAR100del(1)

CIFAR10del(1)

CUHK03EvaluateDataset(1)

DataSet(1)

EHSincome(1)

Electricity(1)

FMNISTdel(1)

MRBrainS17(1)

Femnist(1)

HPIMonthly(1)

IBSR(1)

ImageNet(1)

MARSEvalDataset(1)

ML100K(1)

BraTS12(1)

MRBrainS13(1)

MNISTdel(1)

Beispiel #1

Datei anzeigen

def CalculatePriceChanges():
    """Build a price-change distribution from the daily Zoopla listings.

    Reads the first 500000 rows of ``ds.ZooplaMatchedDaily()``, keeps the
    ``SALE`` rows whose ``PRICE`` is positive and walks them in row order.
    The first row seen for a listing creates a ``PriceCalc`` record; every
    later row for the same listing is passed to that record's ``add`` and
    then reported to the distribution as ``noChange`` (price equal to the
    previously recorded one) or ``addChange`` (price differs).

    Returns:
        The ``DiscountDistribution`` instance that was filled in.
    """
    distribution = DiscountDistribution()
    priceMap = {}
    #    data = ds.ZooplaMatchedDaily(2000000) # during rising housing market
    data = ds.ZooplaMatchedDaily()  # at bottom of housing market
    chunk = data.read(500000)
    # The first column header carries a UTF-8 byte-order mark; strip it so
    # the column can be addressed by its plain name.
    chunk.rename(columns={'\xef\xbb\xbfLISTING ID': 'LISTING ID'},
                 inplace=True)
    # Build ONE mask on the unfiltered frame. Applying the PRICE mask to an
    # already filtered frame (as chained [] indexing does) relies on pandas
    # silently re-aligning a mask whose index no longer matches.
    wanted = (chunk["MARKET"] == "SALE") & (chunk['PRICE'] > 0)
    filteredchunk = chunk.loc[wanted, ['LISTING ID', 'DAY', 'PRICE']]
    for listingid, day, price in filteredchunk.values:
        lastRecord = priceMap.get(listingid)
        if lastRecord is None:
            # First sighting of this listing: start tracking it.
            priceMap[listingid] = PriceCalc(day, price)
            continue
        # Remember the price before add() updates the record.
        oldPrice = lastRecord.currentprice
        startDay, endDay, percent = lastRecord.add(day, price)
        # Days are scaled by 30 (presumably days -> months; confirm).
        if oldPrice == price:  # no price change
            distribution.noChange(startDay / 30, endDay / 30)
        else:  # price has changed
            distribution.addChange(startDay / 30, endDay / 30, percent)
    return distribution

Beispiel #2

Datei anzeigen

def ZooplaPriceChanges():
    """Track listing prices, then report how many deleted listings kept them.

    Phase 1 reads 1000 rows of ``ds.ZooplaMatchedDaily()``, keeps ``SALE``
    rows with a positive ``PRICE`` and, per listing, either creates a
    ``PriceCalc`` record (first sighting) or feeds the row to the record's
    ``add`` and forwards the result to ``distribution.add``.

    Phase 2 reads 1000 rows of ``ds.ZooplaMatchedCollated()`` and, for every
    ``SALE`` row whose listing is being tracked, counts it (``total``),
    counts it as unchanged when its current price equals its initial market
    price (``pSame``), records a final ``add(DELETED, 0)`` and stops
    tracking the listing.

    Prints the number of listings still tracked, then
    ``pSame total pSame/total``, and finally calls ``plotProbability`` on
    ``distribution.dist``. Returns nothing.
    """
    total = 0
    pSame = 0
    priceMap = {}
    # NOTE(review): ``distribution`` is not created in this function (its
    # local construction was commented out); it is presumably a module-level
    # DiscountDistribution -- confirm.
    data = ds.ZooplaMatchedDaily()
    chunk = data.read(1000)
    # The first column header carries a UTF-8 byte-order mark; strip it.
    chunk.rename(columns={'\xef\xbb\xbfLISTING ID': 'LISTING ID'},
                 inplace=True)
    # One mask built on the unfiltered frame, instead of applying the PRICE
    # mask to an already filtered frame and relying on implicit re-alignment.
    wanted = (chunk["MARKET"] == "SALE") & (chunk['PRICE'] > 0)
    filteredchunk = chunk.loc[wanted, ['LISTING ID', 'DAY', 'PRICE']]
    for listingid, day, price in filteredchunk.values:
        currentState = priceMap.get(listingid)
        if currentState is None:
            priceMap[listingid] = PriceCalc(day, price)
        else:
            startDay, endDay, percent = currentState.add(day, price)
            distribution.add(startDay, endDay, percent)

    # now get deletion dates
    delData = ds.ZooplaMatchedCollated()
    chunk = delData.read(1000)
    chunk.rename(columns={'\xef\xbb\xbfLISTING ID': 'LISTING ID'},
                 inplace=True)
    filteredchunk = chunk[chunk["MARKET"] == "SALE"][['LISTING ID', 'DELETED']]
    for listingid, deleted in filteredchunk.values:
        # Removing the entry here means a listing is only counted once even
        # if it appears in several deletion rows.
        currentState = priceMap.pop(listingid, None)
        if currentState is None:
            continue
        if currentState.currentprice == currentState.initialmarketprice:
            pSame += 1
        total += 1
        # A price of 0 is recorded at the deletion date.
        startDay, endDay, percent = currentState.add(deleted, 0)
        distribution.add(startDay, endDay, percent)

    # Single-argument print(...) produces the same output under Python 2's
    # print statement and also parses under Python 3.
    print(len(priceMap))
    # With no matched deletions the ratio is undefined; report nan instead
    # of raising ZeroDivisionError before the plot is drawn.
    ratio = pSame * 1.0 / total if total else float('nan')
    print("%s %s %s" % (pSame, total, ratio))
    plotProbability(distribution.dist)

Beispiel #3

Datei anzeigen

def ZooplaPriceChanges():
    """Estimate, per 30-day bin on the market, how often a price changes.

    Phase 1 reads 10000000 rows of ``ds.ZooplaMatchedDaily()`` and keeps
    ``SALE`` rows with a positive ``PRICE``. For every repeat sighting of a
    listing it records ``daysonmarket // 30`` in ``nochange`` (price equal
    to the record's current price) or in ``change`` (price differs, with the
    percentage difference also stored in ``changeprice``), then updates the
    listing's ``PriceCalc`` record and ``distribution``.

    Phase 2 reads 10000000 rows of ``ds.ZooplaMatchedCollated()``, prints
    ``pSame total pSame/total`` for tracked listings that appear in ``SALE``
    deletion rows, records a final ``add(DELETED, 0)`` for each and stops
    tracking it, then prints the number of listings still tracked.

    Side effects: assigns the module globals ``savedOutput1`` (nochange),
    ``savedOutput2`` (change), ``savedOutput3`` (changeprice), ``n``, ``n1``
    and ``n2``; calls ``plotProbability`` and draws two ``pyl.hist`` plots.

    Returns:
        Tuple ``(n, n1, n2)`` where ``n1`` / ``n2`` are the histogram counts
        of the no-change / change observations and ``n = n2 / (n1 + n2)``.

    Raises:
        ValueError: if no repeat sighting was recorded at all, because the
            bin range cannot be derived from empty data.
    """
    global savedOutput1, savedOutput2, savedOutput3
    global n, n1, n2

    total = 0
    pSame = 0
    priceMap = {}
    # NOTE(review): ``distribution`` is not created in this function (its
    # local construction was commented out); it is presumably a module-level
    # DiscountDistribution -- confirm.
    data = ds.ZooplaMatchedDaily()
    chunk = data.read(10000000)
    # The first column header carries a UTF-8 byte-order mark; strip it.
    chunk.rename(columns={'\xef\xbb\xbfLISTING ID': 'LISTING ID'},
                 inplace=True)
    # One mask built on the unfiltered frame, instead of applying the PRICE
    # mask to an already filtered frame and relying on implicit re-alignment.
    wanted = (chunk["MARKET"] == "SALE") & (chunk['PRICE'] > 0)
    filteredchunk = chunk.loc[wanted, ['LISTING ID', 'DAY', 'PRICE']]
    change = []
    changeprice = []
    nochange = []
    for listingid, day, price in filteredchunk.values:
        record = priceMap.get(listingid)
        if record is None:
            priceMap[listingid] = PriceCalc(day, price)
            continue
        # Explicit floor division: the bins below are built with range(),
        # which needs whole numbers.
        months = record.daysonmarket // 30
        if record.currentprice == price:
            # no change
            nochange.append(months)
        else:
            change.append(months)
            # Multiply by 100.0 before dividing so integer prices are not
            # floor-divided under Python 2 (which would collapse the
            # percentage to a multiple of 100).
            changeprice.append(
                [months, -(record.currentprice - price) * 100.0 / price])
        startDay, endDay, percent = record.add(day, price)
        distribution.add(startDay, endDay, percent)

    # now get deletion dates
    delData = ds.ZooplaMatchedCollated()
    chunk = delData.read(10000000)
    chunk.rename(columns={'\xef\xbb\xbfLISTING ID': 'LISTING ID'},
                 inplace=True)
    filteredchunk = chunk[chunk["MARKET"] == "SALE"][['LISTING ID', 'DELETED']]
    deletions = filteredchunk.values

    # First pass only counts; nothing is removed from priceMap yet, so a
    # listing that appears in several deletion rows is counted each time.
    for row in deletions:
        record = priceMap.get(row[0])
        if record is not None:
            if record.currentprice == record.initialmarketprice:
                pSame += 1
            total += 1

    # With no matched deletions the ratio is undefined; report nan instead
    # of raising ZeroDivisionError. Single-argument print(...) produces the
    # same output under Python 2 and also parses under Python 3.
    ratio = pSame * 1.0 / total if total else float('nan')
    print("%s %s %s" % (pSame, total, ratio))

    # Second pass records the deletion (price 0) and stops tracking.
    for row in deletions:
        record = priceMap.pop(row[0], None)
        if record is not None:
            startDay, endDay, percent = record.add(row[1], 0)
            distribution.add(startDay, endDay, percent)

    print(len(priceMap))

    savedOutput1 = nochange
    savedOutput2 = change
    savedOutput3 = changeprice
    plotProbability(distribution.dist)

    # Both histograms must share one set of bin edges; with independently
    # derived ranges n1 and n2 can differ in length and the element-wise
    # ratio below would fail.
    observed = nochange + change
    bins = range(min(observed), max(observed) + 1, 1)
    n1 = pyl.hist(savedOutput1, bins=bins)[0]
    n2 = pyl.hist(savedOutput2, bins=bins)[0]

    # 2-D histogram of (bin on market, percent change). The result is not
    # used further at present.
    dist, _, _ = np.histogram2d([x[0] for x in savedOutput3],
                                [x[1] for x in savedOutput3],
                                range=[[0, 30], [-30, 0]],
                                bins=[30, 20])

    # Share of observations in each bin where the price changed.
    n = n2 / (n1 + n2)

    return (n, n1, n2)