Ejemplo n.º 1
0
 def connection(self):
     return Model.get_connection_resolver().connection()
Ejemplo n.º 2
0
 def tearDownClass(cls):
     Model.unset_connection_resolver()
Ejemplo n.º 3
0
 def setUpClass(cls):
     Model.set_connection_resolver(DatabaseIntegrationConnectionResolver())
Ejemplo n.º 4
0
# class Source(Model):
#     pass

# source = Source.all()

from eloquent import DatabaseManager, Model

config = {
    'default': 'mysql',
    'mysql': {
        'driver': 'mysql',
        'host': 'localhost',
        'port': 33060,
        'database': 'aauuss',
        'user': '******',
        'password': '******',
        'prefix': ''
    }
}

db = DatabaseManager(config)
Model.set_connection_resolver(db)


class Source(Model):
    pass


source = Source.all()
Ejemplo n.º 5
0
    def createDatawarehouseClient(self):
        monthList = {
            '01': 'Jan',
            '02': 'Feb',
            '03': 'Mar',
            '04': 'Apr',
            '05': 'May',
            '06': 'Jun',
            '07': 'Jul',
            '08': 'Aug',
            '09': 'Sep',
            '10': 'Oct',
            '11': 'Nov',
            '12': 'Dec'
        }
        mydb = mysql.connector.connect(host="localhost",
                                       user="******",
                                       passwd="",
                                       database="interDB")
        mycursor = mydb.cursor()
        mycursor.execute(
            "select country, countryCode, date, dateCode, sum(confirmed) as coronaConfirmed,"
            " sum(deaths) as coronaDeaths, sum(recovered) as coronaRecovered from covidstats "
            "group by country, countryCode, date, dateCode")
        result = mycursor.fetchall()
        preProcessing = TweetsPreProcessing()
        configdb = {
            'mysql': {
                'driver': 'mysql',
                'host': 'localhost',
                'database': 'clientdb',
                'user': '******',
                'password': '',
                'prefix': ''
            }
        }

        db = DatabaseManager(configdb)
        Model.set_connection_resolver(db)
        cpt = 0
        for row in result:
            year = row[3][:4]
            month = row[3][4:6]
            day = row[3][6:8]
            dayOfYear = date.fromisoformat(year + '-' + month + '-' +
                                           day).timetuple().tm_yday
            spring = range(80, 172)
            summer = range(172, 264)
            autumn = range(264, 355)
            if dayOfYear in spring:
                season = 'spring'
            elif dayOfYear in summer:
                season = 'summer'
            elif dayOfYear in autumn:
                season = 'autumn'
            else:
                season = 'winter'
            timeAltID = row[3]
            monthName = monthList[month]

            rowLocation = preProcessing.getLocation(row[0])
            rowTime = [
                timeAltID, dayOfYear, day, month, monthName, year, season
            ]

            time = DimTime()
            location = DimLocation()
            factCovCase = FactCovCase()

            # fill the dimensions
            timeID = time.insert(rowTime)
            locationID = location.insert(rowLocation)
            # fill the dimensions

            # fill the fact table with foreign keys & mesures
            nbrOfCases = row[4]
            nbrOfDeath = row[5]
            nbrOfRecovered = row[6]
            row = [locationID, timeID, nbrOfCases, nbrOfDeath, nbrOfRecovered]
            factCovCase.insert(row)
            cpt += 1
            print(cpt)
    def createDatawareHouse(self, analysisID, numberOfTweets):

        # get all the different concepts for this client
        #allConcepts = dbIntermediary.table('alltweets').select(dbIntermediary.raw('distinct concept')).where('analysisID', '=', analysisID).get()
        configdb = {
            'mysql': {
                'driver': 'mysql',
                'host': 'localhost',
                'database': 'datawarehouse',
                'user': '******',
                'password': '',
                'prefix': ''
            }
        }

        db = DatabaseManager(configdb)
        Model.set_connection_resolver(db)
        '''for temp in allConcepts:
            concept = temp['concept']
            print('concept is : ',concept)
            print("hello")
            #-----------------------------------------
            # Fill the Fact Tweet Table
            data = dbIntermediary.table('alltweets').select(dbIntermediary.raw(
                'alltweets.languageName, alltweets.sourceName, alltweets.timeAltID, alltweets.sentimentLabel, alltweets.cityName, count(*) as numberOfTweets'))\
                .where('alltweets.analysisID', '=', analysisID).where('alltweets.concept', '=', concept)\
                .group_by('alltweets.languageName', 'alltweets.sourceName', 'alltweets.timeAltID', 'alltweets.sentimentLabel', 'alltweets.cityName')\
                .get()

            conceptTable = DimConcept()
            rowConcept = [concept]
            conceptID = conceptTable.insert(rowConcept)
            cpt = 0
            for tuple in data:
                temp = dbIntermediary.table('alltweets').select(dbIntermediary.raw('*')).where(
                    'languageName', '=', tuple['languageName']).where(
                    'sourceName', '=', tuple['sourceName']).where(
                    'timeAltID', '=', tuple['timeAltID']).where(
                    'sentimentLabel', '=', tuple['sentimentLabel']).where(
                    'cityName', '=', tuple['cityName']).get()

                row = temp[0]
                rowSentiment = [row['sentimentLabel']]
                rowSource = [row['sourceName']]
                rowTime = [row['timeAltID'], row['dayOfWeek'], row['day'], row['month'], row['monthName'], row['year'],
                           row['season']]
                rowLocation = [row['locationAltID'], row['cityName'], row['countryID'], row['countryName'],
                               row['continentID'], row['continentName']]
                rowLanguage = [row['languageCode'], row['languageName']]

                # instanciate the DB tables
                time = DimTime()
                sentiment = DimSentiment()
                language = DimLanguage()
                location = DimLocation()
                source = DimSource()
                factTweet = FactTweet()

                # fill the dimensions
                timeID = time.insert(rowTime)
                sentimentID = sentiment.insert(rowSentiment)
                languageID = language.insert(rowLanguage)
                locationID = location.insert(rowLocation)
                sourceID = source.insert(rowSource)

                # fill the fact table with foreign keys & mesures
                numberOfTweets = tuple['numberOfTweets']
                row = [conceptID, locationID, sourceID, languageID, timeID, sentimentID, numberOfTweets]
                factTweet.insert(row)
                cpt += 1
                print(cpt, "tuple inserted", sep=" ")
            print("All tuples are inserted For the Fact Tweet for the concept :", concept)
# ----------------------------------------------------------------------------------------------------------------
            # Fill the Fact Sentiment Table
            data = dbIntermediary.table('alltweets').select(
                dbIntermediary.raw('languageName, timeAltID, cityName, avg(sentimentValue) as averageSentiment'))\
                .where('analysisID', '=', analysisID).where('concept', '=', concept).group_by(
                'languageName', 'timeAltID', 'cityName').get()
            cpt = 0
            for tuple in data:
                temp = dbIntermediary.table('alltweets').select(dbIntermediary.raw('*')).where(
                    'languageName', '=', tuple['languageName']).where(
                    'timeAltID', '=', tuple['timeAltID']).where(
                    'cityName', '=', tuple['cityName']).get()

                row = temp[0]
                rowTime = [row['timeAltID'], row['dayOfWeek'], row['day'], row['month'], row['monthName'], row['year'],
                           row['season']]
                rowLocation = [row['locationAltID'], row['cityName'], row['countryID'], row['countryName'],
                               row['continentID'], row['continentName']]
                rowLanguage = [row['languageCode'], row['languageName']]

                # instanciate the DB tables
                time = DimTime()
                language = DimLanguage()
                location = DimLocation()
                factSentiment = FactSentiment()

                # fill the dimensions
                timeID = time.insert(rowTime)
                languageID = language.insert(rowLanguage)
                locationID = location.insert(rowLocation)

                # fill the fact table with foreign keys & mesures
                averageSentiment = tuple['averageSentiment']
                row = [conceptID, locationID, languageID, timeID, averageSentiment]

                factSentiment.insert(row)
                cpt += 1
                print(cpt, "tuple inserted", sep=" ")
            print("All tuples are inserted For the Fact Sentiment for the concept :", concept)'''
        listIDTweets = []
        if numberOfTweets > 0:
            listIDTweets = dbIntermediary.table('alltweets') \
                .select('tweetID') \
                .where('analysisID', '=', analysisID) \
                .take(numberOfTweets)\
                .get()
            temp = []
            for element in listIDTweets:
                temp.append(element['tweetID'])
            listIDTweets = temp
            print(listIDTweets.__len__(), listIDTweets)
            data = dbIntermediary.table('alltweets')\
                .select(dbIntermediary.raw('languageCode , languageName, locationAltID, cityName, countryID, countryName, continentID, continentName, timeAltID ,dayOfWeek, day, month, monthName, year, season, sourceName, sentimentLabel, concept, count(*) as numberOfTweets'))\
                .where('analysisID', '=', analysisID)\
                .where_in('tweetID', listIDTweets)\
                .group_by('languageCode', 'languageName', 'locationAltID', 'cityName', 'countryID', 'countryName', 'continentID', 'continentName', 'timeAltID' ,'dayOfWeek', 'day', 'month', 'monthName', 'year', 'season', 'sourceName', 'sentimentLabel', 'concept')\
                .get()
        else:
            data = dbIntermediary.table('alltweets') \
                .select(dbIntermediary.raw(
                'languageCode , languageName, locationAltID, cityName, countryID, countryName, continentID, continentName, timeAltID ,dayOfWeek, day, month, monthName, year, season, sourceName, sentimentLabel, concept, count(*) as numberOfTweets')) \
                .where('analysisID', '=', analysisID) \
                .group_by('languageCode', 'languageName', 'locationAltID', 'cityName', 'countryID', 'countryName',
                          'continentID', 'continentName', 'timeAltID', 'dayOfWeek', 'day', 'month', 'monthName', 'year',
                          'season', 'sourceName', 'sentimentLabel', 'concept') \
                .get()
        cpt = 0
        for row in data:
            rowSentiment = [row['sentimentLabel']]
            rowSource = [row['sourceName']]
            rowTime = [
                row['timeAltID'], row['dayOfWeek'], row['day'], row['month'],
                row['monthName'], row['year'], row['season']
            ]
            rowLocation = [
                row['locationAltID'], row['cityName'], row['countryID'],
                row['countryName'], row['continentID'], row['continentName']
            ]
            rowLanguage = [row['languageCode'], row['languageName']]
            rowConcept = [row['concept']]

            # instanciate the DB tables
            time = DimTime()
            sentiment = DimSentiment()
            language = DimLanguage()
            location = DimLocation()
            source = DimSource()
            factTweet = FactTweet()
            conceptTable = DimConcept()
            # fill the dimensions
            timeID = time.insert(rowTime)
            sentimentID = sentiment.insert(rowSentiment)
            languageID = language.insert(rowLanguage)
            locationID = location.insert(rowLocation)
            sourceID = source.insert(rowSource)
            conceptID = conceptTable.insert(rowConcept)

            # fill the fact table with foreign keys & mesures
            numberOfTweet = row['numberOfTweets']
            row = [
                conceptID, locationID, sourceID, languageID, timeID,
                sentimentID, numberOfTweet
            ]
            factTweet.insert(row)
            cpt += 1
            print(cpt, "tuple inserted", sep=" ")
        #print(listIDTweets)
# ----------------------------------------------------------------------------------------------------------------
# Fill the Fact Sentiment Table
        if numberOfTweets > 0:
            data = dbIntermediary.table('alltweets').select(
                dbIntermediary.raw('languageCode , languageName, locationAltID, cityName, countryID, countryName, continentID, continentName, timeAltID ,dayOfWeek, day, month, monthName, year, season, concept, avg(sentimentValue) as averageSentiment'))\
                .where('analysisID', '=', analysisID)\
                .where_in('tweetID', listIDTweets)\
                .group_by('languageCode', 'languageName', 'locationAltID', 'cityName', 'countryID', 'countryName',
                              'continentID', 'continentName', 'timeAltID', 'dayOfWeek', 'day', 'month', 'monthName', 'year',
                              'season', 'concept').get()
        else:
            data = dbIntermediary.table('alltweets').select(
                dbIntermediary.raw(
                    'languageCode , languageName, locationAltID, cityName, countryID, countryName, continentID, continentName, timeAltID ,dayOfWeek, day, month, monthName, year, season, concept, avg(sentimentValue) as averageSentiment')) \
                .where('analysisID', '=', analysisID) \
                .group_by('languageCode', 'languageName', 'locationAltID', 'cityName', 'countryID', 'countryName',
                          'continentID', 'continentName', 'timeAltID', 'dayOfWeek', 'day', 'month', 'monthName', 'year',
                          'season', 'concept').get()
        cpt = 0
        for row in data:
            print(row)
            rowTime = [
                row['timeAltID'], row['dayOfWeek'], row['day'], row['month'],
                row['monthName'], row['year'], row['season']
            ]
            rowLocation = [
                row['locationAltID'], row['cityName'], row['countryID'],
                row['countryName'], row['continentID'], row['continentName']
            ]
            rowLanguage = [row['languageCode'], row['languageName']]
            rowConcept = [row['concept']]

            # instanciate the DB tables
            time = DimTime()
            language = DimLanguage()
            location = DimLocation()
            concept = DimConcept()
            factSentiment = FactSentiment()

            # fill the dimensions
            timeID = time.insert(rowTime)
            languageID = language.insert(rowLanguage)
            locationID = location.insert(rowLocation)
            conceptID = concept.insert(rowConcept)

            # fill the fact table with foreign keys & mesures
            averageSentiment = row['averageSentiment']
            row = [conceptID, locationID, languageID, timeID, averageSentiment]

            factSentiment.insert(row)
            cpt += 1
            print(cpt, "tuple inserted", sep=" ")


# ----------------------------------------------------------------------------------------------------------------
        '''# Fill the Fact CovCase Table