Python SmvModuleRunner示例

编程语言: Python

命名空间/包名称: smv.smvmodulerunner

类/类型: SmvModuleRunner

hotexamples.com的示例: 14

Python SmvModuleRunner - 已找到14个示例。这些是从开源项目中提取的、最受好评的 smv.smvmodulerunner.SmvModuleRunner 真实 Python 示例。您可以对示例进行评价，以帮助我们提高示例质量。

常用方法

显示隐藏

SmvModuleRunner(14)

示例#1

显示文件

文件： smvapp.py 项目： bakhalea/SMV

    def runModule(self, fqn, forceRun=False, quickRun=False):
        """Run a single SmvModule identified by its Fully Qualified Name (fqn).

        Args:
            fqn (str): The FQN of the module to run.
            forceRun (bool): True if the module should be forced to run even
                if it has persisted output; False otherwise. Passed through
                unchanged to the runner.
            quickRun (bool): When True, use the runner's ``quick_run`` entry
                point (skip computing dqm+metadata and persisting csv)
                instead of ``run``.

        Example:
            To get just the dataframe of the module:
                dataframe = smvApp.runModule('package.module.SmvModuleClass')[0]
            To get both the dataframe and the run info collector:
                dataframe, collector = smvApp.runModule('package.module.SmvModuleClass')

        Returns:
            (DataFrame, SmvRunInfoCollector) tuple
            - DataFrame is the computed result of the module
            - SmvRunInfoCollector contains additional information
              about the run, such as validation results.
        """
        target = self.dsm.load(fqn)[0]
        runner = SmvModuleRunner([target], self)

        # Both paths receive the same forceRun flag; only the runner entry
        # point differs.
        if quickRun:
            outcome = runner.quick_run(forceRun)
        else:
            outcome = runner.run(forceRun)

        return self._to_single_run_res(outcome)

示例#2

显示文件

文件： smvapp.py 项目： bakhalea/SMV

    def getRunInfo(self, fqn):
        """Return the run information of a module and all its dependencies
        from the last run.

        Unlike runModule(), which returns the run information just for
        that run, this method returns the run information from the last
        run.

        If no module was run (e.g. the code did not change, so the data
        is read from persistent storage), the SmvRunInfoCollector returned
        from runModule() would be empty, whereas the SmvRunInfoCollector
        returned from this method would contain all latest run information
        about all dependent modules.

        Args:
            fqn (str): fqn of target module

        Returns:
            SmvRunInfoCollector
        """
        target = self.dsm.load(fqn)[0]
        runner = SmvModuleRunner([target], self)
        return runner.get_runinfo()

示例#3

显示文件

文件： testSmvFramework2.py 项目： TresAmigosSD/SMV

    def test_basic_metadata_creation(self):
        """Run M2 and check the FQN and DQM rule count stored in its metadata."""
        fqn = "stage.modules.M2"
        m = self.load(fqn)[0]

        runner = SmvModuleRunner([m], self.smvApp)
        runner.run()

        # Drill into the DQM validation section one level at a time.
        validation = m.module_meta._metadata['_dqmValidation']
        rule_errors = validation['dqmStateSnapshot']['ruleErrors']
        rule_cnt = rule_errors['b_lt_04']['total']
        recorded_fqn = m.module_meta._metadata['_fqn']

        self.assertEqual(recorded_fqn, fqn)
        self.assertEqual(rule_cnt, 1)

示例#4

显示文件

文件： testSmvFramework2.py 项目： TresAmigosSD/SMV

    def test_publish(self):
        """Publish M3 and check that its .csv, .meta and .hist files exist."""
        pub_dir = self.smvApp.all_data_dirs().publishDir
        m = self.load("stage.modules.M3")[0]

        runner = SmvModuleRunner([m], self.smvApp)
        runner.publish(pub_dir)

        # One expected output path per published artifact, keyed by the module FQN.
        templates = ('{}/{}.csv', '{}/{}.meta', '{}/{}.hist')
        expected_paths = [tmpl.format(pub_dir, m.fqn()) for tmpl in templates]

        for path in expected_paths:
            self.assertTrue(os.path.exists(path))

示例#5

显示文件

文件： testSmvFramework2.py 项目： TresAmigosSD/SMV

    def test_purge_persisted(self):
        """Check that purging via a runner built on M3 removes M2's persisted file."""
        m1, m2 = self.load("stage.modules.M2", "stage.modules.M3")

        # Resolve M3's DataFrame; the next assertion expects M2's output
        # to be on disk afterwards.
        self.df("stage.modules.M3")

        path_before = m1.persistStrategy()._file_path
        self.assertTrue(os.path.exists(path_before))

        runner = SmvModuleRunner([m2], self.smvApp)
        runner.purge_persisted()

        # After the purge the persisted file is expected to be gone.
        path_after = m1.persistStrategy()._file_path
        self.assertFalse(os.path.exists(path_after))

示例#6

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _generate_output_modules(self, mods):
     """Run the given modules through a single SmvModuleRunner."""
     runner = SmvModuleRunner(mods, self)
     runner.run()

示例#7

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _publish_modules_locally(self, mods):
     """Publish the given modules to the directory in ``self.cmd_line.exportCsv``."""
     export_dir = self.cmd_line.exportCsv
     runner = SmvModuleRunner(mods, self)
     runner.publish_local(export_dir)

示例#8

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _publish_modules_through_jdbc(self, mods):
     """Publish the given modules via the runner's ``publish_to_jdbc``."""
     runner = SmvModuleRunner(mods, self)
     runner.publish_to_jdbc()

示例#9

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _publish_modules_to_hive(self, mods):
     """Publish the given modules via the runner's ``publish_to_hive``."""
     runner = SmvModuleRunner(mods, self)
     runner.publish_to_hive()

示例#10

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _publish_modules(self, mods):
     """Publish the given modules via the runner's ``publish`` with no arguments."""
     runner = SmvModuleRunner(mods, self)
     runner.publish()

示例#11

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def _purge_current_output_files(self, mods):
     """Purge persisted output for the given modules via ``purge_persisted``."""
     runner = SmvModuleRunner(mods, self)
     runner.purge_persisted()

示例#12

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def publishModuleToHiveByName(self, name):
     """Publish an SmvModule to Hive by its name (can be partial FQN).

     Args:
         name (str): Module name; resolved to an FQN with ``self.dsm.inferFqn``.

     Returns:
         Whatever the runner's ``publish_to_hive`` returns.
     """
     resolved_fqn = self.dsm.inferFqn(name)
     target = self.load_single_ds(resolved_fqn)
     runner = SmvModuleRunner([target], self)
     return runner.publish_to_hive()

示例#13

显示文件

文件： smvapp.py 项目： bakhalea/SMV

 def quickRunModule(self, fqn):
     """Quick-run the module with the given FQN and return the first result.

     Args:
         fqn (str): Fully qualified name of the module to load and run.

     Returns:
         The first element of what the runner's ``quick_run`` returns.
     """
     target = self.dsm.load(fqn)[0]
     runner = SmvModuleRunner([target], self)
     results = runner.quick_run()
     return results[0]

示例#14

显示文件

 def test_publish_to_hive2(self):
     """Publish module M to Hive and compare table ``M`` with the module's DataFrame."""
     module_fqn = "stage.modules.M"
     table_name = "M"

     m = self.load(module_fqn)[0]
     expected_df = self.df(module_fqn)

     runner = SmvModuleRunner([m], self.smvApp)
     runner.publish_to_hive()

     # Read the table back through SQL and compare it with the module output.
     query = "select * from " + table_name
     read_back = self.smvApp.sqlContext.sql(query)
     self.should_be_same(expected_df, read_back)