# Example 1
def test_classpath_script_works():
    """The sagemakerpyspark-jars console script must emit the same jar list
    as sagemaker_pyspark.classpath_jars(), comma-separated by default.
    """
    p = subprocess.Popen(["sagemakerpyspark-jars"], stdout=subprocess.PIPE)
    output, _ = p.communicate()
    # A non-zero exit code means the script itself failed; surface that
    # instead of a confusing downstream length mismatch.
    assert p.returncode == 0

    jars = sagemaker_pyspark.classpath_jars()

    # strip() drops the trailing newline the script prints; without it the
    # newline stays attached to the last jar path in the split list.
    script_jars = output.decode('utf-8').strip().split(",")
    assert len(jars) == len(script_jars)
    assert jars[0] == script_jars[0]
# Example 2
def test_classpath_script_can_use_separators():
    """Passing a separator argument (here ':') to sagemakerpyspark-jars must
    change the delimiter used to join the jar paths.
    """
    p = subprocess.Popen("sagemakerpyspark-jars :".split(),
                         stdout=subprocess.PIPE)
    output, _ = p.communicate()
    # Fail fast if the console script itself exited with an error.
    assert p.returncode == 0

    jars = sagemaker_pyspark.classpath_jars()

    # strip() removes the trailing newline so it is not glued onto the
    # final jar path after splitting on ':'.
    script_jars = output.decode('utf-8').strip().split(":")
    assert len(jars) == len(script_jars)
    assert jars[0] == script_jars[0]
def with_spark_context():
    """Yield a SparkContext configured with the SageMaker Spark jars.

    Creates a context on first use (reusing any already-active one) and
    guarantees it is stopped on teardown, even when the consuming test
    raises — the original version skipped teardown on test failure.
    """
    os.environ['SPARK_CLASSPATH'] = ":".join(classpath_jars())
    conf = (SparkConf().set("spark.driver.extraClassPath",
                            os.environ['SPARK_CLASSPATH']))

    if SparkContext._active_spark_context is None:
        SparkContext(conf=conf)

    sc = SparkContext._active_spark_context
    try:
        yield sc
    finally:
        # TearDown: always stop the context so state never leaks between tests.
        sc.stop()
import os
import boto3

from pyspark import SparkContext, SparkConf
from pyspark.sql import SparkSession

import sagemaker
from sagemaker import get_execution_role
import sagemaker_pyspark

# Resolve the IAM role this notebook/execution environment runs under.
role = get_execution_role()

# Configure Spark to use the SageMaker Spark dependency jars
jars = sagemaker_pyspark.classpath_jars()

# Reuse the jar list computed above instead of calling classpath_jars() twice.
classpath = ":".join(jars)

# See the SageMaker Spark Github to learn how to connect to EMR from a notebook instance
spark = SparkSession.builder.config("spark.driver.extraClassPath", classpath)\
    .master("local[*]").getOrCreate()

spark

# China regions use the '.com.cn' S3 endpoint domain; all others use '.com'.
# (boto3 is already imported at the top of the file.)
cn_regions = ['cn-north-1', 'cn-northwest-1']
region = boto3.Session().region_name
endpoint_domain = 'com.cn' if region in cn_regions else 'com'
spark._jsc.hadoopConfiguration().set(
    'fs.s3a.endpoint', 's3.{}.amazonaws.{}'.format(region, endpoint_domain))