#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
import os
import shutil
import stat
import tempfile
import threading
import time
import unittest
from collections import namedtuple

from pyspark import SparkConf, SparkFiles, SparkContext
from pyspark.testing.utils import ReusedPySparkTestCase, PySparkTestCase, QuietTest, SPARK_HOME

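# Reliable checkpointing: each test writes RDD checkpoints to a temporary
# checkpoint directory set via SparkContext.setCheckpointDir() and verifies
# that the checkpointed data can be read back.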
class CheckpointTests(ReusedPySparkTestCase):

    def setUp(self):
        self.checkpointDir = tempfile.NamedTemporaryFile(delete=False)
        os.unlink(self.checkpointDir.name)
        self.sc.setCheckpointDir(self.checkpointDir.name)

    def tearDown(self):
        shutil.rmtree(self.checkpointDir.name)

    def test_basic_checkpointing(self):
        parCollection = self.sc.parallelize([1, 2, 3, 4])
        flatMappedRDD = parCollection.flatMap(lambda x: range(1, x + 1))

        self.assertFalse(flatMappedRDD.isCheckpointed())
        self.assertTrue(flatMappedRDD.getCheckpointFile() is None)
        self.assertFalse(self.sc.getCheckpointDir() is None)

        flatMappedRDD.checkpoint()
        result = flatMappedRDD.collect()
        time.sleep(1)  # 1 second
        self.assertTrue(flatMappedRDD.isCheckpointed())
        self.assertEqual(flatMappedRDD.collect(), result)
        self.assertEqual("file:" + self.checkpointDir.name,
                         os.path.dirname(os.path.dirname(flatMappedRDD.getCheckpointFile())))
        self.assertEqual(self.sc.getCheckpointDir(),
                         os.path.dirname(flatMappedRDD.getCheckpointFile()))

    def test_checkpoint_and_restore(self):
        parCollection = self.sc.parallelize([1, 2, 3, 4])
        flatMappedRDD = parCollection.flatMap(lambda x: [x])

        self.assertFalse(flatMappedRDD.isCheckpointed())
        self.assertTrue(flatMappedRDD.getCheckpointFile() is None)

        flatMappedRDD.checkpoint()
        flatMappedRDD.count()  # forces a checkpoint to be computed
        time.sleep(1)  # 1 second

        self.assertTrue(flatMappedRDD.getCheckpointFile() is not None)
        recovered = self.sc._checkpointFile(flatMappedRDD.getCheckpointFile(),
                                            flatMappedRDD._jrdd_deserializer)
        self.assertEqual([1, 2, 3, 4], recovered.collect())

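# Local checkpointing: RDD.localCheckpoint() truncates the lineage using
# executor-local storage, so no checkpoint directory needs to be configured.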
class LocalCheckpointTests(ReusedPySparkTestCase):

    def test_basic_localcheckpointing(self):
        parCollection = self.sc.parallelize([1, 2, 3, 4])
        flatMappedRDD = parCollection.flatMap(lambda x: range(1, x + 1))

        self.assertFalse(flatMappedRDD.isCheckpointed())
        self.assertFalse(flatMappedRDD.isLocallyCheckpointed())

        flatMappedRDD.localCheckpoint()
        result = flatMappedRDD.collect()
        time.sleep(1)  # 1 second
        self.assertTrue(flatMappedRDD.isCheckpointed())
        self.assertTrue(flatMappedRDD.isLocallyCheckpointed())
        self.assertEqual(flatMappedRDD.collect(), result)

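# File distribution: tests for SparkContext.addFile()/addPyFile() and for
# resolving the distributed copies through SparkFiles.get().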
class AddFileTests(PySparkTestCase):

    def test_add_py_file(self):
        # To ensure that we're actually testing addPyFile's effects, check that
        # this job fails due to `userlibrary` not being on the Python path:
        # disable logging in log4j temporarily
        def func(x):
            from userlibrary import UserClass  # type: ignore
            return UserClass().hello()
        with QuietTest(self.sc):
            self.assertRaises(Exception, self.sc.parallelize(range(2)).map(func).first)

        # Add the file, so the job should now succeed:
        path = os.path.join(SPARK_HOME, "python/test_support/userlibrary.py")
        self.sc.addPyFile(path)
        res = self.sc.parallelize(range(2)).map(func).first()
        self.assertEqual("Hello World!", res)

    def test_add_file_locally(self):
        path = os.path.join(SPARK_HOME, "python/test_support/hello/hello.txt")
        self.sc.addFile(path)
        download_path = SparkFiles.get("hello.txt")
        self.assertNotEqual(path, download_path)
        with open(download_path) as test_file:
            self.assertEqual("Hello World!\n", test_file.readline())

    def test_add_file_recursively_locally(self):
        path = os.path.join(SPARK_HOME, "python/test_support/hello")
        self.sc.addFile(path, True)
        download_path = SparkFiles.get("hello")
        self.assertNotEqual(path, download_path)
        with open(download_path + "/hello.txt") as test_file:
            self.assertEqual("Hello World!\n", test_file.readline())
        with open(download_path + "/sub_hello/sub_hello.txt") as test_file:
            self.assertEqual("Sub Hello World!\n", test_file.readline())

    def test_add_py_file_locally(self):
        # To ensure that we're actually testing addPyFile's effects, check that
        # this fails due to `userlibrary` not being on the Python path:
        def func():
            from userlibrary import UserClass  # noqa: F401
        self.assertRaises(ImportError, func)
        path = os.path.join(SPARK_HOME, "python/test_support/userlibrary.py")
        self.sc.addPyFile(path)
        from userlibrary import UserClass
        self.assertEqual("Hello World!", UserClass().hello())

    def test_add_egg_file_locally(self):
        # To ensure that we're actually testing addPyFile's effects, check that
        # this fails due to `userlibrary` not being on the Python path:
        def func():
            from userlib import UserClass  # type: ignore[import]
            UserClass()
        self.assertRaises(ImportError, func)
        path = os.path.join(SPARK_HOME, "python/test_support/userlib-0.1.zip")
        self.sc.addPyFile(path)
        from userlib import UserClass
        self.assertEqual("Hello World from inside a package!", UserClass().hello())

    def test_overwrite_system_module(self):
        self.sc.addPyFile(os.path.join(SPARK_HOME, "python/test_support/SimpleHTTPServer.py"))

        import SimpleHTTPServer  # type: ignore[import]
        self.assertEqual("My Server", SimpleHTTPServer.__name__)

        def func(x):
            import SimpleHTTPServer  # type: ignore[import]
            return SimpleHTTPServer.__name__

        self.assertEqual(["My Server"], self.sc.parallelize(range(1)).map(func).collect())

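# SparkContext lifecycle and configuration tests: creation failures,
# getOrCreate(), context-manager semantics, the status tracker API, and
# driver-only creation rules.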
class ContextTests(unittest.TestCase):

    def test_failed_sparkcontext_creation(self):
        # Regression test for SPARK-1550
        self.assertRaises(Exception, lambda: SparkContext("an-invalid-master-name"))

    def test_get_or_create(self):
        with SparkContext.getOrCreate() as sc:
            self.assertTrue(SparkContext.getOrCreate() is sc)

    def test_parallelize_eager_cleanup(self):
        with SparkContext() as sc:
            temp_files = os.listdir(sc._temp_dir)
            rdd = sc.parallelize([0, 1, 2])
            post_parallelize_temp_files = os.listdir(sc._temp_dir)
            self.assertEqual(temp_files, post_parallelize_temp_files)

    def test_set_conf(self):
        # This is for an internal use case. When there is an existing SparkContext,
        # SparkSession's builder needs to set configs into SparkContext's conf.
        sc = SparkContext()
        sc._conf.set("spark.test.SPARK16224", "SPARK16224")
        self.assertEqual(sc._jsc.sc().conf().get("spark.test.SPARK16224"), "SPARK16224")
        sc.stop()

    def test_stop(self):
        sc = SparkContext()
        self.assertNotEqual(SparkContext._active_spark_context, None)
        sc.stop()
        self.assertEqual(SparkContext._active_spark_context, None)

    def test_with(self):
        with SparkContext() as sc:
            self.assertNotEqual(SparkContext._active_spark_context, None)
        self.assertEqual(SparkContext._active_spark_context, None)

    def test_with_exception(self):
        try:
            with SparkContext() as sc:
                self.assertNotEqual(SparkContext._active_spark_context, None)
                raise RuntimeError()
        except:
            pass
        self.assertEqual(SparkContext._active_spark_context, None)

    def test_with_stop(self):
        with SparkContext() as sc:
            self.assertNotEqual(SparkContext._active_spark_context, None)
            sc.stop()
        self.assertEqual(SparkContext._active_spark_context, None)

    def test_progress_api(self):
        with SparkContext() as sc:
            sc.setJobGroup('test_progress_api', '', True)
            rdd = sc.parallelize(range(10)).map(lambda x: time.sleep(100))

            def run():
                # When thread is pinned, job group should be set for each thread for now.
                # Local properties seem not being inherited like Scala side does.
                if os.environ.get("PYSPARK_PIN_THREAD", "true").lower() == "true":
                    sc.setJobGroup('test_progress_api', '', True)
                try:
                    rdd.count()
                except Exception:
                    pass
            t = threading.Thread(target=run)
            t.daemon = True
            t.start()
            # wait for scheduler to start
            time.sleep(1)

            tracker = sc.statusTracker()
            jobIds = tracker.getJobIdsForGroup('test_progress_api')
            self.assertEqual(1, len(jobIds))
            job = tracker.getJobInfo(jobIds[0])
            self.assertEqual(1, len(job.stageIds))
            stage = tracker.getStageInfo(job.stageIds[0])
            self.assertEqual(rdd.getNumPartitions(), stage.numTasks)

            sc.cancelAllJobs()
            t.join()
            # wait for event listener to update the status
            time.sleep(1)

            job = tracker.getJobInfo(jobIds[0])
            self.assertEqual('FAILED', job.status)
            self.assertEqual([], tracker.getActiveJobsIds())
            self.assertEqual([], tracker.getActiveStageIds())

            sc.stop()

    def test_startTime(self):
        with SparkContext() as sc:
            self.assertGreater(sc.startTime, 0)

    def test_forbid_insecure_gateway(self):
        # Fail immediately if you try to create a SparkContext
        # with an insecure gateway
        parameters = namedtuple('MockGatewayParameters', 'auth_token')(None)
        mock_insecure_gateway = namedtuple('MockJavaGateway', 'gateway_parameters')(parameters)
        with self.assertRaises(ValueError) as context:
            SparkContext(gateway=mock_insecure_gateway)
        self.assertIn("insecure Py4j gateway", str(context.exception))

    def test_resources(self):
        """Test the resources are empty by default."""
        with SparkContext() as sc:
            resources = sc.resources
            self.assertEqual(len(resources), 0)

    def test_disallow_to_create_spark_context_in_executors(self):
        # SPARK-32160: SparkContext should not be created in executors.
        with SparkContext("local-cluster[3, 1, 1024]") as sc:
            with self.assertRaises(Exception) as context:
                sc.range(2).foreach(lambda _: SparkContext())
            self.assertIn("SparkContext should only be created and accessed on the driver.",
                          str(context.exception))

    def test_allow_to_create_spark_context_in_executors(self):
        # SPARK-32160: SparkContext can be created in executors if the config is set.

        def create_spark_context():
            conf = SparkConf().set("spark.executor.allowSparkContext", "true")
            with SparkContext(conf=conf):
                pass

        with SparkContext("local-cluster[3, 1, 1024]") as sc:
            sc.range(2).foreach(lambda _: create_spark_context())

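# GPU resource discovery: setUp() writes a one-line discovery script that
# reports a single GPU with address "0" and starts a local-cluster
# SparkContext configured through the spark.driver.resource.gpu.* settings.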
class ContextTestsWithResources(unittest.TestCase):

    def setUp(self):
        class_name = self.__class__.__name__
        self.tempFile = tempfile.NamedTemporaryFile(delete=False)
        self.tempFile.write(b'echo {\\"name\\": \\"gpu\\", \\"addresses\\": [\\"0\\"]}')
        self.tempFile.close()
        # create temporary directory for Worker resources coordination
        self.tempdir = tempfile.NamedTemporaryFile(delete=False)
        os.unlink(self.tempdir.name)
        os.chmod(self.tempFile.name, stat.S_IRWXU | stat.S_IXGRP | stat.S_IRGRP |
                 stat.S_IROTH | stat.S_IXOTH)
        conf = SparkConf().set("spark.test.home", SPARK_HOME)
        conf = conf.set("spark.driver.resource.gpu.amount", "1")
        conf = conf.set("spark.driver.resource.gpu.discoveryScript", self.tempFile.name)
        self.sc = SparkContext('local-cluster[2,1,1024]', class_name, conf=conf)

    def test_resources(self):
        """Test the resources are available."""
        resources = self.sc.resources
        self.assertEqual(len(resources), 1)
        self.assertTrue('gpu' in resources)
        self.assertEqual(resources['gpu'].name, 'gpu')
        self.assertEqual(resources['gpu'].addresses, ['0'])

    def tearDown(self):
        os.unlink(self.tempFile.name)
        self.sc.stop()

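# Running this module directly executes the tests; XML reports are written to
# target/test-reports when the optional xmlrunner package is available.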
if __name__ == "__main__":
    from pyspark.tests.test_context import *  # noqa: F401

    try:
        import xmlrunner  # type: ignore[import]
        testRunner = xmlrunner.XMLTestRunner(output='target/test-reports', verbosity=2)
    except ImportError:
        testRunner = None
    unittest.main(testRunner=testRunner, verbosity=2)