示例#1
0
 def test_storage_levels(self):
     df = self.spark.createDataFrame(
         [(0, 0, 4.0), (0, 1, 2.0), (1, 1, 3.0), (1, 2, 4.0), (2, 1, 1.0), (2, 2, 5.0)],
         ["user", "item", "rating"])
     als = ALS().setMaxIter(1).setRank(1)
     # test default params
     als.fit(df)
     self.assertEqual(als.getIntermediateStorageLevel(), "MEMORY_AND_DISK")
     self.assertEqual(als._java_obj.getIntermediateStorageLevel(), "MEMORY_AND_DISK")
     self.assertEqual(als.getFinalStorageLevel(), "MEMORY_AND_DISK")
     self.assertEqual(als._java_obj.getFinalStorageLevel(), "MEMORY_AND_DISK")
     # test non-default params
     als.setIntermediateStorageLevel("MEMORY_ONLY_2")
     als.setFinalStorageLevel("DISK_ONLY")
     als.fit(df)
     self.assertEqual(als.getIntermediateStorageLevel(), "MEMORY_ONLY_2")
     self.assertEqual(als._java_obj.getIntermediateStorageLevel(), "MEMORY_ONLY_2")
     self.assertEqual(als.getFinalStorageLevel(), "DISK_ONLY")
     self.assertEqual(als._java_obj.getFinalStorageLevel(), "DISK_ONLY")