1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
__all__ = ["StorageLevel"]


class StorageLevel(object):
    """
    Flags for controlling the storage of an RDD. Each StorageLevel records whether to use memory,
    whether to drop the RDD to disk if it falls out of memory, whether to keep the data in memory
    in a serialized format, and whether to replicate the RDD partitions on multiple nodes.
    Also contains static constants for some commonly used storage levels, such as MEMORY_ONLY.
    """

    def __init__(self, useDisk, useMemory, useOffHeap, deserialized, replication=1):
        """
        Record the five storage flags on the instance without validating them.

        :param useDisk: whether the RDD may be stored on disk.
        :param useMemory: whether the RDD may be stored in memory.
        :param useOffHeap: off-heap storage flag (only OFF_HEAP sets it below;
            exact semantics are defined by the Spark backend -- TODO confirm).
        :param deserialized: False keeps the data in a serialized format.
        :param replication: replication setting, 1 by default; the ``*_2``
            constants below pass 2.
        """
        self.useDisk = useDisk
        self.useMemory = useMemory
        self.useOffHeap = useOffHeap
        self.deserialized = deserialized
        self.replication = replication

    def __repr__(self):
        """Return a constructor-style string listing the five flags in argument order."""
        return "StorageLevel(%s, %s, %s, %s, %s)" % (
            self.useDisk, self.useMemory, self.useOffHeap, self.deserialized, self.replication)


# The predefined levels are attached after the class statement because they are
# instances of StorageLevel, and the name is not bound until the class body has
# finished executing.
# Argument order: useDisk, useMemory, useOffHeap, deserialized[, replication].
StorageLevel.DISK_ONLY = StorageLevel(True, False, False, False)
StorageLevel.DISK_ONLY_2 = StorageLevel(True, False, False, False, 2)
StorageLevel.MEMORY_ONLY = StorageLevel(False, True, False, True)
StorageLevel.MEMORY_ONLY_2 = StorageLevel(False, True, False, True, 2)
StorageLevel.MEMORY_ONLY_SER = StorageLevel(False, True, False, False)
StorageLevel.MEMORY_ONLY_SER_2 = StorageLevel(False, True, False, False, 2)
StorageLevel.MEMORY_AND_DISK = StorageLevel(True, True, False, True)
StorageLevel.MEMORY_AND_DISK_2 = StorageLevel(True, True, False, True, 2)
StorageLevel.MEMORY_AND_DISK_SER = StorageLevel(True, True, False, False)
StorageLevel.MEMORY_AND_DISK_SER_2 = StorageLevel(True, True, False, False, 2)
StorageLevel.OFF_HEAP = StorageLevel(False, False, True, False, 1)
50