-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathmain.py
156 lines (126 loc) · 5.42 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
#!/usr/bin/env python3
"""Automatic backup of RBD images accessed by virtual machines run by QEMU and managed by libvirt
Uses libvirt Python API and Ceph librbd RBD Python API to list relevant virtual machines,
create a RBD snapshot and save the snapshot to defined output modules.
Configuration is done via config.py (copy from config.py.example)."""
from datetime import datetime
# Multiprocessing from Python documentationen for module multiprocessing
# https://docs.python.org/3/library/multiprocessing.html
import multiprocessing
import virt
import ceph
import output.restic as restic
from config import NUMBER_OF_PROCESSES, LIBVIRT_CONNECTION, TARGET_REPO, TARGET_KEYFILE
def worker(input_queue, output_queue):
"""Run by worker processes, executes backup processing for tasks from the queue"""
for domain_images in iter(input_queue.get, None):
print(
f"Processing {len(domain_images)} images for domain {domain_images[0].domain}")
result = process_backup(domain_images)
output_queue.put(result)
# List images and start parallel backup operations
def run_parallel():
"""List images and start parallel backup operations with worker pool"""
virt_conn = virt.VirtConnection(LIBVIRT_CONNECTION)
images = []
try:
virt_conn.open()
images = virt_conn.list_virtrbd_images()
finally:
virt_conn.close()
domain_images = {}
for image in images:
cluster = domain_images.get(image.domain, [])
cluster.append(image)
domain_images[image.domain] = cluster
# Create queues
task_queue = multiprocessing.Queue()
done_queue = multiprocessing.Queue()
# Submit tasks
for domain in domain_images:
task_queue.put(domain_images[domain])
# Start worker processes
for _ in range(NUMBER_OF_PROCESSES):
multiprocessing.Process(target=worker, args=(
task_queue, done_queue)).start()
# Get and print results
for _ in range(len(domain_images)):
(result, text) = done_queue.get()
if result:
print(f"Backup successful: {text}")
else:
print(f"Backup failed: {text}")
# Tell child processes to stop
for _ in range(NUMBER_OF_PROCESSES):
task_queue.put(None)
def process_backup(domain_images):
"""Process the backup of a set of domain images.
Handles orchestration of other modules.
Assumptions: Images belong to a single domain and have identical authentication to the
Ceph cluster. It is not required for images to be in the same pool"""
exceptions = []
virt_conn = virt.VirtConnection(LIBVIRT_CONNECTION)
try:
virt_conn.open()
domain = virt_conn.lookupByUUIDString(domain_images[0].domain)
try:
storage_conn = ceph.CephConnection(
domain_images[0].username, domain_images[0].secret)
storage_conn.connect()
# First pass: Create backup snapshosts
for image in domain_images:
storage_conn.pool_exists(image.pool)
storage_conn.open_pool(image.pool)
storage_conn.open_image(image.name)
timestamp = datetime.utcnow().strftime('%Y_%m_%d_%s')
image.snapshot_name = image.name+"-backup-"+timestamp
storage_conn.create_snapshot(
image.snapshot_name, protected=True)
storage_conn.close_image()
storage_conn.close_pool()
except Exception as ex:
exceptions.append(
(False, "Error creating snapshot for domain:" +
f" {domain_images[0].domain}. Exception: {repr(ex)}"))
raise
finally:
storage_conn.close()
# Second pass: Copy snapshot content to backup module
try:
storage_conn = ceph.CephConnection(
domain_images[0].username, domain_images[0].secret)
storage_conn.connect()
for image in domain_images:
storage_conn.open_pool(image.pool)
storage_conn.open_image(
image.name, snapshot=image.snapshot_name, read_only=True)
restic.backup(TARGET_REPO, TARGET_KEYFILE, storage_conn.image,
filename=image.name+".img", progress=True)
storage_conn.close_image()
storage_conn.open_image(image.name)
storage_conn.remove_snapshot(
image.snapshot_name, force_protected=True)
storage_conn.close_image()
storage_conn.close_pool()
except Exception as ex:
exceptions.append(
(False, "Error during backup copy for domain:" +
f" {domain_images[0].domain}. Exception: {repr(ex)}"))
raise
finally:
# TODO: Clean snapshots on exception in this pass!
storage_conn.close()
except Exception as ex:
exceptions.append(
(False, "Error during libvirt connection or operation for domain:" +
f" {domain_images[0].domain}. Exception: {repr(ex)}"))
finally:
virt_conn.close()
if len(exceptions) == 0:
return (True, f"No error occurred for domain {domain_images[0].domain}")
# Only give first exception for now
return exceptions[0]
# Entrypoint definition
if __name__ == '__main__':
multiprocessing.freeze_support()
run_parallel()