1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
|
import errno
import logging
import os
from typing import List, Tuple
from contextlib import contextmanager
import orchestrator
from .lock import GlobalLock
from ..exception import VolumeException, IndexException
from ..fs_util import create_pool, remove_pool, rename_pool, create_filesystem, \
remove_filesystem, rename_filesystem, create_mds, volume_exists, listdir
from .trash import Trash
from mgr_util import open_filesystem, CephfsConnectionException
from .clone_index import open_clone_index
log = logging.getLogger(__name__)
def gen_pool_names(volname):
    """
    Build the pool names that belong to a filesystem/volume name.

    :param volname: volume (file system) name
    :return: tuple of (metadata pool name, data pool name)
    """
    meta_pool_name = "cephfs.{}.meta".format(volname)
    data_pool_name = "cephfs.{}.data".format(volname)
    return meta_pool_name, data_pool_name
def get_mds_map(mgr, volname):
    """
    Look up the mdsmap of a volume.

    :param mgr: object whose get("fs_map") returns the file system map
    :param volname: volume (file system) name to search for
    :return: the 'mdsmap' entry of the first file system whose 'fs_name'
             equals volname, or None when no file system matches
    """
    filesystems = mgr.get("fs_map")['filesystems']
    matching_maps = (fs['mdsmap'] for fs in filesystems
                     if volname == fs['mdsmap']['fs_name'])
    # first hit wins; None signals "no such volume"
    return next(matching_maps, None)
def get_pool_names(mgr, volname):
    """
    Resolve the names of the pools backing a volume.

    :param mgr: object whose get() serves the "fs_map" and "osd_map" maps
    :param volname: volume (file system) name
    :return: tuple of (metadata pool name, list of data pool names); both
             elements are None when the volume is not present in the fs_map
             or its mdsmap carries no metadata pool id
    """
    for fs in mgr.get("fs_map")['filesystems']:
        mdsmap = fs['mdsmap']
        if volname == mdsmap['fs_name']:
            meta_id = mdsmap['metadata_pool']
            data_ids = mdsmap['data_pools']
            break
    else:
        # no file system carries this name
        return None, None
    if meta_id is None:
        return None, None

    # translate pool ids into pool names using the OSD map
    name_by_id = {}
    for pool in mgr.get("osd_map")['pools']:
        name_by_id[pool['pool']] = pool['pool_name']
    meta_name = name_by_id[meta_id]
    data_names = [name_by_id[pool_id] for pool_id in data_ids]
    return meta_name, data_names
def get_pool_ids(mgr, volname):
    """
    Fetch the ids of the pools backing a volume.

    :param mgr: object whose get("fs_map") returns the file system map
    :param volname: volume (file system) name
    :return: tuple of (metadata pool id, list of data pool ids) taken from
             the volume's mdsmap; (None, None) when the volume is not present
             in the fs_map or its metadata pool id is None
    """
    for fs in mgr.get("fs_map")['filesystems']:
        mdsmap = fs['mdsmap']
        if volname == mdsmap['fs_name']:
            meta_id = mdsmap['metadata_pool']
            data_ids = mdsmap['data_pools']
            break
    else:
        # no file system carries this name
        return None, None
    if meta_id is None:
        return None, None
    return meta_id, data_ids
def create_volume(mgr, volname, placement):
    """
    create volume (pools, filesystem and mds)

    The metadata pool is created first, then the data pool, then the file
    system on top of both, and finally the MDS service. When the data pool or
    the file system cannot be created, the pools created so far are removed
    again before the failure is returned.

    :param mgr: handle passed through to the fs_util helpers
    :param volname: name of the volume (file system) to create
    :param placement: passed through to create_mds()
    :return: the (r, outb, outs) triple of the first failing step, otherwise
             whatever create_mds() returns
    """
    meta_pool_name, data_pool_name = gen_pool_names(volname)

    # step 1: metadata pool -- nothing to undo if this fails
    r, outb, outs = create_pool(mgr, meta_pool_name)
    if r != 0:
        return r, outb, outs

    # step 2: data pool, created as a bulk pool by default. In case
    # autoscaling has been disabled for the cluster with
    # `ceph osd pool set noautoscale`, this will have no effect.
    r, outb, outs = create_pool(mgr, data_pool_name, bulk=True)
    if r != 0:
        # undo step 1
        remove_pool(mgr, meta_pool_name)
        return r, outb, outs

    # step 3: the file system itself
    r, outb, outs = create_filesystem(mgr, volname, meta_pool_name, data_pool_name)
    if r != 0:
        log.error("Filesystem creation error: {0} {1} {2}".format(r, outb, outs))
        # undo steps 2 and 1
        remove_pool(mgr, data_pool_name)
        remove_pool(mgr, meta_pool_name)
        return r, outb, outs

    # step 4: MDS service; its result is the result of the whole operation
    return create_mds(mgr, volname, placement)
def delete_volume(mgr, volname, metadata_pool, data_pools):
    """
    delete the given volume (tear down mds, remove filesystem, remove pools)

    :param mgr: handle used for the orchestrator call and the fs_util helpers
    :param volname: name of the volume (file system) to delete
    :param metadata_pool: name of the metadata pool to remove
    :param data_pools: iterable of data pool names to remove
    :return: (r, outb, outs) triple; on success outb carries a summary of the
             removed pools, on failure the triple of the failing step is
             returned (-EINVAL for an unexpected orchestrator error, -ENOENT
             when the file system does not exist)
    """
    # Ask the orchestrator to remove the MDS service of this volume
    try:
        completion = mgr.remove_service('mds.' + volname)
        orchestrator.raise_if_exception(completion)
    except (ImportError, orchestrator.OrchestratorError):
        # not fatal: carry on and remove the file system below
        log.warning("OrchestratorError, not tearing down MDS daemons")
    except Exception as e:
        # Keep detailed orchestrator exceptions (python backtraces) in the
        # log instead of handing them to the user
        log.exception("Failed to tear down MDS daemons")
        return -errno.EINVAL, "", str(e)

    # Whether or not the orchestrator step worked (or an orchestrator was
    # available at all), the file system is removed here.
    if not volume_exists(mgr, volname):
        err = "Filesystem not found for volume '{0}'".format(volname)
        log.warning(err)
        return -errno.ENOENT, "", err

    r, outb, outs = remove_filesystem(mgr, volname)
    if r != 0:
        return r, outb, outs

    # Pools go last: metadata pool first, then every data pool
    r, outb, outs = remove_pool(mgr, metadata_pool)
    if r != 0:
        return r, outb, outs
    for pool_name in data_pools:
        r, outb, outs = remove_pool(mgr, pool_name)
        if r != 0:
            return r, outb, outs

    result_str = (
        f"metadata pool: {metadata_pool} data pool: {str(data_pools)} removed.\n"
        "If there are active snapshot schedules associated with this "
        "volume, you might see EIO errors in the mgr logs or at the "
        "snap-schedule command-line due to the missing volume. "
        "However, these errors are transient and will get auto-resolved."
    )
    return r, result_str, ""
def rename_volume(mgr, volname: str, newvolname: str) -> Tuple[int, str, str]:
    """
    rename volume (orch MDS service, file system, pools)

    Steps, in order:
      1. look up the orchestrator MDS service named after newvolname; when it
         already exists the MDS service handling is skipped
      2. otherwise look up the MDS service named after volname and, when it
         exists, start an MDS service for newvolname with the same placement
      3. rename the file system
      4. rename the metadata pool and, when there is exactly one, the data
         pool to the names produced by gen_pool_names(newvolname)
      5. remove the old MDS service if step 2 started a new one

    :param mgr: handle used for the orchestrator calls and fs_util helpers
    :param volname: current volume (file system) name
    :param newvolname: new volume (file system) name
    :return: (r, outb, outs) triple; on success outb carries a summary
             message, on failure outs carries the error text
    """
    # Step 1. To allow volume rename to be idempotent, check whether the orch
    # managed MDS service is already renamed.
    new_svc_completion = None
    try:
        new_svc_completion = mgr.describe_service(
            service_type='mds', service_name=f"mds.{newvolname}", refresh=True)
        orchestrator.raise_if_exception(new_svc_completion)
    except (ImportError, orchestrator.OrchestratorError):
        log.warning("Failed to fetch orch service mds.%s", newvolname)
    except Exception as e:
        # Keep detailed orchestrator exceptions (python backtraces) in the
        # log instead of handing them to the user
        log.exception("Failed to fetch orch service mds.%s", newvolname)
        return -errno.EINVAL, "", str(e)
    rename_mds_service = not (new_svc_completion and new_svc_completion.result)

    # Step 2. Launch new MDS service matching newvolname
    remove_mds_service = False
    if rename_mds_service:
        old_svc_completion = None
        try:
            old_svc_completion = mgr.describe_service(
                service_type='mds', service_name=f"mds.{volname}", refresh=True)
            orchestrator.raise_if_exception(old_svc_completion)
        except (ImportError, orchestrator.OrchestratorError):
            log.warning("Failed to fetch orch service mds.%s", volname)
        except Exception as e:
            # Keep detailed orchestrator exceptions (python backtraces) in
            # the log instead of handing them to the user
            log.exception("Failed to fetch orch service mds.%s", volname)
            return -errno.EINVAL, "", str(e)
        if old_svc_completion and old_svc_completion.result:
            # reuse the placement of the existing service for the new one
            old_svc = old_svc_completion.result[0]
            create_mds(mgr, newvolname, old_svc.spec.placement.pretty_str())
            remove_mds_service = True

    # Step 3. rename_filesystem is idempotent
    r, outb, outs = rename_filesystem(mgr, volname, newvolname)
    if r != 0:
        errmsg = f"Failed to rename file system '{volname}' to '{newvolname}'"
        log.error("Failed to rename file system '%s' to '%s'", volname, newvolname)
        outs = f'{errmsg}; {outs}'
        return r, outb, outs

    # Step 4. Rename file system's metadata and data pools. The file system
    # is looked up under its new name at this point.
    new_metadata_pool, new_data_pool = gen_pool_names(newvolname)
    metadata_pool, data_pools = get_pool_names(mgr, newvolname)
    if metadata_pool != new_metadata_pool:
        r, outb, outs = rename_pool(mgr, metadata_pool, new_metadata_pool)
        if r != 0:
            errmsg = f"Failed to rename metadata pool '{metadata_pool}' to '{new_metadata_pool}'"
            log.error("Failed to rename metadata pool '%s' to '%s'", metadata_pool, new_metadata_pool)
            outs = f'{errmsg}; {outs}'
            return r, outb, outs

    # If file system has more than one data pool, then skip renaming
    # the data pools, and proceed to remove the old MDS service.
    data_pool_rename_failed = len(data_pools) > 1
    if not data_pool_rename_failed:
        data_pool = data_pools[0]
        if data_pool != new_data_pool:
            r, outb, outs = rename_pool(mgr, data_pool, new_data_pool)
            if r != 0:
                errmsg = f"Failed to rename data pool '{data_pool}' to '{new_data_pool}'"
                log.error("Failed to rename data pool '%s' to '%s'", data_pool, new_data_pool)
                outs = f'{errmsg}; {outs}'
                return r, outb, outs

    # Step 5. Tear down old MDS service
    if remove_mds_service:
        try:
            removal = mgr.remove_service('mds.' + volname)
            orchestrator.raise_if_exception(removal)
        except (ImportError, orchestrator.OrchestratorError):
            log.warning("Failed to tear down orch service mds.%s", volname)
        except Exception as e:
            # Keep detailed orchestrator exceptions (python backtraces) in
            # the log instead of handing them to the user
            log.exception("Failed to tear down orch service mds.%s", volname)
            return -errno.EINVAL, "", str(e)

    outb = f"FS volume '{volname}' renamed to '{newvolname}'"
    if data_pool_rename_failed:
        outb += ". But failed to rename data pools as more than one data pool was found."
    return r, outb, ""
def list_volumes(mgr):
    """
    Collect the names of all volumes/file systems.

    :param mgr: object whose get("fs_map") returns the file system map
    :return: list of volume/file system names, in fs_map order
    """
    filesystems = mgr.get("fs_map")['filesystems']
    return [fs['mdsmap']['fs_name'] for fs in filesystems]
def get_pending_subvol_deletions_count(fs, path):
    """
    Get the number of pending subvolumes deletions.

    The count is the number of entries listdir() reports for the trash
    directory, i.e. `path` joined with Trash.GROUP_NAME.

    :param fs: file system handle, passed through to listdir()
    :param path: directory that contains the trash directory
    :return: dict with the single key 'pending_subvolume_deletions'
    :raises VolumeException: when listing the trash directory fails for any
                             reason other than the directory being absent
    """
    trashdir = os.path.join(path, Trash.GROUP_NAME)
    try:
        num_pending_subvol_del = len(listdir(fs, trashdir, filter_entries=None, filter_files=False))
    except VolumeException as ve:
        # A missing trash directory means nothing is pending. Every other
        # failure has to propagate: falling through here would leave the
        # counter unassigned and surface as an UnboundLocalError at the
        # return below, hiding the real error.
        if ve.errno != -errno.ENOENT:
            raise
        num_pending_subvol_del = 0
    return {'pending_subvolume_deletions': num_pending_subvol_del}
def get_all_pending_clones_count(self, mgr, vol_spec):
    """
    Add up the number of clone index entries over all volumes.

    :param self: volume client instance, handed to open_volume()
    :param mgr: object whose get('fs_map') returns the file system map
    :param vol_spec: passed through to open_clone_index()
    :return: total number of entries listed in the clone index directories
    :raises VolumeException: when opening a volume or listing its clone index
                             fails; an IndexException other than ENOENT is
                             converted into a VolumeException
    """
    total_pending = 0
    for fs in mgr.get('fs_map')['filesystems']:
        volname = fs['mdsmap']['fs_name']
        try:
            with open_volume(self, volname) as fs_handle, \
                    open_clone_index(fs_handle, vol_spec) as index:
                index_dir = index.path.decode('utf-8')
                total_pending += len(listdir(fs_handle, index_dir,
                                             filter_entries=None, filter_files=False))
        except IndexException as e:
            # ENOENT from the clone index is not an error: move on to the
            # next volume
            if e.errno == -errno.ENOENT:
                continue
            raise VolumeException(-e.args[0], e.args[1])
        except VolumeException as ve:
            log.error("error fetching clone entry for volume '{0}' ({1})".format(volname, ve))
            raise ve
    return total_pending
@contextmanager
def open_volume(vc, volname):
    """
    open a volume for exclusive access. This API is to be used as a context
    manager.

    The file system is opened, and the caller's block runs, while the
    GlobalLock operation lock is held. A CephfsConnectionException raised
    inside that section is re-raised as a VolumeException carrying the same
    errno and error string.

    :param vc: volume client instance
    :param volname: volume name
    :return: yields a volume handle (ceph filesystem handle)
    """
    with GlobalLock().lock_op():
        try:
            with open_filesystem(vc, volname) as fs:
                yield fs
        except CephfsConnectionException as conn_err:
            raise VolumeException(conn_err.errno, conn_err.error_str)
@contextmanager
def open_volume_lockless(vc, volname):
    """
    open a volume with shared access. This API is to be used as a context
    manager.

    Unlike open_volume(), no GlobalLock is taken. A CephfsConnectionException
    raised while the file system is open is re-raised as a VolumeException
    carrying the same errno and error string.

    :param vc: volume client instance
    :param volname: volume name
    :return: yields a volume handle (ceph filesystem handle)
    """
    try:
        with open_filesystem(vc, volname) as fs:
            yield fs
    except CephfsConnectionException as conn_err:
        raise VolumeException(conn_err.errno, conn_err.error_str)
|