Hi,
Is there anywhere that describes exactly how rbd data (including
snapshots) are stored within a pool?
I can see how a rbd broadly stores its data in rados objects in the
pool, although the object map is opaque. But once an rbd snap is created
and new data written to the rbd, where is the old data associated with
the snap?
And/or how can I access the data from an rbd snapshot directly, e.g.
using rados?
And, how can an object map be interpreted, i.e. what is the format?
I don't know if the snaps documentation here:
https://docs.ceph.com/en/latest/dev/osd_internals/snaps/
...is related to rbd snaps. Perhaps rbd snaps are "self managed snaps"
requiring the use a "SnapContext", but the rados man page doesn't include
any mention of this so it's unclear what's going on.
Perhaps rbd snapshots simply can't be accessed directly with the current
tools (other than actually mapping a snapshot)?
See below for some test explorations...
Cheers,
Chris
----------------------------------------------------------------------
##
## create a test rbd within a test pool
##
$ ceph osd pool create test
$ rbd create --size 10M --object-size 1M "test/test1"
$ rbd info test/test1
rbd image 'test1':
size 10 MiB in 10 objects
order 20 (1 MiB objects)
snapshot_count: 0
id: 08ceb039ff1c19
block_name_prefix: rbd_data.08ceb039ff1c19
format: 2
features: layering, exclusive-lock, object-map, fast-diff, deep-flatten
op_features:
flags:
create_timestamp: Tue Oct 18 09:35:49 2022
access_timestamp: Tue Oct 18 09:35:49 2022
modify_timestamp: Tue Oct 18 09:35:49 2022
$ rados -p test ls --all
rbd_directory
rbd_info
rbd_object_map.08ceb039ff1c19
rbd_header.08ceb039ff1c19
rbd_id.test1
#
# "clean" object map - but no idea what the contents mean
#
$ rados -p test get rbd_object_map.08ceb039ff1c19 - | od -t x1 > /tmp/om.clean; cat /tmp/om.clean
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 00 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 00 00 00 00
0000045
##
## Write to the rbd
## - confirm data appears in rbd_data.xxx object
## - rbd_object_map changes
##
$ dev=$(rbd device map "test/test1"); declare -p dev
declare -- dev="/dev/rbd0"
$ printf '1' > $dev
#
# rdb_data object appears
#
$ rados -p test ls --all | sort
rbd_data.08ceb039ff1c19.0000000000000000
rbd_directory
rbd_header.08ceb039ff1c19
rbd_id.test1
rbd_info
rbd_object_map.08ceb039ff1c19
#
# new rbd_data contains our written data
#
$ rados -p test get rbd_data.08ceb039ff1c19.0000000000000000 - | od -t x1
0000000 31 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
0000020 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
*
0010000
#
# rbd_object_map is updated
#
$ rados -p test get rbd_object_map.08ceb039ff1c19 - | od -t x1 > /tmp/om.head.1; cat /tmp/om.head.1
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 40 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 d9 80 65 c7
0000045
$ diff /tmp/om.{clean,head.1}
2,3c2,3
< 0000020 00 00 00 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
< 0000040 00 00 00 00 00
---
0000020 00 00 40 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 d9 80 65 c7
##
## Write again, to offset 2MB (rbd is using 1MB objects)
## - new rbd_data object appears, with object-size offset appearing in the name
## - object map updated
##
$ printf 2 | dd of=${dev} bs=1M seek=2
$ rados -p test ls --all | sort
rbd_data.08ceb039ff1c19.0000000000000000
rbd_data.08ceb039ff1c19.0000000000000002
rbd_directory
rbd_header.08ceb039ff1c19
rbd_id.test1
rbd_info
rbd_object_map.08ceb039ff1c19
#
# there's our data
#
$ rados -p test get rbd_data.08ceb039ff1c19.0000000000000002 - | od -t x1
0000000 32 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
0000020 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
*
0010000
#
# once again the object map is updated
#
$ rados -p test get rbd_object_map.08ceb039ff1c19 - | od -t x1 > /tmp/om.head.2; cat /tmp/om.head.2
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 44 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 c3 24 bb 59
0000045
$ diff /tmp/om.head.{1,2}
2,3c2,3
< 0000020 00 00 40 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
< 0000040 00 d9 80 65 c7
---
0000020 00 00 44 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 c3 24 bb 59
##
## Create a snap
## - new rbd_object_map is created for the snap
## - the head rbd_object_map is updated
## - the snap rbd_object_map is the same as the previous head object map
##
$ rbd snap create --snap "test/test1" "test/test1@snap1"
#
# new rbd_object_map with snap id appended appears
#
$ rados -p test ls --all | sort
rbd_data.08ceb039ff1c19.0000000000000000
rbd_data.08ceb039ff1c19.0000000000000002
rbd_directory
rbd_header.08ceb039ff1c19
rbd_id.test1
rbd_info
rbd_object_map.08ceb039ff1c19
rbd_object_map.08ceb039ff1c19.0000000000000004
#
# look at the head and snap object maps
#
$ rados -p test get rbd_object_map.08ceb039ff1c19 - | od -t x1 > /tmp/om.head.3; cat /tmp/om.head.3
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 cc 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 45 6d cd ea
0000045
$ rados -p test get rbd_object_map.08ceb039ff1c19.0000000000000004 - | od -t x1 > /tmp/om.snap.1; cat /tmp/om.snap.1
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 44 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 c3 24 bb 59
0000045
#
# "head" rbd_object_map.08ceb039ff1c19 is updated
#
$ diff /tmp/om.head.{2,3}
2,3c2,3
< 0000020 00 00 44 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
< 0000040 00 c3 24 bb 59
---
0000020 00 00 cc 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 45 6d cd ea
#
# snap object map is the same as the previous head object map
#
$ diff /tmp/om.{head.2,snap.1} && echo 'same'
same
##
## write new data to the rbd
## - there are no new objects
## - new data appears in existing rbd_data object
## - WHERE IS THE OLD DATA???
##
$ printf '2' > $dev
#
# no new objects
#
b4# rados -p test ls --all | sort
rbd_data.08ceb039ff1c19.0000000000000000
rbd_data.08ceb039ff1c19.0000000000000002
rbd_directory
rbd_header.08ceb039ff1c19
rbd_id.test1
rbd_info
rbd_object_map.08ceb039ff1c19
rbd_object_map.08ceb039ff1c19.0000000000000004
#
# existing rbd_data is updated
#
$ rados -p test get rbd_data.08ceb039ff1c19.0000000000000000 - | od -t x1
0000000 32 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
0000020 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
*
0010000
#
# head object map is updated
#
$ rados -p test get rbd_object_map.08ceb039ff1c19 - | od -t x1 > /tmp/om.head.4; cat /tmp/om.head.4
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 4c 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 06 1a ea 61
0000045
$ diff /tmp/om.head.{3,4}
2,3c2,3
< 0000020 00 00 cc 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
< 0000040 00 45 6d cd ea
---
0000020 00 00 4c 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 06 1a ea 61
#
# snap object map is the same
#
$ rados -p test get rbd_object_map.08ceb039ff1c19.0000000000000004 - | od -t x1 > /tmp/om.snap.2; cat /tmp/om.snap.2
0000000 0e 00 00 00 01 01 08 00 00 00 0a 00 00 00 00 00
0000020 00 00 44 00 00 0c 00 00 00 c6 44 f4 3a 01 00 00
0000040 00 c3 24 bb 59
0000045
$ diff /tmp/om.snap.{1,2} && echo 'same'
same
##
## WHERE IS THE OLD DATA???
##
----------------------------------------------------------------------
_______________________________________________
ceph-users mailing list -- ceph-users@xxxxxxx
To unsubscribe send an email to ceph-users-leave@xxxxxxx