// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab #include "librbd/operation/TrimRequest.h" #include "librbd/AsyncObjectThrottle.h" #include "librbd/ExclusiveLock.h" #include "librbd/ImageCtx.h" #include "librbd/internal.h" #include "librbd/ObjectMap.h" #include "librbd/Utils.h" #include "librbd/io/ObjectRequest.h" #include "common/ContextCompletion.h" #include "common/dout.h" #include "common/errno.h" #include "osdc/Striper.h" #include #include #include #include #define dout_subsys ceph_subsys_rbd #undef dout_prefix #define dout_prefix *_dout << "librbd::TrimRequest: " namespace librbd { namespace operation { template class C_CopyupObject : public C_AsyncObjectThrottle { public: C_CopyupObject(AsyncObjectThrottle &throttle, I *image_ctx, ::SnapContext snapc, uint64_t object_no) : C_AsyncObjectThrottle(throttle, *image_ctx), m_snapc(snapc), m_object_no(object_no) { } int send() override { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); assert(image_ctx.exclusive_lock == nullptr || image_ctx.exclusive_lock->is_lock_owner()); string oid = image_ctx.get_object_name(m_object_no); ldout(image_ctx.cct, 10) << "removing (with copyup) " << oid << dendl; auto req = io::ObjectRequest::create_trim(&image_ctx, oid, m_object_no, m_snapc, false, this); req->send(); return 0; } private: ::SnapContext m_snapc; uint64_t m_object_no; }; template class C_RemoveObject : public C_AsyncObjectThrottle { public: C_RemoveObject(AsyncObjectThrottle &throttle, I *image_ctx, uint64_t object_no) : C_AsyncObjectThrottle(throttle, *image_ctx), m_object_no(object_no) { } int send() override { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); assert(image_ctx.exclusive_lock == nullptr || image_ctx.exclusive_lock->is_lock_owner()); { RWLock::RLocker snap_locker(image_ctx.snap_lock); if (image_ctx.object_map != nullptr && !image_ctx.object_map->object_may_exist(m_object_no)) { return 1; } } string oid = image_ctx.get_object_name(m_object_no); ldout(image_ctx.cct, 10) << "removing " << oid << dendl; librados::AioCompletion *rados_completion = util::create_rados_callback(this); int r = image_ctx.data_ctx.aio_remove(oid, rados_completion); assert(r == 0); rados_completion->release(); return 0; } private: uint64_t m_object_no; }; template TrimRequest::TrimRequest(I &image_ctx, Context *on_finish, uint64_t original_size, uint64_t new_size, ProgressContext &prog_ctx) : AsyncRequest(image_ctx, on_finish), m_new_size(new_size), m_prog_ctx(prog_ctx) { uint64_t period = image_ctx.get_stripe_period(); uint64_t new_num_periods = ((m_new_size + period - 1) / period); m_delete_off = MIN(new_num_periods * period, original_size); // first object we can delete free and clear m_delete_start = new_num_periods * image_ctx.get_stripe_count(); m_delete_start_min = m_delete_start; m_num_objects = Striper::get_num_objects(image_ctx.layout, original_size); CephContext *cct = image_ctx.cct; ldout(cct, 10) << this << " trim image " << original_size << " -> " << m_new_size << " periods " << new_num_periods << " discard to offset " << m_delete_off << " delete objects " << m_delete_start << " to " << m_num_objects << dendl; } template bool TrimRequest::should_complete(int r) { I &image_ctx = this->m_image_ctx; CephContext *cct = image_ctx.cct; ldout(cct, 5) << this << " should_complete: r=" << r << dendl; if (r == -ERESTART) { ldout(cct, 5) << "trim operation interrupted" << dendl; return true; } else if (r < 0) { lderr(cct) << "trim encountered an error: " << cpp_strerror(r) << dendl; return true; } RWLock::RLocker owner_lock(image_ctx.owner_lock); switch (m_state) { case STATE_PRE_TRIM: ldout(cct, 5) << " PRE_TRIM" << dendl; send_copyup_objects(); break; case STATE_COPYUP_OBJECTS: ldout(cct, 5) << " COPYUP_OBJECTS" << dendl; send_remove_objects(); break; case STATE_REMOVE_OBJECTS: ldout(cct, 5) << " REMOVE_OBJECTS" << dendl; send_post_trim(); break; case STATE_POST_TRIM: ldout(cct, 5) << " POST_TRIM" << dendl; send_clean_boundary(); break; case STATE_CLEAN_BOUNDARY: ldout(cct, 5) << "CLEAN_BOUNDARY" << dendl; send_finish(0); break; case STATE_FINISHED: ldout(cct, 5) << "FINISHED" << dendl; return true; default: lderr(cct) << "invalid state: " << m_state << dendl; assert(false); break; } return false; } template void TrimRequest::send() { send_pre_trim(); } template void TrimRequest::send_pre_trim() { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); if (m_delete_start >= m_num_objects) { send_clean_boundary(); return; } { RWLock::RLocker snap_locker(image_ctx.snap_lock); if (image_ctx.object_map != nullptr) { ldout(image_ctx.cct, 5) << this << " send_pre_trim: " << " delete_start_min=" << m_delete_start_min << " num_objects=" << m_num_objects << dendl; m_state = STATE_PRE_TRIM; assert(image_ctx.exclusive_lock->is_lock_owner()); RWLock::WLocker object_map_locker(image_ctx.object_map_lock); if (image_ctx.object_map->template aio_update >( CEPH_NOSNAP, m_delete_start_min, m_num_objects, OBJECT_PENDING, OBJECT_EXISTS, {}, this)) { return; } } } send_copyup_objects(); } template void TrimRequest::send_copyup_objects() { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); ::SnapContext snapc; bool has_snapshots; uint64_t parent_overlap; { RWLock::RLocker snap_locker(image_ctx.snap_lock); RWLock::RLocker parent_locker(image_ctx.parent_lock); snapc = image_ctx.snapc; has_snapshots = !image_ctx.snaps.empty(); int r = image_ctx.get_parent_overlap(CEPH_NOSNAP, &parent_overlap); assert(r == 0); } // copyup is only required for portion of image that overlaps parent uint64_t copyup_end = Striper::get_num_objects(image_ctx.layout, parent_overlap); // TODO: protect against concurrent shrink and snap create? // skip to remove if no copyup is required. if (copyup_end <= m_delete_start || !has_snapshots) { send_remove_objects(); return; } uint64_t copyup_start = m_delete_start; m_delete_start = copyup_end; ldout(image_ctx.cct, 5) << this << " send_copyup_objects: " << " start object=" << copyup_start << ", " << " end object=" << copyup_end << dendl; m_state = STATE_COPYUP_OBJECTS; Context *ctx = this->create_callback_context(); typename AsyncObjectThrottle::ContextFactory context_factory( boost::lambda::bind(boost::lambda::new_ptr >(), boost::lambda::_1, &image_ctx, snapc, boost::lambda::_2)); AsyncObjectThrottle *throttle = new AsyncObjectThrottle( this, image_ctx, context_factory, ctx, &m_prog_ctx, copyup_start, copyup_end); throttle->start_ops(image_ctx.concurrent_management_ops); } template void TrimRequest::send_remove_objects() { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); ldout(image_ctx.cct, 5) << this << " send_remove_objects: " << " delete_start=" << m_delete_start << " num_objects=" << m_num_objects << dendl; m_state = STATE_REMOVE_OBJECTS; Context *ctx = this->create_callback_context(); typename AsyncObjectThrottle::ContextFactory context_factory( boost::lambda::bind(boost::lambda::new_ptr >(), boost::lambda::_1, &image_ctx, boost::lambda::_2)); AsyncObjectThrottle *throttle = new AsyncObjectThrottle( this, image_ctx, context_factory, ctx, &m_prog_ctx, m_delete_start, m_num_objects); throttle->start_ops(image_ctx.concurrent_management_ops); } template void TrimRequest::send_post_trim() { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); { RWLock::RLocker snap_locker(image_ctx.snap_lock); if (image_ctx.object_map != nullptr) { ldout(image_ctx.cct, 5) << this << " send_post_trim:" << " delete_start_min=" << m_delete_start_min << " num_objects=" << m_num_objects << dendl; m_state = STATE_POST_TRIM; assert(image_ctx.exclusive_lock->is_lock_owner()); RWLock::WLocker object_map_locker(image_ctx.object_map_lock); if (image_ctx.object_map->template aio_update >( CEPH_NOSNAP, m_delete_start_min, m_num_objects, OBJECT_NONEXISTENT, OBJECT_PENDING, {}, this)) { return; } } } send_clean_boundary(); } template void TrimRequest::send_clean_boundary() { I &image_ctx = this->m_image_ctx; assert(image_ctx.owner_lock.is_locked()); CephContext *cct = image_ctx.cct; if (m_delete_off <= m_new_size) { send_finish(0); return; } // should have been canceled prior to releasing lock assert(image_ctx.exclusive_lock == nullptr || image_ctx.exclusive_lock->is_lock_owner()); uint64_t delete_len = m_delete_off - m_new_size; ldout(image_ctx.cct, 5) << this << " send_clean_boundary: " << " delete_off=" << m_delete_off << " length=" << delete_len << dendl; m_state = STATE_CLEAN_BOUNDARY; ::SnapContext snapc; { RWLock::RLocker snap_locker(image_ctx.snap_lock); snapc = image_ctx.snapc; } // discard the weird boundary std::vector extents; Striper::file_to_extents(cct, image_ctx.format_string, &image_ctx.layout, m_new_size, delete_len, 0, extents); ContextCompletion *completion = new ContextCompletion(this->create_async_callback_context(), true); for (vector::iterator p = extents.begin(); p != extents.end(); ++p) { ldout(cct, 20) << " ex " << *p << dendl; Context *req_comp = new C_ContextCompletion(*completion); io::ObjectRequest *req; if (p->offset == 0) { req = io::ObjectRequest::create_trim(&image_ctx, p->oid.name, p->objectno, snapc, true, req_comp); } else { req = io::ObjectRequest::create_truncate(&image_ctx, p->oid.name, p->objectno, p->offset, snapc, {}, req_comp); } req->send(); } completion->finish_adding_requests(); } template void TrimRequest::send_finish(int r) { m_state = STATE_FINISHED; this->async_complete(r); } } // namespace operation } // namespace librbd template class librbd::operation::TrimRequest;