+++ /dev/null
-// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*-
-// vim: ts=8 sw=2 smarttab
-
-#include "rgw_gc.h"
-#include "include/rados/librados.hpp"
-#include "cls/rgw/cls_rgw_client.h"
-#include "cls/refcount/cls_refcount_client.h"
-#include "cls/lock/cls_lock_client.h"
-#include "auth/Crypto.h"
-
-#include <list>
-
-#define dout_context g_ceph_context
-#define dout_subsys ceph_subsys_rgw
-
-using namespace std;
-using namespace librados;
-
-static string gc_oid_prefix = "gc";
-static string gc_index_lock_name = "gc_process";
-
-
-void RGWGC::initialize(CephContext *_cct, RGWRados *_store) {
- cct = _cct;
- store = _store;
-
- max_objs = min(static_cast<int>(cct->_conf->rgw_gc_max_objs), rgw_shards_max());
-
- obj_names = new string[max_objs];
-
- for (int i = 0; i < max_objs; i++) {
- obj_names[i] = gc_oid_prefix;
- char buf[32];
- snprintf(buf, 32, ".%d", i);
- obj_names[i].append(buf);
- }
-}
-
-void RGWGC::finalize()
-{
- delete[] obj_names;
-}
-
-int RGWGC::tag_index(const string& tag)
-{
- return rgw_shards_hash(tag, max_objs);
-}
-
-void RGWGC::add_chain(ObjectWriteOperation& op, cls_rgw_obj_chain& chain, const string& tag)
-{
- cls_rgw_gc_obj_info info;
- info.chain = chain;
- info.tag = tag;
-
- cls_rgw_gc_set_entry(op, cct->_conf->rgw_gc_obj_min_wait, info);
-}
-
-int RGWGC::send_chain(cls_rgw_obj_chain& chain, const string& tag, bool sync)
-{
- ObjectWriteOperation op;
- add_chain(op, chain, tag);
-
- int i = tag_index(tag);
-
- if (sync)
- return store->gc_operate(obj_names[i], &op);
-
- return store->gc_aio_operate(obj_names[i], &op);
-}
-
-int RGWGC::defer_chain(const string& tag, bool sync)
-{
- ObjectWriteOperation op;
- cls_rgw_gc_defer_entry(op, cct->_conf->rgw_gc_obj_min_wait, tag);
-
- int i = tag_index(tag);
-
- if (sync)
- return store->gc_operate(obj_names[i], &op);
-
- return store->gc_aio_operate(obj_names[i], &op);
-}
-
-int RGWGC::remove(int index, const std::list<string>& tags)
-{
- ObjectWriteOperation op;
- cls_rgw_gc_remove(op, tags);
- return store->gc_operate(obj_names[index], &op);
-}
-
-int RGWGC::list(int *index, string& marker, uint32_t max, bool expired_only, std::list<cls_rgw_gc_obj_info>& result, bool *truncated)
-{
- result.clear();
- string next_marker;
-
- for (; *index < max_objs && result.size() < max; (*index)++, marker.clear()) {
- std::list<cls_rgw_gc_obj_info> entries;
- int ret = cls_rgw_gc_list(store->gc_pool_ctx, obj_names[*index], marker, max - result.size(), expired_only, entries, truncated, next_marker);
- if (ret == -ENOENT)
- continue;
- if (ret < 0)
- return ret;
-
- std::list<cls_rgw_gc_obj_info>::iterator iter;
- for (iter = entries.begin(); iter != entries.end(); ++iter) {
- result.push_back(*iter);
- }
-
- marker = next_marker;
-
- if (*index == max_objs - 1) {
- /* we cut short here, truncated will hold the correct value */
- return 0;
- }
-
- if (result.size() == max) {
- /* close approximation, it might be that the next of the objects don't hold
- * anything, in this case truncated should have been false, but we can find
- * that out on the next iteration
- */
- *truncated = true;
- return 0;
- }
-
- }
- *truncated = false;
-
- return 0;
-}
-
-int RGWGC::process(int index, int max_secs)
-{
- rados::cls::lock::Lock l(gc_index_lock_name);
- utime_t end = ceph_clock_now();
- std::list<string> remove_tags;
-
- /* max_secs should be greater than zero. We don't want a zero max_secs
- * to be translated as no timeout, since we'd then need to break the
- * lock and that would require a manual intervention. In this case
- * we can just wait it out. */
- if (max_secs <= 0)
- return -EAGAIN;
-
- end += max_secs;
- utime_t time(max_secs, 0);
- l.set_duration(time);
-
- int ret = l.lock_exclusive(&store->gc_pool_ctx, obj_names[index]);
- if (ret == -EBUSY) { /* already locked by another gc processor */
- dout(10) << "RGWGC::process() failed to acquire lock on " << obj_names[index] << dendl;
- return 0;
- }
- if (ret < 0)
- return ret;
-
- string marker;
- string next_marker;
- bool truncated;
- IoCtx *ctx = new IoCtx;
- do {
- int max = 100;
- std::list<cls_rgw_gc_obj_info> entries;
- ret = cls_rgw_gc_list(store->gc_pool_ctx, obj_names[index], marker, max, true, entries, &truncated, next_marker);
- if (ret == -ENOENT) {
- ret = 0;
- goto done;
- }
- if (ret < 0)
- goto done;
-
- string last_pool;
- std::list<cls_rgw_gc_obj_info>::iterator iter;
- for (iter = entries.begin(); iter != entries.end(); ++iter) {
- bool remove_tag;
- cls_rgw_gc_obj_info& info = *iter;
- std::list<cls_rgw_obj>::iterator liter;
- cls_rgw_obj_chain& chain = info.chain;
-
- utime_t now = ceph_clock_now();
- if (now >= end)
- goto done;
-
- remove_tag = true;
- for (liter = chain.objs.begin(); liter != chain.objs.end(); ++liter) {
- cls_rgw_obj& obj = *liter;
-
- if (obj.pool != last_pool) {
- delete ctx;
- ctx = new IoCtx;
- ret = rgw_init_ioctx(store->get_rados_handle(), obj.pool, *ctx);
- if (ret < 0) {
- dout(0) << "ERROR: failed to create ioctx pool=" << obj.pool << dendl;
- continue;
- }
- last_pool = obj.pool;
- }
-
- ctx->locator_set_key(obj.loc);
-
- const string& oid = obj.key.name; /* just stored raw oid there */
-
- dout(5) << "gc::process: removing " << obj.pool << ":" << obj.key.name << dendl;
- ObjectWriteOperation op;
- cls_refcount_put(op, info.tag, true);
- ret = ctx->operate(oid, &op);
- if (ret == -ENOENT)
- ret = 0;
- if (ret < 0) {
- remove_tag = false;
- dout(0) << "failed to remove " << obj.pool << ":" << oid << "@" << obj.loc << dendl;
- }
-
- if (going_down()) // leave early, even if tag isn't removed, it's ok
- goto done;
- }
- if (remove_tag) {
- remove_tags.push_back(info.tag);
-#define MAX_REMOVE_CHUNK 16
- if (remove_tags.size() > MAX_REMOVE_CHUNK) {
- RGWGC::remove(index, remove_tags);
- remove_tags.clear();
- }
- }
- }
- if (!remove_tags.empty()) {
- RGWGC::remove(index, remove_tags);
- remove_tags.clear();
- }
- } while (truncated);
-
-done:
- if (!remove_tags.empty())
- RGWGC::remove(index, remove_tags);
- l.unlock(&store->gc_pool_ctx, obj_names[index]);
- delete ctx;
- return 0;
-}
-
-int RGWGC::process()
-{
- int max_secs = cct->_conf->rgw_gc_processor_max_time;
-
- unsigned start;
- int ret = get_random_bytes((char *)&start, sizeof(start));
- if (ret < 0)
- return ret;
-
- for (int i = 0; i < max_objs; i++) {
- int index = (i + start) % max_objs;
- ret = process(index, max_secs);
- if (ret < 0)
- return ret;
- }
-
- return 0;
-}
-
-bool RGWGC::going_down()
-{
- return down_flag;
-}
-
-void RGWGC::start_processor()
-{
- worker = new GCWorker(cct, this);
- worker->create("rgw_gc");
-}
-
-void RGWGC::stop_processor()
-{
- down_flag = true;
- if (worker) {
- worker->stop();
- worker->join();
- }
- delete worker;
- worker = NULL;
-}
-
-void *RGWGC::GCWorker::entry() {
- do {
- utime_t start = ceph_clock_now();
- dout(2) << "garbage collection: start" << dendl;
- int r = gc->process();
- if (r < 0) {
- dout(0) << "ERROR: garbage collection process() returned error r=" << r << dendl;
- }
- dout(2) << "garbage collection: stop" << dendl;
-
- if (gc->going_down())
- break;
-
- utime_t end = ceph_clock_now();
- end -= start;
- int secs = cct->_conf->rgw_gc_processor_period;
-
- if (secs <= end.sec())
- continue; // next round
-
- secs -= end.sec();
-
- lock.Lock();
- cond.WaitInterval(lock, utime_t(secs, 0));
- lock.Unlock();
- } while (!gc->going_down());
-
- return NULL;
-}
-
-void RGWGC::GCWorker::stop()
-{
- Mutex::Locker l(lock);
- cond.Signal();
-}
-