/* Copyright (c) 2013-2014 Red Hat, Inc. This file is part of GlusterFS. This file is licensed to you under your choice of the GNU Lesser General Public License, version 3 or any later version (LGPLv3 or later), or the GNU General Public License, version 2 (GPLv2), in all cases as published by the Free Software Foundation. */ #ifndef _CONFIG_H #define _CONFIG_H #include "config.h" #endif #include #include #include #include #include #include #include #if !defined(__NetBSD__) && !defined(GF_DARWIN_HOST_OS) #include #else #include "mntent_compat.h" #endif #ifdef __NetBSD__ #define umount2(dir, flags) unmount(dir, ((flags) != 0) ? MNT_FORCE : 0) #endif #ifdef GF_DARWIN_HOST_OS #include #include #define umount2(dir, flags) unmount(dir, ((flags) != 0) ? MNT_FORCE : 0) #endif #include #include "globals.h" #include "compat.h" #include "protocol-common.h" #include "xlator.h" #include "logging.h" #include "timer.h" #include "glusterd-mem-types.h" #include "glusterd.h" #include "glusterd-sm.h" #include "glusterd-op-sm.h" #include "glusterd-utils.h" #include "glusterd-store.h" #include "run.h" #include "glusterd-volgen.h" #include "glusterd-mgmt.h" #include "glusterd-syncop.h" #include "syscall.h" #include "cli1-xdr.h" #include "xdr-generic.h" #include "lvm-defaults.h" char snap_mount_folder[PATH_MAX]; struct snap_create_args_ { xlator_t *this; dict_t *dict; dict_t *rsp_dict; glusterd_volinfo_t *snap_vol; glusterd_brickinfo_t *brickinfo; struct syncargs *args; int32_t volcount; int32_t brickcount; int32_t brickorder; }; typedef struct snap_create_args_ snap_create_args_t; /* This function is called to get the device path of the snap lvm. Usually if /dev/mapper/- is the device for the lvm, then the snap device will be /dev//. This function takes care of building the path for the snap device. */ char * glusterd_build_snap_device_path (char *device, char *snapname, int32_t brickcount) { char snap[PATH_MAX] = ""; char msg[1024] = ""; char volgroup[PATH_MAX] = ""; char *snap_device = NULL; xlator_t *this = NULL; runner_t runner = {0,}; char *ptr = NULL; int ret = -1; this = THIS; GF_ASSERT (this); if (!device) { gf_log (this->name, GF_LOG_ERROR, "device is NULL"); goto out; } if (!snapname) { gf_log (this->name, GF_LOG_ERROR, "snapname is NULL"); goto out; } runinit (&runner); runner_add_args (&runner, "/sbin/lvs", "--noheadings", "-o", "vg_name", device, NULL); runner_redir (&runner, STDOUT_FILENO, RUN_PIPE); snprintf (msg, sizeof (msg), "Get volume group for device %s", device); runner_log (&runner, this->name, GF_LOG_DEBUG, msg); ret = runner_start (&runner); if (ret == -1) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volume group " "for device %s", device); runner_end (&runner); goto out; } ptr = fgets(volgroup, sizeof(volgroup), runner_chio (&runner, STDOUT_FILENO)); if (!ptr || !strlen(volgroup)) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volume group " "for snap %s", snapname); runner_end (&runner); ret = -1; goto out; } runner_end (&runner); snprintf (snap, sizeof(snap), "/dev/%s/%s_%d", gf_trim(volgroup), snapname, brickcount); snap_device = gf_strdup (snap); if (!snap_device) { gf_log (this->name, GF_LOG_WARNING, "Cannot copy the " "snapshot device name for snapname: %s", snapname); } out: return snap_device; } /* Look for disconnected peers, for missed snap creates or deletes */ static int32_t glusterd_find_missed_snap (dict_t *rsp_dict, glusterd_volinfo_t *vol, struct list_head *peers, int32_t op) { int32_t brick_count = -1; int32_t ret = -1; xlator_t *this = NULL; glusterd_peerinfo_t *peerinfo = NULL; glusterd_brickinfo_t *brickinfo = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (rsp_dict); GF_ASSERT (peers); GF_ASSERT (vol); brick_count = 0; list_for_each_entry (brickinfo, &vol->bricks, brick_list) { if (!uuid_compare (brickinfo->uuid, MY_UUID)) { /* If the brick belongs to the same node */ brick_count++; continue; } list_for_each_entry (peerinfo, peers, uuid_list) { if (uuid_compare (peerinfo->uuid, brickinfo->uuid)) { /* If the brick doesnt belong to this peer */ continue; } /* Found peer who owns the brick, * * if peer is not connected or not * * friend add it to missed snap list */ if (!(peerinfo->connected) || (peerinfo->state.state != GD_FRIEND_STATE_BEFRIENDED)) { ret = glusterd_add_missed_snaps_to_dict (rsp_dict, vol, brickinfo, brick_count + 1, op); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to add missed snapshot " "info for %s:%s in the " "rsp_dict", brickinfo->hostname, brickinfo->path); goto out; } } } brick_count++; } ret = 0; out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int snap_max_limits_display_commit (dict_t *rsp_dict, char *volname, char *op_errstr) { char err_str[PATH_MAX] = ""; char buf[PATH_MAX] = ""; glusterd_conf_t *conf = NULL; glusterd_volinfo_t *volinfo = NULL; int ret = -1; uint64_t active_hard_limit = 0; uint64_t snap_max_limit = 0; uint64_t soft_limit_value = -1; uint64_t count = 0; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (rsp_dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); if (!volname) { /* For system limit */ list_for_each_entry (volinfo, &conf->volumes, vol_list) { if (volinfo->is_snap_volume == _gf_true) continue; snap_max_limit = volinfo->snap_max_hard_limit; if (snap_max_limit > conf->snap_max_hard_limit) active_hard_limit = conf->snap_max_hard_limit; else active_hard_limit = snap_max_limit; soft_limit_value = (active_hard_limit * conf->snap_max_soft_limit) / 100; snprintf (buf, sizeof(buf), "volume%"PRId64"-volname", count); ret = dict_set_str (rsp_dict, buf, volinfo->volname); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-snap-max-hard-limit", count); ret = dict_set_uint64 (rsp_dict, buf, snap_max_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-active-hard-limit", count); ret = dict_set_uint64 (rsp_dict, buf, active_hard_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-snap-max-soft-limit", count); ret = dict_set_uint64 (rsp_dict, buf, soft_limit_value); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } count++; } ret = dict_set_uint64 (rsp_dict, "voldisplaycount", count); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set voldisplaycount"); goto out; } } else { /* For one volume */ ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, PATH_MAX, "Failed to get the" " volinfo for volume %s", volname); goto out; } snap_max_limit = volinfo->snap_max_hard_limit; if (snap_max_limit > conf->snap_max_hard_limit) active_hard_limit = conf->snap_max_hard_limit; else active_hard_limit = snap_max_limit; soft_limit_value = (active_hard_limit * conf->snap_max_soft_limit) / 100; snprintf (buf, sizeof(buf), "volume%"PRId64"-volname", count); ret = dict_set_str (rsp_dict, buf, volinfo->volname); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-snap-max-hard-limit", count); ret = dict_set_uint64 (rsp_dict, buf, snap_max_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-active-hard-limit", count); ret = dict_set_uint64 (rsp_dict, buf, active_hard_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } snprintf (buf, sizeof(buf), "volume%"PRId64"-snap-max-soft-limit", count); ret = dict_set_uint64 (rsp_dict, buf, soft_limit_value); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set %s", buf); goto out; } count++; ret = dict_set_uint64 (rsp_dict, "voldisplaycount", count); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set voldisplaycount"); goto out; } } ret = dict_set_uint64 (rsp_dict, "snap-max-hard-limit", conf->snap_max_hard_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set sys-snap-max-hard-limit "); goto out; } ret = dict_set_uint64 (rsp_dict, "snap-max-soft-limit", conf->snap_max_soft_limit); if (ret) { snprintf (err_str, PATH_MAX, "Failed to set sys-snap-max-hard-limit "); goto out; } ret = 0; out: if (ret) { op_errstr = gf_strdup (err_str); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); } return ret; } /* Third argument of scandir(used in glusterd_copy_geo_rep_session_files) * is filter function. As we dont want "." and ".." files present in the * directory, we are excliding these 2 files. * "file_select" function here does the job of filtering. */ int file_select (const struct dirent *entry) { if (entry == NULL) return (FALSE); if ((strcmp(entry->d_name, ".") == 0) || (strcmp(entry->d_name, "..") == 0)) return (FALSE); else return (TRUE); } int32_t glusterd_copy_geo_rep_session_files (char *session, glusterd_volinfo_t *snap_vol) { int32_t ret = -1; char snap_session_dir[PATH_MAX] = ""; char georep_session_dir[PATH_MAX] = ""; regex_t *reg_exp = NULL; int file_count = -1; struct dirent **files = {0,}; xlator_t *this = NULL; int i = 0; char src_path[PATH_MAX] = ""; char dest_path[PATH_MAX] = ""; glusterd_conf_t *priv = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (session); GF_ASSERT (snap_vol); ret = snprintf (georep_session_dir, sizeof (georep_session_dir), "%s/%s/%s", priv->workdir, GEOREP, session); if (ret < 0) { /* Negative value is an error */ goto out; } ret = snprintf (snap_session_dir, sizeof (snap_session_dir), "%s/%s/%s/%s/%s", priv->workdir, GLUSTERD_VOL_SNAP_DIR_PREFIX, snap_vol->snapshot->snapname, GEOREP, session); if (ret < 0) { /* Negative value is an error */ goto out; } ret = mkdir_p (snap_session_dir, 0777, _gf_true); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Creating directory %s failed", snap_session_dir); goto out; } /* TODO : good to have - Allocate in stack instead of heap */ reg_exp = GF_CALLOC (1, sizeof (regex_t), gf_common_mt_regex_t); if (!reg_exp) { ret = -1; gf_log (this->name, GF_LOG_ERROR, "Failed to allocate " "memory for regular expression"); goto out; } ret = regcomp (reg_exp, "(.*status$)|(.*conf$)\0", REG_EXTENDED); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "compile the regular expression"); goto out; } /* If there are no files in a particular session then fail it*/ file_count = scandir (georep_session_dir, &files, file_select, alphasort); if (file_count <= 0) { ret = -1; gf_log (this->name, GF_LOG_ERROR, "Session files not present " "in %s", georep_session_dir); goto out; } /* Now compare the file name with regular expression to see if * there is a match */ for (i = 0 ; i < file_count; i++) { if (regexec (reg_exp, files[i]->d_name, 0, NULL, 0)) continue; ret = snprintf (src_path, sizeof (src_path), "%s/%s", georep_session_dir, files[i]->d_name); if (ret < 0) { goto out; } ret = snprintf (dest_path , sizeof (dest_path), "%s/%s", snap_session_dir, files[i]->d_name); if (ret < 0) { goto out; } ret = glusterd_copy_file (src_path, dest_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not " "copy file %s of session %s", files[i]->d_name, session); goto out; } } out: if (reg_exp) GF_FREE (reg_exp); return ret; } /* This function will take backup of the volume store * of the to-be restored volume. This will help us to * revert the operation if it fails. * * @param volinfo volinfo of the origin volume * * @return 0 on success and -1 on failure */ int glusterd_snapshot_backup_vol (glusterd_volinfo_t *volinfo) { char pathname[PATH_MAX] = {0,}; int ret = -1; int op_ret = 0; char delete_path[PATH_MAX] = {0,}; char trashdir[PATH_MAX] = {0,}; glusterd_conf_t *priv = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (volinfo); GLUSTERD_GET_VOLUME_DIR (pathname, volinfo, priv); snprintf (delete_path, sizeof (delete_path), "%s/"GLUSTERD_TRASH"/vols-%s.deleted", priv->workdir, volinfo->volname); snprintf (trashdir, sizeof (trashdir), "%s/"GLUSTERD_TRASH, priv->workdir); /* Create trash folder if it is not there */ ret = mkdir (trashdir, 0777); if (ret && errno != EEXIST) { gf_log (this->name, GF_LOG_ERROR, "Failed to create trash " "directory, reason : %s", strerror (errno)); ret = -1; goto out; } /* Move the origin volume volder to the backup location */ ret = rename (pathname, delete_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to rename snap " "directory %s to %s", pathname, delete_path); goto out; } /* Re-create an empty origin volume folder so that restore can * happen. */ ret = mkdir (pathname, 0777); if (ret && errno != EEXIST) { gf_log (this->name, GF_LOG_ERROR, "Failed to create origin " "volume directory (%s), reason : %s", pathname, strerror (errno)); ret = -1; goto out; } ret = 0; out: /* Save the actual return value */ op_ret = ret; if (ret) { /* Revert the changes in case of failure */ ret = rmdir (pathname); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "Failed to rmdir: %s,err: %s", pathname, strerror (errno)); } ret = rename (delete_path, pathname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to rename directory %s to %s", delete_path, pathname); } ret = rmdir (trashdir); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "Failed to rmdir: %s, Reason: %s", trashdir, strerror (errno)); } } gf_log (this->name, GF_LOG_TRACE, "Returning %d", op_ret); return op_ret; } int32_t glusterd_copy_geo_rep_files (glusterd_volinfo_t *origin_vol, glusterd_volinfo_t *snap_vol, dict_t *rsp_dict) { int32_t ret = -1; int i = 0; xlator_t *this = NULL; char key[PATH_MAX] = ""; char session[PATH_MAX] = ""; char slave[PATH_MAX] = ""; char snapgeo_dir[PATH_MAX] = ""; glusterd_conf_t *priv = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (origin_vol); GF_ASSERT (snap_vol); GF_ASSERT (rsp_dict); /* This condition is not satisfied if the volume * is slave volume. */ if (!origin_vol->gsync_slaves) { ret = 0; goto out; } GLUSTERD_GET_SNAP_GEO_REP_DIR(snapgeo_dir, snap_vol->snapshot, priv); ret = mkdir (snapgeo_dir, 0777); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Creating directory %s failed", snapgeo_dir); goto out; } for (i = 1 ; i <= origin_vol->gsync_slaves->count ; i++) { ret = snprintf (key, sizeof (key), "slave%d", i); if (ret < 0) /* Negative value is an error */ goto out; ret = glusterd_get_geo_rep_session (key, origin_vol->volname, origin_vol->gsync_slaves, session, slave); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get geo-rep session"); goto out; } ret = glusterd_copy_geo_rep_session_files (session, snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to copy files" " related to session %s", session); goto out; } } out: return ret; } /* This function will restore a snapshot volumes * * @param dict dictionary containing snapshot restore request * @param op_errstr In case of any failure error message will be returned * in this variable * @return Negative value on Failure and 0 in success */ int glusterd_snapshot_restore (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int ret = -1; int32_t volcount = -1; char *snapname = NULL; xlator_t *this = NULL; glusterd_volinfo_t *snap_volinfo = NULL; glusterd_volinfo_t *tmp = NULL; glusterd_volinfo_t *parent_volinfo = NULL; glusterd_snap_t *snap = NULL; glusterd_conf_t *priv = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); priv = this->private; GF_ASSERT (priv); ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "snap name"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (NULL == snap) { ret = gf_asprintf (op_errstr, "Snap (%s) not found", snapname); if (ret < 0) { goto out; } gf_log (this->name, GF_LOG_ERROR, "%s", *op_errstr); ret = -1; goto out; } volcount = 0; list_for_each_entry_safe (snap_volinfo, tmp, &snap->volumes, vol_list) { volcount++; ret = glusterd_volinfo_find (snap_volinfo->parent_volname, &parent_volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not get volinfo of %s", snap_volinfo->parent_volname); goto out; } if (is_origin_glusterd (dict) == _gf_true) { /* From origin glusterd check if * * any peers with snap bricks is down */ ret = glusterd_find_missed_snap (rsp_dict, snap_volinfo, &priv->peers, GF_SNAP_OPTION_TYPE_RESTORE); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to find missed snap restores"); goto out; } } ret = gd_restore_snap_volume (dict, rsp_dict, parent_volinfo, snap_volinfo, volcount); if (ret) { /* No need to update op_errstr because it is assumed * that the called function will do that in case of * failure. */ gf_log (this->name, GF_LOG_ERROR, "Failed to restore " "snap for %s", snapname); goto out; } } ret = 0; /* TODO: Need to check if we need to delete the snap after the * operation is successful or not. Also need to persist the state * of restore operation in the store. */ out: return ret; } /* This function is called before actual restore is taken place. This function * will validate whether the snapshot volumes are ready to be restored or not. * * @param dict dictionary containing snapshot restore request * @param op_errstr In case of any failure error message will be returned * in this variable * @param rsp_dict response dictionary * @return Negative value on Failure and 0 in success */ int32_t glusterd_snapshot_restore_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int ret = -1; int32_t i = 0; int32_t volcount = 0; int32_t brick_count = 0; gf_boolean_t snap_restored = _gf_false; char key[PATH_MAX] = {0, }; char *volname = NULL; char *snapname = NULL; glusterd_volinfo_t *volinfo = NULL; glusterd_brickinfo_t *brickinfo = NULL; glusterd_snap_t *snap = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "snap name"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (NULL == snap) { ret = gf_asprintf (op_errstr, "Snap (%s) not found", snapname); if (ret < 0) { goto out; } gf_log (this->name, GF_LOG_ERROR, "%s", *op_errstr); ret = -1; goto out; } snap_restored = snap->snap_restored; if (snap_restored) { ret = gf_asprintf (op_errstr, "Snap (%s) is already " "restored", snapname); if (ret < 0) { goto out; } gf_log (this->name, GF_LOG_ERROR, "%s", *op_errstr); ret = -1; goto out; } ret = dict_set_str (rsp_dict, "snapname", snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "snap name(%s)", snapname); goto out; } ret = dict_get_int32 (dict, "volcount", &volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volume count"); goto out; } /* Snapshot restore will only work if all the volumes, that are part of the snapshot, are stopped. */ for (i = 1; i <= volcount; ++i) { snprintf (key, sizeof (key), "volname%d", i); ret = dict_get_str (dict, key, &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "get volume name"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { ret = gf_asprintf (op_errstr, "Volume (%s) not found", volname); if (ret < 0) { goto out; } gf_log (this->name, GF_LOG_ERROR, "%s", *op_errstr); ret = -1; goto out; } if (glusterd_is_volume_started (volinfo)) { ret = gf_asprintf (op_errstr, "Volume (%s) has been " "started. Volume needs to be stopped before restoring " "a snapshot.", volname); if (ret < 0) { goto out; } gf_log (this->name, GF_LOG_ERROR, "%s", *op_errstr); ret = -1; goto out; } /* Take backup of the volinfo folder */ ret = glusterd_snapshot_backup_vol (volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to backup " "volume backend files for %s volume", volinfo->volname); goto out; } } /* Get brickinfo for snap_volumes */ volcount = 0; list_for_each_entry (volinfo, &snap->volumes, vol_list) { volcount++; brick_count = 0; list_for_each_entry (brickinfo, &volinfo->bricks, brick_list) { brick_count++; if (uuid_compare (brickinfo->uuid, MY_UUID)) continue; snprintf (key, sizeof (key), "snap%d.brick%d.path", volcount, brick_count); ret = dict_set_str (rsp_dict, key, brickinfo->path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "snap%d.brick%d.snap_status", volcount, brick_count); ret = dict_set_int32 (rsp_dict, key, brickinfo->snap_status); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "snap%d.brick%d.device_path", volcount, brick_count); ret = dict_set_str (rsp_dict, key, brickinfo->device_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } } snprintf (key, sizeof (key), "snap%d.brick_count", volcount); ret = dict_set_int32 (rsp_dict, key, brick_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } } ret = dict_set_int32 (rsp_dict, "volcount", volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } out: return ret; } int snap_max_hard_limits_validate (dict_t *dict, char *volname, uint64_t value, char **op_errstr) { char err_str[PATH_MAX] = ""; glusterd_conf_t *conf = NULL; glusterd_volinfo_t *volinfo = NULL; int ret = -1; uint64_t max_limit = GLUSTERD_SNAPS_MAX_HARD_LIMIT; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); if (volname) { ret = glusterd_volinfo_find (volname, &volinfo); if (!ret) { if (volinfo->is_snap_volume) { ret = -1; snprintf (err_str, PATH_MAX, "%s is a snap volume. Configuring " "snap-max-hard-limit for a snap " "volume is prohibited.", volname); goto out; } } } if (value) { /* Max limit for the system is GLUSTERD_SNAPS_MAX_HARD_LIMIT * but max limit for a volume is conf->snap_max_hard_limit. */ if (volname) { max_limit = conf->snap_max_hard_limit; } else { max_limit = GLUSTERD_SNAPS_MAX_HARD_LIMIT; } } if ((value < 0) || (value > max_limit)) { ret = -1; snprintf (err_str, PATH_MAX, "Invalid snap-max-hard-limit " "%"PRIu64 ". Expected range 1 - %"PRIu64, value, max_limit); goto out; } ret = 0; out: if (ret) { *op_errstr = gf_strdup (err_str); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); } return ret; } int glusterd_snapshot_config_prevalidate (dict_t *dict, char **op_errstr) { char *volname = NULL; glusterd_volinfo_t *volinfo = NULL; xlator_t *this = NULL; int ret = -1; int config_command = 0; char err_str[PATH_MAX] = {0,}; glusterd_conf_t *conf = NULL; uint64_t hard_limit = 0; uint64_t soft_limit = 0; gf_loglevel_t loglevel = GF_LOG_ERROR; uint64_t max_limit = GLUSTERD_SNAPS_MAX_HARD_LIMIT; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); ret = dict_get_int32 (dict, "config-command", &config_command); if (ret) { snprintf (err_str, sizeof (err_str), "failed to get config-command type"); goto out; } ret = dict_get_uint64 (dict, "snap-max-hard-limit", &hard_limit); ret = dict_get_uint64 (dict, "snap-max-soft-limit", &soft_limit); ret = dict_get_str (dict, "volname", &volname); if (volname) { ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, sizeof (err_str), "Volume %s does not exist.", volname); goto out; } } switch (config_command) { case GF_SNAP_CONFIG_TYPE_SET: if (hard_limit) { /* Validations for snap-max-hard-limits */ ret = snap_max_hard_limits_validate (dict, volname, hard_limit, op_errstr); if (ret) { gf_log (this->name, GF_LOG_ERROR, "snap-max-hard-limit validation " "failed."); goto out; } } if (soft_limit) { max_limit = GLUSTERD_SNAPS_MAX_SOFT_LIMIT_PERCENT; if ((soft_limit < 0) || (soft_limit > max_limit)) { ret = -1; snprintf (err_str, PATH_MAX, "Invalid " "snap-max-soft-limit ""%" PRIu64 ". Expected range 1 - %"PRIu64, soft_limit, max_limit); goto out; } break; } default: break; } ret = 0; out: if (ret && err_str[0] != '\0') { gf_log (this->name, loglevel, "%s", err_str); *op_errstr = gf_strdup (err_str); } return ret; } /* This function will be called from RPC handler routine. * This function is responsible for getting the requested * snapshot config into the dictionary. * * @param req RPC request object. Required for sending a response back. * @param op glusterd operation. Required for sending a response back. * @param dict pointer to dictionary which will contain both * request and response key-pair values. * @return -1 on error and 0 on success */ int glusterd_handle_snapshot_config (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int32_t ret = -1; char *volname = NULL; xlator_t *this = NULL; int config_command = 0; this = THIS; GF_ASSERT (this); GF_VALIDATE_OR_GOTO (this->name, req, out); GF_VALIDATE_OR_GOTO (this->name, dict, out); /* TODO : Type of lock to be taken when we are setting * limits system wide */ ret = dict_get_int32 (dict, "config-command", &config_command); if (ret) { snprintf (err_str, len, "Failed to get config-command type"); goto out; } ret = dict_get_str (dict, "volname", &volname); switch (config_command) { case GF_SNAP_CONFIG_TYPE_SET: if (!volname) { ret = dict_set_int32 (dict, "hold_vol_locks", _gf_false); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set hold_vol_locks value " "as _gf_false"); goto out; } } ret = glusterd_mgmt_v3_initiate_all_phases (req, op, dict); break; case GF_SNAP_CONFIG_DISPLAY: /* Reading data from local node only */ ret = snap_max_limits_display_commit (dict, volname, err_str); if (ret) { gf_log (this->name, GF_LOG_ERROR, "snap-max-limit " "display commit failed."); goto out; } /* If everything is successful then send the response * back to cli */ ret = glusterd_op_send_cli_response (op, 0, 0, req, dict, err_str); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to send cli " "response"); goto out; } break; default: gf_log (this->name, GF_LOG_ERROR, "Unknown config type"); ret = -1; break; } out: return ret; } int glusterd_snap_create_pre_val_use_rsp_dict (dict_t *dst, dict_t *src) { char *snap_brick_dir = NULL; char *snap_device = NULL; char key[PATH_MAX] = ""; char snapbrckcnt[PATH_MAX] = ""; char snapbrckord[PATH_MAX] = ""; int ret = -1; int64_t i = -1; int64_t j = -1; int64_t volume_count = 0; int64_t brick_count = 0; int64_t brick_order = 0; xlator_t *this = NULL; int32_t brick_online = 0; this = THIS; GF_ASSERT (this); GF_ASSERT (dst); GF_ASSERT (src); ret = dict_get_int64 (src, "volcount", &volume_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "get the volume count"); goto out; } for (i = 0; i < volume_count; i++) { memset (snapbrckcnt, '\0', sizeof(snapbrckcnt)); ret = snprintf (snapbrckcnt, sizeof(snapbrckcnt) - 1, "vol%"PRId64"_brickcount", i+1); ret = dict_get_int64 (src, snapbrckcnt, &brick_count); if (ret) { gf_log (this->name, GF_LOG_TRACE, "No bricks for this volume in this dict"); continue; } for (j = 0; j < brick_count; j++) { /* Fetching data from source dict */ snprintf (key, sizeof(key) - 1, "vol%"PRId64".brickdir%"PRId64, i+1, j); ret = dict_get_ptr (src, key, (void **)&snap_brick_dir); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Unable to fetch %s", key); continue; } /* Fetching brick order from source dict */ snprintf (snapbrckord, sizeof(snapbrckord) - 1, "vol%"PRId64".brick%"PRId64".order", i+1, j); ret = dict_get_int64 (src, snapbrckord, &brick_order); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get brick order"); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64".brickdir%"PRId64, i+1, brick_order); ret = dict_set_dynstr_with_alloc (dst, key, snap_brick_dir); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64".brick_snapdevice%"PRId64, i+1, j); ret = dict_get_ptr (src, key, (void **)&snap_device); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_device"); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64".brick_snapdevice%"PRId64, i+1, brick_order); ret = dict_set_dynstr_with_alloc (dst, key, snap_device); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "vol%"PRId64".brick%"PRId64".status", i+1, brick_order); ret = dict_get_int32 (src, key, &brick_online); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "get the brick status"); goto out; } ret = dict_set_int32 (dst, key, brick_online); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "set the brick status"); goto out; } brick_online = 0; } } ret = 0; out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } /* Aggregate brickinfo's of the snap volumes to be restored from */ int32_t glusterd_snap_restore_use_rsp_dict (dict_t *dst, dict_t *src) { char key[PATH_MAX] = ""; char *strvalue = NULL; int32_t value = -1; int32_t i = -1; int32_t j = -1; int32_t vol_count = -1; int32_t brickcount = -1; int32_t ret = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); if (!dst || !src) { gf_log (this->name, GF_LOG_ERROR, "Source or Destination " "dict is empty."); goto out; } ret = dict_get_int32 (src, "volcount", &vol_count); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "No volumes"); ret = 0; goto out; } for (i = 1; i <= vol_count; i++) { snprintf (key, sizeof (key), "snap%d.brick_count", i); ret = dict_get_int32 (src, key, &brickcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get %s", key); goto out; } for (j = 1; j <= brickcount; j++) { snprintf (key, sizeof (key), "snap%d.brick%d.path", i, j); ret = dict_get_str (src, key, &strvalue); if (ret) { /* The brickinfo will be present in * another rsp_dict */ gf_log (this->name, GF_LOG_DEBUG, "%s not present", key); ret = 0; continue; } ret = dict_set_dynstr_with_alloc (dst, key, strvalue); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "snap%d.brick%d.snap_status", i, j); ret = dict_get_int32 (src, key, &value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get %s", key); goto out; } ret = dict_set_int32 (dst, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "snap%d.brick%d.device_path", i, j); ret = dict_get_str (src, key, &strvalue); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get %s", key); goto out; } ret = dict_set_dynstr_with_alloc (dst, key, strvalue); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "Failed to set %s", key); goto out; } } } out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int glusterd_snap_pre_validate_use_rsp_dict (dict_t *dst, dict_t *src) { int ret = -1; int32_t snap_command = 0; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); if (!dst || !src) { gf_log (this->name, GF_LOG_ERROR, "Source or Destination " "dict is empty."); goto out; } ret = dict_get_int32 (dst, "type", &snap_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "unable to get the type of " "the snapshot command"); goto out; } switch (snap_command) { case GF_SNAP_OPTION_TYPE_CREATE: ret = glusterd_snap_create_pre_val_use_rsp_dict (dst, src); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to use " "rsp dict"); goto out; } break; case GF_SNAP_OPTION_TYPE_RESTORE: ret = glusterd_snap_restore_use_rsp_dict (dst, src); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to use " "rsp dict"); goto out; } break; default: break; } ret = 0; out: gf_log (this->name, GF_LOG_DEBUG, "Returning %d", ret); return ret; } int glusterd_add_brick_status_to_dict (dict_t *dict, glusterd_volinfo_t *volinfo, glusterd_brickinfo_t *brickinfo, char *key_prefix) { char pidfile[PATH_MAX] = {0, }; int32_t brick_online = 0; pid_t pid = 0; xlator_t *this = NULL; glusterd_conf_t *conf = NULL; int ret = -1; GF_ASSERT (dict); GF_ASSERT (volinfo); GF_ASSERT (brickinfo); this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); if (!key_prefix) { gf_log (this->name, GF_LOG_ERROR, "key prefix is NULL"); goto out; } GLUSTERD_GET_BRICK_PIDFILE (pidfile, volinfo, brickinfo, conf); brick_online = gf_is_service_running (pidfile, &pid); ret = dict_set_int32 (dict, key_prefix, brick_online); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key_prefix); goto out; } brick_online = 0; ret = 0; out: return ret; } int glusterd_snapshot_create_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { char *volname = NULL; char *snapname = NULL; char *device = NULL; char key[PATH_MAX] = ""; char snap_volname[64] = ""; char err_str[PATH_MAX] = ""; int ret = -1; int64_t i = 0; int64_t volcount = 0; int64_t brick_count = 0; int64_t brick_order = 0; glusterd_brickinfo_t *brickinfo = NULL; glusterd_volinfo_t *volinfo = NULL; xlator_t *this = NULL; uuid_t *snap_volid = NULL; gf_loglevel_t loglevel = GF_LOG_ERROR; glusterd_conf_t *conf = NULL; int64_t effective_max_limit = 0; int flags = 0; this = THIS; GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); ret = dict_get_int64 (dict, "volcount", &volcount); if (ret) { snprintf (err_str, sizeof (err_str), "Failed to " "get the volume count"); goto out; } if (volcount <= 0) { snprintf (err_str, sizeof (err_str), "Invalid volume count %"PRId64 " supplied", volcount); ret = -1; goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { snprintf (err_str, sizeof (err_str), "Failed to get snapname"); goto out; } ret = dict_get_int32 (dict, "flags", &flags); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to get flags"); goto out; } if (glusterd_find_snap_by_name (snapname)) { ret = -1; snprintf (err_str, sizeof (err_str), "Snap %s already exists", snapname); goto out; } for (i = 1; i <= volcount; i++) { snprintf (key, sizeof (key), "volname%"PRId64, i); ret = dict_get_str (dict, key, &volname); if (ret) { snprintf (err_str, sizeof (err_str), "failed to get volume name"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, sizeof (err_str), "Volume (%s) does not exist ", volname); goto out; } ret = -1; if (!glusterd_is_volume_started (volinfo)) { snprintf (err_str, sizeof (err_str), "volume %s is " "not started", volinfo->volname); loglevel = GF_LOG_WARNING; goto out; } if (glusterd_is_defrag_on (volinfo)) { snprintf (err_str, sizeof (err_str), "rebalance process is running for the " "volume %s", volname); loglevel = GF_LOG_WARNING; goto out; } /* TODO: Also check whether geo replication is running */ if (volinfo->is_snap_volume == _gf_true) { snprintf (err_str, sizeof (err_str), "Volume %s is a snap volume", volname); loglevel = GF_LOG_WARNING; goto out; } if (volinfo->snap_max_hard_limit < conf->snap_max_hard_limit) effective_max_limit = volinfo->snap_max_hard_limit; else effective_max_limit = conf->snap_max_hard_limit; if (volinfo->snap_count >= effective_max_limit) { snprintf (err_str, sizeof (err_str), "The number of existing snaps has reached " "the effective maximum limit of %"PRIu64" ," "for the volume %s", effective_max_limit, volname); loglevel = GF_LOG_WARNING; goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64"_volid", i); ret = dict_get_bin (dict, key, (void **)&snap_volid); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volid"); goto out; } /* snap volume uuid is used as lvm snapshot name. This will avoid restrictions on snapshot names provided by user */ GLUSTERD_GET_UUID_NOHYPHEN (snap_volname, *snap_volid); brick_count = 0; brick_order = 0; /* Adding snap bricks mount paths to the dict */ list_for_each_entry (brickinfo, &volinfo->bricks, brick_list) { if (uuid_compare (brickinfo->uuid, MY_UUID)) { brick_order++; continue; } if (!glusterd_is_brick_started (brickinfo)) { if(flags & GF_CLI_FLAG_OP_FORCE) { gf_log (this->name, GF_LOG_WARNING, "brick %s:%s is not started", brickinfo->hostname, brickinfo->path); brick_order++; brick_count++; continue; } snprintf (err_str, sizeof (err_str), "brick %s:%s is not started. " "Please start the stopped brick " "and then issue snapshot create " "command or use [force] option in " "snapshot create to override this " "behavior.", brickinfo->hostname, brickinfo->path); ret = -1; goto out; } device = glusterd_get_brick_mount_device (brickinfo->path); if (!device) { snprintf (err_str, sizeof (err_str), "getting device name for the brick " "%s:%s failed", brickinfo->hostname, brickinfo->path); ret = -1; goto out; } device = glusterd_build_snap_device_path (device, snap_volname, brick_count); if (!device) { snprintf (err_str, sizeof (err_str), "cannot copy the snapshot device " "name (volname: %s, snapname: %s)", volinfo->volname, snapname); loglevel = GF_LOG_WARNING; ret = -1; goto out; } snprintf (key, sizeof(key), "vol%"PRId64".brick_snapdevice%"PRId64, i, brick_count); ret = dict_set_dynstr (rsp_dict, key, device); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); GF_FREE (device); goto out; } device = NULL; snprintf (key, sizeof(key), "vol%"PRId64".brickdir%"PRId64, i, brick_count); ret = dict_set_dynstr_with_alloc (rsp_dict, key, brickinfo->mount_dir); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64".brick%"PRId64".order", i, brick_count); ret = dict_set_int64 (rsp_dict, key, brick_order); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } snprintf (key, sizeof (key), "vol%"PRId64".brick%"PRId64".status", i, brick_order); ret = glusterd_add_brick_status_to_dict (rsp_dict, volinfo, brickinfo, key); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "add brick status to dict"); goto out; } brick_count++; brick_order++; } snprintf (key, sizeof(key) - 1, "vol%"PRId64"_brickcount", i); ret = dict_set_int64 (rsp_dict, key, brick_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } } ret = dict_set_int64 (rsp_dict, "volcount", volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set volcount"); goto out; } ret = 0; out: if (device) GF_FREE (device); if (ret && err_str[0] != '\0') { gf_log (this->name, loglevel, "%s", err_str); *op_errstr = gf_strdup (err_str); } gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } glusterd_snap_t* glusterd_new_snap_object() { glusterd_snap_t *snap = NULL; snap = GF_CALLOC (1, sizeof (*snap), gf_gld_mt_snap_t); if (snap) { if (LOCK_INIT (&snap->lock)) { gf_log (THIS->name, GF_LOG_ERROR, "Failed initiating" " snap lock"); GF_FREE (snap); return NULL; } INIT_LIST_HEAD (&snap->snap_list); INIT_LIST_HEAD (&snap->volumes); snap->snapname[0] = 0; snap->snap_status = GD_SNAP_STATUS_INIT; } return snap; }; /* Function glusterd_list_add_snapvol adds the volinfo object (snapshot volume) to the snapshot object list and to the parent volume list */ int32_t glusterd_list_add_snapvol (glusterd_volinfo_t *origin_vol, glusterd_volinfo_t *snap_vol) { int ret = -1; glusterd_snap_t *snap = NULL; GF_VALIDATE_OR_GOTO ("glusterd", origin_vol, out); GF_VALIDATE_OR_GOTO ("glusterd", snap_vol, out); snap = snap_vol->snapshot; GF_ASSERT (snap); list_add_tail (&snap_vol->vol_list, &snap->volumes); LOCK (&origin_vol->lock); { list_add_order (&snap_vol->snapvol_list, &origin_vol->snap_volumes, glusterd_compare_snap_vol_time); origin_vol->snap_count++; } UNLOCK (&origin_vol->lock); gf_log (THIS->name, GF_LOG_DEBUG, "Snap %s added to the list", snap->snapname); ret = 0; out: return ret; } glusterd_snap_t* glusterd_find_snap_by_name (char *snapname) { glusterd_snap_t *snap = NULL; glusterd_conf_t *priv = NULL; priv = THIS->private; GF_ASSERT (priv); GF_ASSERT (snapname); list_for_each_entry (snap, &priv->snapshots, snap_list) { if (!strcmp (snap->snapname, snapname)) { gf_log (THIS->name, GF_LOG_DEBUG, "Found " "snap %s (%s)", snap->snapname, uuid_utoa (snap->snap_id)); goto out; } } snap = NULL; out: return snap; } glusterd_snap_t* glusterd_find_snap_by_id (uuid_t snap_id) { glusterd_snap_t *snap = NULL; glusterd_conf_t *priv = NULL; priv = THIS->private; GF_ASSERT (priv); if (uuid_is_null(snap_id)) goto out; list_for_each_entry (snap, &priv->snapshots, snap_list) { if (!uuid_compare (snap->snap_id, snap_id)) { gf_log (THIS->name, GF_LOG_DEBUG, "Found " "snap %s (%s)", snap->snapname, uuid_utoa (snap->snap_id)); goto out; } } snap = NULL; out: return snap; } int glusterd_do_lvm_snapshot_remove (glusterd_volinfo_t *snap_vol, glusterd_brickinfo_t *brickinfo, const char *mount_pt, const char *snap_device) { int ret = -1; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; runner_t runner = {0,}; char msg[1024] = {0, }; char pidfile[PATH_MAX] = {0, }; pid_t pid = -1; int retry_count = 0; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); if (!brickinfo) { gf_log (this->name, GF_LOG_ERROR, "brickinfo NULL"); goto out; } GF_ASSERT (snap_vol); GF_ASSERT (mount_pt); GF_ASSERT (snap_device); GLUSTERD_GET_BRICK_PIDFILE (pidfile, snap_vol, brickinfo, priv); if (gf_is_service_running (pidfile, &pid)) { ret = kill (pid, SIGKILL); if (ret && errno != ESRCH) { gf_log (this->name, GF_LOG_ERROR, "Unable to kill pid " "%d reason : %s", pid, strerror(errno)); goto out; } } /* umount cannot be done when the brick process is still in the process of shutdown, so give three re-tries */ while (retry_count < 3) { retry_count++; ret = umount2(mount_pt, MNT_FORCE); if (!ret) break; if (errno == EBUSY) { gf_log (this->name, GF_LOG_DEBUG, "umount failed for " "path %s (brick: %s): %s. Retry(%d)", mount_pt, brickinfo->path, strerror (errno), retry_count); } else { gf_log (this->name, GF_LOG_ERROR, "umount failed for " "path %s (brick: %s): %s.", mount_pt, brickinfo->path, strerror (errno)); goto out; } sleep (1); } if (ret) goto out; runinit (&runner); snprintf (msg, sizeof(msg), "remove snapshot of the brick %s:%s, " "device: %s", brickinfo->hostname, brickinfo->path, snap_device); runner_add_args (&runner, LVM_REMOVE, "-f", snap_device, NULL); runner_log (&runner, "", GF_LOG_DEBUG, msg); ret = runner_run (&runner); if (ret) { gf_log (this->name, GF_LOG_ERROR, "removing snapshot of the " "brick (%s:%s) of device %s failed", brickinfo->hostname, brickinfo->path, snap_device); goto out; } out: return ret; } int32_t glusterd_lvm_snapshot_remove (dict_t *rsp_dict, glusterd_volinfo_t *snap_vol) { char *mnt_pt = NULL; struct mntent *entry = NULL; struct mntent save_entry = {0,}; int32_t brick_count = -1; int32_t ret = -1; glusterd_brickinfo_t *brickinfo = NULL; xlator_t *this = NULL; char buff [PATH_MAX] = ""; this = THIS; GF_ASSERT (this); GF_ASSERT (snap_vol); if ((snap_vol->is_snap_volume == _gf_false) && (uuid_is_null (snap_vol->restored_from_snap))) { gf_log (this->name, GF_LOG_DEBUG, "Not a snap volume, or a restored snap volume."); ret = 0; goto out; } brick_count = -1; list_for_each_entry (brickinfo, &snap_vol->bricks, brick_list) { brick_count++; if (uuid_compare (brickinfo->uuid, MY_UUID)) { gf_log (this->name, GF_LOG_DEBUG, "%s:%s belongs to a different node", brickinfo->hostname, brickinfo->path); continue; } if (brickinfo->snap_status == -1) { gf_log (this->name, GF_LOG_INFO, "snapshot was pending. lvm not present " "for brick %s:%s of the snap %s.", brickinfo->hostname, brickinfo->path, snap_vol->snapshot->snapname); if (rsp_dict && (snap_vol->is_snap_volume == _gf_true)) { /* Adding missed delete to the dict */ ret = glusterd_add_missed_snaps_to_dict (rsp_dict, snap_vol, brickinfo, brick_count + 1, GF_SNAP_OPTION_TYPE_DELETE); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to add missed snapshot " "info for %s:%s in the " "rsp_dict", brickinfo->hostname, brickinfo->path); goto out; } } continue; } ret = glusterd_get_brick_root (brickinfo->path, &mnt_pt); if (ret) { gf_log (this->name, GF_LOG_WARNING, "getting the root " "of the brick for volume %s (snap %s) failed ", snap_vol->volname, snap_vol->snapshot->snapname); goto out; } entry = glusterd_get_mnt_entry_info (mnt_pt, buff, sizeof (buff), &save_entry); if (!entry) { gf_log (this->name, GF_LOG_WARNING, "getting the mount" " entry for the brick %s:%s of the snap %s " "(volume: %s) failed", brickinfo->hostname, brickinfo->path, snap_vol->snapshot->snapname, snap_vol->volname); ret = -1; goto out; } ret = glusterd_do_lvm_snapshot_remove (snap_vol, brickinfo, mnt_pt, entry->mnt_fsname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "remove the snapshot %s (%s)", brickinfo->path, entry->mnt_fsname); goto out; } } ret = 0; out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int32_t glusterd_snap_volume_remove (dict_t *rsp_dict, glusterd_volinfo_t *snap_vol, gf_boolean_t remove_lvm, gf_boolean_t force) { int ret = -1; int save_ret = 0; glusterd_brickinfo_t *brickinfo = NULL; glusterd_volinfo_t *origin_vol = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (rsp_dict); GF_ASSERT (snap_vol); if (!snap_vol) { gf_log(this->name, GF_LOG_WARNING, "snap_vol in NULL"); ret = -1; goto out; } list_for_each_entry (brickinfo, &snap_vol->bricks, brick_list) { if (uuid_compare (brickinfo->uuid, MY_UUID)) continue; ret = glusterd_brick_stop (snap_vol, brickinfo, _gf_false); if (ret) { gf_log(this->name, GF_LOG_WARNING, "Failed to stop " "brick for volume %s", snap_vol->volname); save_ret = ret; /* Don't clean up the snap on error when force flag is disabled */ if (!force) goto out; } } /* Only remove the backend lvm when required */ if (remove_lvm) { ret = glusterd_lvm_snapshot_remove (rsp_dict, snap_vol); if (ret) { gf_log(this->name, GF_LOG_WARNING, "Failed to remove " "lvm snapshot volume %s", snap_vol->volname); save_ret = ret; if (!force) goto out; } } ret = glusterd_store_delete_volume (snap_vol); if (ret) { gf_log(this->name, GF_LOG_WARNING, "Failed to remove volume %s " "from store", snap_vol->volname); save_ret = ret; if (!force) goto out; } if (!list_empty(&snap_vol->snapvol_list)) { ret = glusterd_volinfo_find (snap_vol->parent_volname, &origin_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "parent volinfo %s for volume %s", snap_vol->parent_volname, snap_vol->volname); save_ret = ret; if (!force) goto out; } origin_vol->snap_count--; } ret = glusterd_volinfo_delete (snap_vol); if (ret) { gf_log(this->name, GF_LOG_WARNING, "Failed to remove volinfo " "%s ", snap_vol->volname); save_ret = ret; if (!force) goto out; } if (save_ret) ret = save_ret; out: gf_log (this->name, GF_LOG_TRACE, "returning %d", ret); return ret; } int32_t glusterd_snapobject_delete (glusterd_snap_t *snap) { if (snap == NULL) { gf_log(THIS->name, GF_LOG_WARNING, "snap is NULL"); return -1; } list_del_init (&snap->snap_list); list_del_init (&snap->volumes); if (LOCK_DESTROY(&snap->lock)) gf_log (THIS->name, GF_LOG_WARNING, "Failed destroying lock" "of snap %s", snap->snapname); GF_FREE (snap->description); GF_FREE (snap); return 0; } int32_t glusterd_snap_remove (dict_t *rsp_dict, glusterd_snap_t *snap, gf_boolean_t remove_lvm, gf_boolean_t force) { int ret = -1; int save_ret = 0; glusterd_volinfo_t *snap_vol = NULL; glusterd_volinfo_t *tmp = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (rsp_dict); GF_ASSERT (snap); if (!snap) { gf_log(this->name, GF_LOG_WARNING, "snap is NULL"); ret = -1; goto out; } list_for_each_entry_safe (snap_vol, tmp, &snap->volumes, vol_list) { ret = glusterd_snap_volume_remove (rsp_dict, snap_vol, remove_lvm, force); if (ret && !force) { /* Don't clean up the snap on error when force flag is disabled */ gf_log(this->name, GF_LOG_WARNING, "Failed to remove " "volinfo %s for snap %s", snap_vol->volname, snap->snapname); save_ret = ret; goto out; } } ret = glusterd_store_delete_snap (snap); if (ret) { gf_log(this->name, GF_LOG_WARNING, "Failed to remove snap %s " "from store", snap->snapname); save_ret = ret; if (!force) goto out; } ret = glusterd_snapobject_delete (snap); if (ret) gf_log (this->name, GF_LOG_WARNING, "Failed to delete " "snap object %s", snap->snapname); if (save_ret) ret = save_ret; out: gf_log (THIS->name, GF_LOG_TRACE, "returning %d", ret); return ret; } static int glusterd_snapshot_get_snapvol_detail (dict_t *dict, glusterd_volinfo_t *snap_vol, char *keyprefix, int detail) { int ret = -1; int snap_limit = 0; char key[PATH_MAX] = {0,}; char *value = NULL; glusterd_volinfo_t *origin_vol = NULL; glusterd_conf_t *conf = NULL; xlator_t *this = NULL; this = THIS; conf = this->private; GF_ASSERT (conf); GF_ASSERT (dict); GF_ASSERT (snap_vol); GF_ASSERT (keyprefix); /* Volume Name */ value = gf_strdup (snap_vol->volname); if (!value) goto out; snprintf (key, sizeof (key), "%s.volname", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "volume name in dictionary: %s", key); goto out; } /* Volume ID */ value = gf_strdup (uuid_utoa (snap_vol->volume_id)); if (NULL == value) { ret = -1; goto out; } snprintf (key, sizeof (key), "%s.vol-id", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "volume id in dictionary: %s", key); goto out; } value = NULL; /* volume status */ snprintf (key, sizeof (key), "%s.vol-status", keyprefix); switch (snap_vol->status) { case GLUSTERD_STATUS_STARTED: ret = dict_set_str (dict, key, "Started"); break; case GLUSTERD_STATUS_STOPPED: ret = dict_set_str (dict, key, "Stopped"); break; case GD_SNAP_STATUS_NONE: ret = dict_set_str (dict, key, "None"); break; default: gf_log (this->name, GF_LOG_ERROR, "Invalid volume status"); ret = -1; goto out; } if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set volume status" " in dictionary: %s", key); goto out; } ret = glusterd_volinfo_find (snap_vol->parent_volname, &origin_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get the parent " "volinfo for the volume %s", snap_vol->volname); goto out; } /* Snaps available */ if (conf->snap_max_hard_limit < origin_vol->snap_max_hard_limit) { snap_limit = conf->snap_max_hard_limit; gf_log(this->name, GF_LOG_DEBUG, "system snap-max-hard-limit is" " lesser than volume snap-max-hard-limit, " "snap-max-hard-limit value is set to %d", snap_limit); } else { snap_limit = origin_vol->snap_max_hard_limit; gf_log(this->name, GF_LOG_DEBUG, "volume snap-max-hard-limit is" " lesser than system snap-max-hard-limit, " "snap-max-hard-limit value is set to %d", snap_limit); } snprintf (key, sizeof (key), "%s.snaps-available", keyprefix); if (snap_limit > origin_vol->snap_count) ret = dict_set_int32 (dict, key, snap_limit - origin_vol->snap_count); else ret = dict_set_int32 (dict, key, 0); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set available snaps"); goto out; } snprintf (key, sizeof (key), "%s.snapcount", keyprefix); ret = dict_set_int32 (dict, key, origin_vol->snap_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save snapcount"); goto out; } if (!detail) goto out; /* Parent volume name */ value = gf_strdup (snap_vol->parent_volname); if (!value) goto out; snprintf (key, sizeof (key), "%s.origin-volname", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set parent " "volume name in dictionary: %s", key); goto out; } value = NULL; ret = 0; out: if (value) GF_FREE (value); return ret; } static int glusterd_snapshot_get_snap_detail (dict_t *dict, glusterd_snap_t *snap, char *keyprefix, glusterd_volinfo_t *volinfo) { int ret = -1; int volcount = 0; char key[PATH_MAX] = {0,}; char *value = NULL; char *timestr = NULL; struct tm *tmptr = NULL; glusterd_volinfo_t *snap_vol = NULL; glusterd_volinfo_t *tmp_vol = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (dict); GF_ASSERT (snap); GF_ASSERT (keyprefix); /* Snap Name */ value = gf_strdup (snap->snapname); if (!value) goto out; snprintf (key, sizeof (key), "%s.snapname", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "snap name in dictionary"); goto out; } /* Snap ID */ value = gf_strdup (uuid_utoa (snap->snap_id)); if (NULL == value) { ret = -1; goto out; } snprintf (key, sizeof (key), "%s.snap-id", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "snap id in dictionary"); goto out; } value = NULL; tmptr = localtime (&(snap->time_stamp)); if (NULL == tmptr) { gf_log (this->name, GF_LOG_ERROR, "Failed to convert " "time_t to *tm"); ret = -1; goto out; } timestr = GF_CALLOC (1, PATH_MAX, gf_gld_mt_char); if (NULL == timestr) { ret = -1; goto out; } ret = strftime (timestr, PATH_MAX, "%Y-%m-%d %H:%M:%S", tmptr); if (0 == ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to convert time_t " "to string"); ret = -1; goto out; } snprintf (key, sizeof (key), "%s.snap-time", keyprefix); ret = dict_set_dynstr (dict, key, timestr); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "snap time stamp in dictionary"); goto out; } timestr = NULL; /* If snap description is provided then add that into dictionary */ if (NULL != snap->description) { value = gf_strdup (snap->description); if (NULL == value) { ret = -1; goto out; } snprintf (key, sizeof (key), "%s.snap-desc", keyprefix); ret = dict_set_dynstr (dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "snap description in dictionary"); goto out; } value = NULL; } snprintf (key, sizeof (key), "%s.snap-status", keyprefix); switch (snap->snap_status) { case GD_SNAP_STATUS_INIT: ret = dict_set_str (dict, key, "Init"); break; case GD_SNAP_STATUS_IN_USE: ret = dict_set_str (dict, key, "In-use"); break; case GD_SNAP_STATUS_DECOMMISSION: ret = dict_set_str (dict, key, "Decommisioned"); break; case GD_SNAP_STATUS_RESTORED: ret = dict_set_str (dict, key, "Restored"); break; case GD_SNAP_STATUS_NONE: ret = dict_set_str (dict, key, "None"); break; default: gf_log (this->name, GF_LOG_ERROR, "Invalid snap status"); ret = -1; goto out; } if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snap status " "in dictionary"); goto out; } if (volinfo) { volcount = 1; snprintf (key, sizeof (key), "%s.vol%d", keyprefix, volcount); ret = glusterd_snapshot_get_snapvol_detail (dict, volinfo, key, 0); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "get volume detail %s for snap %s", snap_vol->volname, snap->snapname); goto out; } goto done; } list_for_each_entry_safe (snap_vol, tmp_vol, &snap->volumes, vol_list) { volcount++; snprintf (key, sizeof (key), "%s.vol%d", keyprefix, volcount); ret = glusterd_snapshot_get_snapvol_detail (dict, snap_vol, key, 1); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "get volume detail %s for snap %s", snap_vol->volname, snap->snapname); goto out; } } done: snprintf (key, sizeof (key), "%s.vol-count", keyprefix); ret = dict_set_int32 (dict, key, volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } ret = 0; out: if (value) GF_FREE (value); if (timestr) GF_FREE(timestr); return ret; } static int glusterd_snapshot_get_all_snap_info (dict_t *dict) { int ret = -1; int snapcount = 0; char key[PATH_MAX] = {0,}; glusterd_snap_t *snap = NULL; glusterd_snap_t *tmp_snap = NULL; glusterd_conf_t *priv = NULL; xlator_t *this = NULL; this = THIS; priv = this->private; GF_ASSERT (priv); /* General parameter validation */ GF_ASSERT (dict); list_for_each_entry_safe (snap, tmp_snap, &priv->snapshots, snap_list) { snapcount++; snprintf (key, sizeof (key), "snap%d", snapcount); ret = glusterd_snapshot_get_snap_detail (dict, snap, key, NULL); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "snapdetail for snap %s", snap->snapname); goto out; } } ret = dict_set_int32 (dict, "snap-count", snapcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snapcount"); goto out; } ret = 0; out: return ret; } int glusterd_snapshot_get_info_by_volume (dict_t *dict, char *volname, char *err_str, size_t len) { int ret = -1; int snapcount = 0; int snap_limit = 0; char *value = NULL; char key[PATH_MAX] = ""; glusterd_volinfo_t *volinfo = NULL; glusterd_volinfo_t *snap_vol = NULL; glusterd_volinfo_t *tmp_vol = NULL; glusterd_conf_t *conf = NULL; xlator_t *this = NULL; this = THIS; conf = this->private; GF_ASSERT (conf); GF_ASSERT (dict); GF_ASSERT (volname); ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, len, "Volume (%s) does not exist", volname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); goto out; } /* Snaps available */ if (conf->snap_max_hard_limit < volinfo->snap_max_hard_limit) { snap_limit = conf->snap_max_hard_limit; gf_log(this->name, GF_LOG_DEBUG, "system snap-max-hard-limit is" " lesser than volume snap-max-hard-limit, " "snap-max-hard-limit value is set to %d", snap_limit); } else { snap_limit = volinfo->snap_max_hard_limit; gf_log(this->name, GF_LOG_DEBUG, "volume snap-max-hard-limit is" " lesser than system snap-max-hard-limit, " "snap-max-hard-limit value is set to %d", snap_limit); } if (snap_limit > volinfo->snap_count) ret = dict_set_int32 (dict, "snaps-available", snap_limit - volinfo->snap_count); else ret = dict_set_int32 (dict, "snaps-available", 0); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set available snaps"); goto out; } /* Origin volume name */ value = gf_strdup (volinfo->volname); if (!value) goto out; ret = dict_set_dynstr (dict, "origin-volname", value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set parent " "volume name in dictionary: %s", key); goto out; } value = NULL; list_for_each_entry_safe (snap_vol, tmp_vol, &volinfo->snap_volumes, snapvol_list) { snapcount++; snprintf (key, sizeof (key), "snap%d", snapcount); ret = glusterd_snapshot_get_snap_detail (dict, snap_vol->snapshot, key, snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "snapdetail for snap %s", snap_vol->snapshot->snapname); goto out; } } ret = dict_set_int32 (dict, "snap-count", snapcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snapcount"); goto out; } ret = 0; out: if (value) GF_FREE (value); return ret; } /* This function will be called from RPC handler routine. * This function is responsible for getting the requested * snapshot info into the dictionary. * * @param req RPC request object. Required for sending a response back. * @param op glusterd operation. Required for sending a response back. * @param dict pointer to dictionary which will contain both * request and response key-pair values. * @return -1 on error and 0 on success */ int glusterd_handle_snapshot_info (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; int8_t snap_driven = 1; char *volname = NULL; char *snapname = NULL; glusterd_snap_t *snap = NULL; xlator_t *this = NULL; int32_t cmd = GF_SNAP_INFO_TYPE_ALL; this = THIS; GF_ASSERT (this); GF_VALIDATE_OR_GOTO (this->name, req, out); GF_VALIDATE_OR_GOTO (this->name, dict, out); ret = dict_get_int32 (dict, "cmd", &cmd); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get type " "of snapshot info"); goto out; } switch (cmd) { case GF_SNAP_INFO_TYPE_ALL: { ret = glusterd_snapshot_get_all_snap_info (dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get info of all snaps"); goto out; } break; } case GF_SNAP_INFO_TYPE_SNAP: { ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get snap name"); goto out; } ret = dict_set_int32 (dict, "snap-count", 1); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snapcount"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { snprintf (err_str, len, "Snap (%s) does not exist", snapname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); ret = -1; goto out; } ret = glusterd_snapshot_get_snap_detail (dict, snap, "snap1", NULL); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get snap detail of snap " "%s", snap->snapname); goto out; } break; } case GF_SNAP_INFO_TYPE_VOL: { ret = dict_get_str (dict, "volname", &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volname"); goto out; } ret = glusterd_snapshot_get_info_by_volume (dict, volname, err_str, len); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volume info of volume " "%s", volname); goto out; } snap_driven = 0; break; } } ret = dict_set_int8 (dict, "snap-driven", snap_driven); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snap-driven"); goto out; } /* If everything is successful then send the response back to cli. * In case of failure the caller of this function will take care of the response */ ret = glusterd_op_send_cli_response (op, 0, 0, req, dict, err_str); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to send cli " "response"); goto out; } ret = 0; out: return ret; } /* This function sets all the snapshot names in the dictionary */ int glusterd_snapshot_get_all_snapnames (dict_t *dict) { int ret = -1; int snapcount = 0; char *snapname = NULL; char key[PATH_MAX] = {0,}; glusterd_snap_t *snap = NULL; glusterd_snap_t *tmp_snap = NULL; glusterd_conf_t *priv = NULL; xlator_t *this = NULL; this = THIS; priv = this->private; GF_ASSERT (priv); GF_ASSERT (dict); list_for_each_entry_safe (snap, tmp_snap, &priv->snapshots, snap_list) { snapcount++; snapname = gf_strdup (snap->snapname); if (!snapname) { gf_log (this->name, GF_LOG_ERROR, "strdup failed"); ret = -1; goto out; } snprintf (key, sizeof (key), "snapname%d", snapcount); ret = dict_set_dynstr (dict, key, snapname); if (ret) { GF_FREE (snapname); gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } } ret = dict_set_int32 (dict, "snap-count", snapcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snapcount"); goto out; } ret = 0; out: return ret; } /* This function sets all the snapshot names under a given volume in the dictionary */ int glusterd_snapshot_get_vol_snapnames (dict_t *dict, glusterd_volinfo_t *volinfo) { int ret = -1; int snapcount = 0; char *snapname = NULL; char key[PATH_MAX] = {0,}; glusterd_volinfo_t *snap_vol = NULL; glusterd_volinfo_t *tmp_vol = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (dict); GF_ASSERT (volinfo); list_for_each_entry_safe (snap_vol, tmp_vol, &volinfo->snap_volumes, snapvol_list) { snapcount++; snapname = gf_strdup (snap_vol->snapshot->snapname); if (!snapname) { gf_log (this->name, GF_LOG_ERROR, "strdup failed"); ret = -1; goto out; } snprintf (key, sizeof (key), "snapname%d", snapcount); ret = dict_set_dynstr (dict, key, snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "set %s", key); GF_FREE (snapname); goto out; } } ret = dict_set_int32 (dict, "snap-count", snapcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snapcount"); goto out; } ret = 0; out: return ret; } int glusterd_handle_snapshot_list (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; char *volname = NULL; glusterd_volinfo_t *volinfo = NULL; xlator_t *this = NULL; this = THIS; GF_VALIDATE_OR_GOTO (this->name, req, out); GF_VALIDATE_OR_GOTO (this->name, dict, out); /* Ignore error for getting volname as it is optional */ ret = dict_get_str (dict, "volname", &volname); if (NULL == volname) { ret = glusterd_snapshot_get_all_snapnames (dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get snapshot list"); goto out; } } else { ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, len, "Volume (%s) does not exist", volname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); goto out; } ret = glusterd_snapshot_get_vol_snapnames (dict, volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get snapshot list for volume %s", volname); goto out; } } /* If everything is successful then send the response back to cli. In case of failure the caller of this function will take of response.*/ ret = glusterd_op_send_cli_response (op, 0, 0, req, dict, err_str); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to send cli " "response"); goto out; } ret = 0; out: return ret; } /* This is a snapshot create handler function. This function will be * executed in the originator node. This function is responsible for * calling mgmt_v3 framework to do the actual snap creation on all the bricks * * @param req RPC request object * @param op gluster operation * @param dict dictionary containing snapshot restore request * @param err_str In case of an err this string should be populated * @param len length of err_str buffer * * @return Negative value on Failure and 0 in success */ int glusterd_handle_snapshot_create (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; char *volname = NULL; char *snapname = NULL; int64_t volcount = 0; xlator_t *this = NULL; char key[PATH_MAX] = ""; char *username = NULL; char *password = NULL; uuid_t *uuid_ptr = NULL; uuid_t tmp_uuid = {0}; int i = 0; char snap_volname[GD_VOLUME_NAME_MAX] = {0, }; this = THIS; GF_ASSERT (this); GF_ASSERT (req); GF_ASSERT (dict); GF_ASSERT (err_str); ret = dict_get_int64 (dict, "volcount", &volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "get the volume count"); goto out; } if (volcount <= 0) { gf_log (this->name, GF_LOG_ERROR, "Invalid volume count %"PRId64 " supplied", volcount); ret = -1; goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get the snapname"); goto out; } if (strlen(snapname) >= GLUSTERD_MAX_SNAP_NAME) { snprintf (err_str, len, "snapname cannot exceed 255 " "characters"); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); ret = -1; goto out; } uuid_ptr = GF_CALLOC (1, sizeof(uuid_t), gf_common_mt_uuid_t); if (!uuid_ptr) { gf_log (this->name, GF_LOG_ERROR, "Out Of Memory"); ret = -1; goto out; } uuid_generate (*uuid_ptr); ret = dict_set_bin (dict, "snap-id", uuid_ptr, sizeof(uuid_t)); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set snap-id"); GF_FREE (uuid_ptr); goto out; } uuid_ptr = NULL; ret = dict_set_int64 (dict, "snap-time", (int64_t)time(NULL)); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set snap-time"); goto out; } for (i = 1; i <= volcount; i++) { snprintf (key, sizeof (key), "volname%d", i); ret = dict_get_str (dict, key, &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volume name"); goto out; } /* generate internal username and password for the snap*/ uuid_generate (tmp_uuid); username = gf_strdup (uuid_utoa (tmp_uuid)); snprintf (key, sizeof(key), "volume%d_username", i); ret = dict_set_dynstr (dict, key, username); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snap " "username for volume %s", volname); GF_FREE (username); goto out; } uuid_generate (tmp_uuid); password = gf_strdup (uuid_utoa (tmp_uuid)); snprintf (key, sizeof(key), "volume%d_password", i); ret = dict_set_dynstr (dict, key, password); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set snap " "password for volume %s", volname); GF_FREE (password); goto out; } uuid_ptr = GF_CALLOC (1, sizeof(uuid_t), gf_common_mt_uuid_t); if (!uuid_ptr) { gf_log (this->name, GF_LOG_ERROR, "Out Of Memory"); ret = -1; goto out; } snprintf (key, sizeof(key) - 1, "vol%d_volid", i); uuid_generate (*uuid_ptr); ret = dict_set_bin (dict, key, uuid_ptr, sizeof(uuid_t)); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set snap_volid"); GF_FREE (uuid_ptr); goto out; } GLUSTERD_GET_UUID_NOHYPHEN (snap_volname, *uuid_ptr); snprintf (key, sizeof (key), "snap-volname%d", i); ret = dict_set_dynstr_with_alloc (dict, key, snap_volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set snap volname"); GF_FREE (uuid_ptr); goto out; } } ret = glusterd_mgmt_v3_initiate_snap_phases (req, op, dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to initiate snap " "phases"); } out: return ret; } /* This is a snapshot status handler function. This function will be * executed in a originator node. This function is responsible for * calling mgmt v3 framework to get the actual snapshot status from * all the bricks * * @param req RPC request object * @param op gluster operation * @param dict dictionary containing snapshot status request * @param err_str In case of an err this string should be populated * @param len length of err_str buffer * * return : 0 in case of success. * -1 in case of failure. * */ int glusterd_handle_snapshot_status (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; char *volname = NULL; char *snapname = NULL; char *buf = NULL; glusterd_conf_t *conf = NULL; xlator_t *this = NULL; int32_t cmd = -1; int i = 0; dict_t *voldict = NULL; char key[PATH_MAX] = ""; glusterd_volinfo_t *volinfo = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_volinfo = NULL; this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); GF_ASSERT (req); GF_ASSERT (dict); GF_ASSERT (err_str); ret = dict_get_int32 (dict, "cmd", &cmd); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not get status type"); goto out; } switch (cmd) { case GF_SNAP_STATUS_TYPE_ALL: { /* IF we give "gluster snapshot status" * then lock is held on all snaps. * This is the place where necessary information * (snapname and snapcount)is populated in dictionary * for locking. */ ++i; list_for_each_entry (snap, &conf->snapshots, snap_list) { snprintf (key, sizeof (key), "snapname%d", i); buf = gf_strdup (snap->snapname); if (!buf) { ret = -1; goto out; } ret = dict_set_dynstr (dict, key, buf); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save snapname (%s) " "in the dictionary", snap->snapname); GF_FREE (buf); goto out; } buf = NULL; i++; } ret = dict_set_int32 (dict, "snapcount", i - 1); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not " "save snapcount in the dictionary"); goto out; } break; } case GF_SNAP_STATUS_TYPE_SNAP: { /* IF we give "gluster snapshot status " * then lock is held on single snap. * This is the place where necessary information * (snapname)is populated in dictionary * for locking. */ ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to fetch snap name"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { snprintf (err_str, len, "Snap (%s)" "does not exist", snapname); gf_log(this->name, GF_LOG_ERROR, "%s", err_str); ret = -1; goto out; } break; } case GF_SNAP_STATUS_TYPE_VOL: ret = dict_get_str (dict, "volname", &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to fetch volname"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, len, "Volume (%s) " "does not exist", volname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); goto out; } i = 1; list_for_each_entry (snap_volinfo, &volinfo->snap_volumes, snapvol_list) { snprintf (key, sizeof (key), "snapname%d", i); buf = gf_strdup (snap_volinfo->snapshot->snapname); if (!buf) { ret = -1; goto out; } ret = dict_set_dynstr (dict, key, buf); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save snapname"); GF_FREE (buf); goto out; } buf = NULL; i++; } ret = dict_set_int32 (dict, "snapcount", i-1); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save snapcount"); goto out; } break; default: { gf_log (this->name, GF_LOG_ERROR, "Unknown type"); ret = -1; goto out; } } ret = glusterd_mgmt_v3_initiate_snap_phases (req, op, dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to initiate " "snap phases"); goto out; } ret = 0; out: if (voldict) { dict_unref (voldict); } return ret; } /* This is a snapshot restore handler function. This function will be * executed in the originator node. This function is responsible for * calling mgmt_v3 framework to do the actual restore on all the bricks * * @param req RPC request object * @param op gluster operation * @param dict dictionary containing snapshot restore request * @param err_str In case of an err this string should be populated * @param len length of err_str buffer * * @return Negative value on Failure and 0 in success */ int glusterd_handle_snapshot_restore (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; char *snapname = NULL; char *buf = NULL; glusterd_conf_t *conf = NULL; xlator_t *this = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_volinfo = NULL; int32_t i = 0; char key[PATH_MAX] = ""; this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); GF_ASSERT (req); GF_ASSERT (dict); GF_ASSERT (err_str); ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "get snapname"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { snprintf (err_str, len, "Snap (%s) does not exist", snapname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); ret = -1; goto out; } list_for_each_entry (snap_volinfo, &snap->volumes, vol_list) { i++; snprintf (key, sizeof (key), "volname%d", i); buf = gf_strdup (snap_volinfo->parent_volname); if (!buf) { ret = -1; goto out; } ret = dict_set_dynstr (dict, key, buf); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not set " "parent volume name %s in the dict", snap_volinfo->parent_volname); GF_FREE (buf); goto out; } buf = NULL; } ret = dict_set_int32 (dict, "volcount", i); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save volume count"); goto out; } ret = glusterd_mgmt_v3_initiate_snap_phases (req, op, dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to initiate snap " "phases"); goto out; } ret = 0; out: return ret; } glusterd_snap_t* glusterd_create_snap_object (dict_t *dict, dict_t *rsp_dict) { char *snapname = NULL; uuid_t *snap_id = NULL; char *description = NULL; glusterd_snap_t *snap = NULL; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; int ret = -1; int64_t time_stamp = 0; this = THIS; priv = this->private; GF_ASSERT (dict); GF_ASSERT (rsp_dict); /* Fetch snapname, description, id and time from dict */ ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snapname"); goto out; } /* Ignore ret value for description*/ ret = dict_get_str (dict, "description", &description); ret = dict_get_bin (dict, "snap-id", (void **)&snap_id); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_id"); goto out; } ret = dict_get_int64 (dict, "snap-time", &time_stamp); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap-time"); goto out; } if (time_stamp <= 0) { ret = -1; gf_log (this->name, GF_LOG_ERROR, "Invalid time-stamp: %"PRId64, time_stamp); goto out; } list_for_each_entry (snap, &priv->snapshots, snap_list) { if (!strcmp (snap->snapname, snapname) || !uuid_compare (snap->snap_id, *snap_id)) { gf_log (THIS->name, GF_LOG_ERROR, "Found duplicate snap %s (%s)", snap->snapname, uuid_utoa (snap->snap_id)); ret = -1; break; } } if (ret) { snap = NULL; goto out; } snap = glusterd_new_snap_object (); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "Could not create " "the snap object for snap %s", snapname); goto out; } strcpy (snap->snapname, snapname); uuid_copy (snap->snap_id, *snap_id); snap->time_stamp = (time_t)time_stamp; /* Set the status as GD_SNAP_STATUS_INIT and once the backend snapshot is taken and snap is really ready to use, set the status to GD_SNAP_STATUS_IN_USE. This helps in identifying the incomplete snapshots and cleaning them up. */ snap->snap_status = GD_SNAP_STATUS_INIT; if (description) { snap->description = gf_strdup (description); if (snap->description == NULL) { gf_log (this->name, GF_LOG_ERROR, "Saving the Snap Description Failed"); ret = -1; goto out; } } ret = glusterd_store_snap (snap); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Could not store snap" "object %s", snap->snapname); goto out; } list_add_order (&snap->snap_list, &priv->snapshots, glusterd_compare_snap_time); gf_log (this->name, GF_LOG_TRACE, "Snap %s added to the list", snap->snapname); ret = 0; out: if (ret) { if (snap) glusterd_snap_remove (rsp_dict, snap, _gf_true, _gf_true); snap = NULL; } return snap; } /* Added missed_snap_entry to rsp_dict */ int32_t glusterd_add_missed_snaps_to_dict (dict_t *rsp_dict, glusterd_volinfo_t *snap_vol, glusterd_brickinfo_t *brickinfo, int32_t brick_number, int32_t op) { char *snap_uuid = NULL; char missed_snap_entry[PATH_MAX] = ""; char name_buf[PATH_MAX] = ""; int32_t missed_snap_count = -1; int32_t ret = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (rsp_dict); GF_ASSERT (snap_vol); GF_ASSERT (brickinfo); snap_uuid = gf_strdup (uuid_utoa (snap_vol->snapshot->snap_id)); if (!snap_uuid) { ret = -1; goto out; } snprintf (missed_snap_entry, sizeof(missed_snap_entry), "%s:%s=%s:%d:%s:%d:%d", uuid_utoa(brickinfo->uuid), snap_uuid, snap_vol->volname, brick_number, brickinfo->path, op, GD_MISSED_SNAP_PENDING); /* Fetch the missed_snap_count from the dict */ ret = dict_get_int32 (rsp_dict, "missed_snap_count", &missed_snap_count); if (ret) { /* Initialize the missed_snap_count for the first time */ missed_snap_count = 0; } /* Setting the missed_snap_entry in the rsp_dict */ snprintf (name_buf, sizeof(name_buf), "missed_snaps_%d", missed_snap_count); ret = dict_set_dynstr_with_alloc (rsp_dict, name_buf, missed_snap_entry); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set missed_snap_entry (%s) " "in the rsp_dict.", missed_snap_entry); goto out; } missed_snap_count++; /* Setting the new missed_snap_count in the dict */ ret = dict_set_int32 (rsp_dict, "missed_snap_count", missed_snap_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set missed_snap_count for %s " "in the rsp_dict.", missed_snap_entry); goto out; } out: if (snap_uuid) GF_FREE (snap_uuid); gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } /* This function actually calls the command (or the API) for taking the snapshot of the backend brick filesystem. If this is successful, then call the glusterd_snap_create function to create the snap object for glusterd */ int32_t glusterd_take_lvm_snapshot (glusterd_brickinfo_t *brickinfo, char *origin_brick_path) { char msg[NAME_MAX] = ""; char buf[PATH_MAX] = ""; char *ptr = NULL; char *origin_device = NULL; int ret = -1; gf_boolean_t match = _gf_false; runner_t runner = {0,}; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (brickinfo); GF_ASSERT (origin_brick_path); origin_device = glusterd_get_brick_mount_device (origin_brick_path); if (!origin_device) { gf_log (this->name, GF_LOG_ERROR, "getting device name for " "the brick %s failed", origin_brick_path); goto out; } /* Figuring out if setactivationskip flag is supported or not */ runinit (&runner); snprintf (msg, sizeof (msg), "running lvcreate help"); runner_add_args (&runner, LVM_CREATE, "--help", NULL); runner_log (&runner, "", GF_LOG_DEBUG, msg); runner_redir (&runner, STDOUT_FILENO, RUN_PIPE); ret = runner_start (&runner); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to run lvcreate help"); runner_end (&runner); goto out; } /* Looking for setactivationskip in lvcreate --help */ do { ptr = fgets(buf, sizeof(buf), runner_chio (&runner, STDOUT_FILENO)); if (ptr) { if (strstr(buf, "setactivationskip")) { match = _gf_true; break; } } } while (ptr != NULL); runner_end (&runner); /* Takng the actual snapshot */ runinit (&runner); snprintf (msg, sizeof (msg), "taking snapshot of the brick %s", origin_brick_path); if (match == _gf_true) runner_add_args (&runner, LVM_CREATE, "-s", origin_device, "--setactivationskip", "n", "--name", brickinfo->device_path, NULL); else runner_add_args (&runner, LVM_CREATE, "-s", origin_device, "--name", brickinfo->device_path, NULL); runner_log (&runner, this->name, GF_LOG_DEBUG, msg); ret = runner_run (&runner); if (ret) { gf_log (this->name, GF_LOG_ERROR, "taking snapshot of the " "brick (%s) of device %s failed", origin_brick_path, origin_device); } out: return ret; } int32_t glusterd_snap_brick_create (glusterd_volinfo_t *snap_volinfo, glusterd_brickinfo_t *brickinfo, int32_t brick_count) { int32_t ret = -1; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; char snap_brick_mount_path[PATH_MAX] = ""; struct stat statbuf = {0, }; this = THIS; priv = this->private; GF_ASSERT (snap_volinfo); GF_ASSERT (brickinfo); snprintf (snap_brick_mount_path, sizeof (snap_brick_mount_path), "%s/%s/brick%d", snap_mount_folder, snap_volinfo->volname, brick_count + 1); ret = mkdir_p (snap_brick_mount_path, 0777, _gf_true); if (ret) { gf_log (this->name, GF_LOG_ERROR, "creating the brick directory" " %s for the snapshot %s(device: %s) failed", snap_brick_mount_path, snap_volinfo->volname, brickinfo->device_path); goto out; } /* mount the snap logical device on the directory inside /run/gluster/snaps//@snap_brick_mount_path Way to mount the snap brick via mount api is this. ret = mount (device, snap_brick_mount_path, entry->mnt_type, MS_MGC_VAL, "nouuid"); But for now, mounting using runner apis. */ ret = glusterd_mount_lvm_snapshot (brickinfo->device_path, snap_brick_mount_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to mount lvm snapshot."); goto out; } ret = stat (brickinfo->path, &statbuf); if (ret) { gf_log (this->name, GF_LOG_WARNING, "stat of the brick %s" "(brick mount: %s) failed (%s)", brickinfo->path, snap_brick_mount_path, strerror (errno)); goto out; } ret = sys_lsetxattr (brickinfo->path, GF_XATTR_VOL_ID_KEY, snap_volinfo->volume_id, 16, XATTR_REPLACE); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "extended attribute %s on %s. Reason: " "%s, snap: %s", GF_XATTR_VOL_ID_KEY, brickinfo->path, strerror (errno), snap_volinfo->volname); goto out; } out: if (ret) { gf_log (this->name, GF_LOG_WARNING, "unmounting the snap brick" " mount %s", snap_brick_mount_path); #if !defined(GF_DARWIN_HOST_OS) && !defined(__NetBSD__) umount (snap_brick_mount_path); #else unmount (snap_brick_mount_path, 0); #endif } gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } static int32_t glusterd_add_brick_to_snap_volume (dict_t *dict, dict_t *rsp_dict, glusterd_volinfo_t *snap_vol, glusterd_brickinfo_t *original_brickinfo, int64_t volcount, int32_t brick_count) { char key[PATH_MAX] = ""; char *snap_brick_dir = NULL; char snap_brick_path[PATH_MAX] = ""; char *snap_device = NULL; glusterd_brickinfo_t *snap_brickinfo = NULL; gf_boolean_t add_missed_snap = _gf_false; int32_t ret = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); GF_ASSERT (snap_vol); GF_ASSERT (original_brickinfo); snprintf (key, sizeof(key), "vol%"PRId64".origin_brickpath%d", volcount, brick_count); ret = dict_set_dynstr_with_alloc (dict, key, original_brickinfo->path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } ret = glusterd_brickinfo_new (&snap_brickinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "initializing the brick for the snap " "volume failed (snapname: %s)", snap_vol->snapshot->snapname); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64".brickdir%d", volcount, brick_count); ret = dict_get_str (dict, key, &snap_brick_dir); if (ret) { /* Using original brickinfo here because it will be a * pending snapshot and storing the original brickinfo * will help in mapping while recreating the missed snapshot */ gf_log (this->name, GF_LOG_WARNING, "Unable to fetch " "snap mount path(%s). Adding to missed_snap_list", key); snap_brickinfo->snap_status = -1; snap_brick_dir = original_brickinfo->mount_dir; /* In origiator node add snaps missed * from different nodes to the dict */ if (is_origin_glusterd (dict) == _gf_true) add_missed_snap = _gf_true; } if ((snap_brickinfo->snap_status != -1) && (!uuid_compare (original_brickinfo->uuid, MY_UUID)) && (!glusterd_is_brick_started (original_brickinfo))) { /* In case if the brick goes down after prevalidate. */ gf_log (this->name, GF_LOG_WARNING, "brick %s:%s is not" " started (snap: %s)", original_brickinfo->hostname, original_brickinfo->path, snap_vol->snapshot->snapname); snap_brickinfo->snap_status = -1; add_missed_snap = _gf_true; } if (add_missed_snap) { ret = glusterd_add_missed_snaps_to_dict (rsp_dict, snap_vol, original_brickinfo, brick_count + 1, GF_SNAP_OPTION_TYPE_CREATE); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to add missed" " snapshot info for %s:%s in the rsp_dict", original_brickinfo->hostname, original_brickinfo->path); goto out; } } /* Create brick-path in the format /var/run/gluster/snaps/ * * //snap-brick-dir * */ snprintf (snap_brick_path, sizeof(snap_brick_path), "%s/%s/brick%d%s", snap_mount_folder, snap_vol->volname, brick_count+1, snap_brick_dir); snprintf (key, sizeof(key), "vol%"PRId64".brick_snapdevice%d", volcount, brick_count); ret = dict_get_str (dict, key, &snap_device); if (ret) { /* If the device name is empty, so will be the brick path * Hence the missed snap has already been added above */ gf_log (this->name, GF_LOG_ERROR, "Unable to fetch " "snap device (%s). Leaving empty", key); } else strcpy (snap_brickinfo->device_path, snap_device); ret = gf_canonicalize_path (snap_brick_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to canonicalize path"); goto out; } strcpy (snap_brickinfo->hostname, original_brickinfo->hostname); strcpy (snap_brickinfo->path, snap_brick_path); strcpy (snap_brickinfo->mount_dir, original_brickinfo->mount_dir); uuid_copy (snap_brickinfo->uuid, original_brickinfo->uuid); /* AFR changelog names are based on brick_id and hence the snap * volume's bricks must retain the same ID */ strcpy (snap_brickinfo->brick_id, original_brickinfo->brick_id); list_add_tail (&snap_brickinfo->brick_list, &snap_vol->bricks); out: if (ret && snap_brickinfo) GF_FREE (snap_brickinfo); gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } static int32_t glusterd_take_brick_snapshot (dict_t *dict, glusterd_volinfo_t *snap_vol, glusterd_brickinfo_t *brickinfo, int32_t volcount, int32_t brick_count) { char *origin_brick_path = NULL; char key[PATH_MAX] = ""; int32_t ret = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (snap_vol); GF_ASSERT (brickinfo); if (strlen(brickinfo->device_path) == 0) { gf_log (this->name, GF_LOG_ERROR, "Device path is empty " "brick %s:%s", brickinfo->hostname, brickinfo->path); ret = -1; goto out; } snprintf (key, sizeof(key) - 1, "vol%d.origin_brickpath%d", volcount, brick_count); ret = dict_get_str (dict, key, &origin_brick_path); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Unable to fetch " "brick path (%s)", key); goto out; } ret = glusterd_take_lvm_snapshot (brickinfo, origin_brick_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to take snapshot of " "brick %s:%s", brickinfo->hostname, origin_brick_path); goto out; } /* create the complete brick here */ ret = glusterd_snap_brick_create (snap_vol, brickinfo, brick_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "not able to" " create the brick for the snap %s" ", volume %s", snap_vol->snapshot->snapname, snap_vol->volname); goto out; } out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } glusterd_volinfo_t * glusterd_do_snap_vol (glusterd_volinfo_t *origin_vol, glusterd_snap_t *snap, dict_t *dict, dict_t *rsp_dict, int64_t volcount) { char key[PATH_MAX] = ""; char *username = NULL; char *password = NULL; glusterd_brickinfo_t *brickinfo = NULL; glusterd_conf_t *priv = NULL; glusterd_volinfo_t *snap_vol = NULL; uuid_t *snap_volid = NULL; int32_t ret = -1; int32_t brick_count = 0; xlator_t *this = NULL; int64_t brick_order = 0; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (dict); GF_ASSERT (origin_vol); GF_ASSERT (rsp_dict); /* fetch username, password and vol_id from dict*/ snprintf (key, sizeof(key), "volume%"PRId64"_username", volcount); ret = dict_get_str (dict, key, &username); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get %s for " "snap %s", key, snap->snapname); goto out; } snprintf (key, sizeof(key), "volume%"PRId64"_password", volcount); ret = dict_get_str (dict, key, &password); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get %s for " "snap %s", key, snap->snapname); goto out; } snprintf (key, sizeof(key) - 1, "vol%"PRId64"_volid", volcount); ret = dict_get_bin (dict, key, (void **)&snap_volid); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volid"); goto out; } /* We are not setting the username and password here as * we need to set the user name and password passed in * the dictionary */ ret = glusterd_volinfo_dup (origin_vol, &snap_vol, _gf_false); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to duplicate volinfo " "for the snapshot %s", snap->snapname); goto out; } /* uuid is used as lvm snapshot name. This will avoid restrictions on snapshot names provided by user */ GLUSTERD_GET_UUID_NOHYPHEN (snap_vol->volname, *snap_volid); uuid_copy (snap_vol->volume_id, *snap_volid); snap_vol->is_snap_volume = _gf_true; strcpy (snap_vol->parent_volname, origin_vol->volname); snap_vol->snapshot = snap; glusterd_auth_set_username (snap_vol, username); glusterd_auth_set_password (snap_vol, password); /* TODO : Sync before taking a snapshot */ /* Copy the status and config files of geo-replication before * taking a snapshot. During restore operation these files needs * to be copied back in /var/lib/glusterd/georeplication/ */ ret = glusterd_copy_geo_rep_files (origin_vol, snap_vol, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to copy geo-rep " "config and status files for volume %s", origin_vol->volname); goto out; } /* Adding snap brickinfos to the snap volinfo */ brick_count = 0; list_for_each_entry (brickinfo, &origin_vol->bricks, brick_list) { ret = glusterd_add_brick_to_snap_volume (dict, rsp_dict, snap_vol, brickinfo, volcount, brick_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to add the snap brick for " "%s:%s to the snap volume", brickinfo->hostname, brickinfo->path); goto out; } brick_count++; } ret = glusterd_store_volinfo (snap_vol, GLUSTERD_VOLINFO_VER_AC_INCREMENT); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to store snapshot " "volinfo (%s) for snap %s", snap_vol->volname, snap->snapname); goto out; } ret = glusterd_copy_quota_files (origin_vol, snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to copy quota " "config and cksum for volume %s", origin_vol->volname); goto out; } ret = generate_brick_volfiles (snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "generating the brick " "volfiles for the snap %s (volume: %s) failed", snap->snapname, origin_vol->volname); goto out; } ret = generate_client_volfiles (snap_vol, GF_CLIENT_TRUSTED); if (ret) { gf_log (this->name, GF_LOG_ERROR, "generating the trusted " "client volfiles for the snap %s (volume: %s) failed", snap->snapname, origin_vol->volname); goto out; } ret = generate_client_volfiles (snap_vol, GF_CLIENT_OTHER); if (ret) { gf_log (this->name, GF_LOG_ERROR, "generating the client " "volfiles for the snap %s (volume: %s) failed", snap->snapname, origin_vol->volname); goto out; } ret = glusterd_list_add_snapvol (origin_vol, snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "could not add the snap " "volume %s to the list", snap_vol->volname); goto out; } out: if (ret) { if (snap_vol) glusterd_snap_volume_remove (rsp_dict, snap_vol, _gf_true, _gf_true); snap_vol = NULL; } return snap_vol; } /*This is the prevalidate function for both activate and deactive of snap * For Activate operation pass is_op_activate as _gf_true * For Deactivate operation pass is_op_activate as _gf_false * */ int glusterd_snapshot_activate_deactivate_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict, gf_boolean_t is_op_activate) { int32_t ret = -1; char *snapname = NULL; xlator_t *this = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_volinfo = NULL; char err_str[PATH_MAX] = ""; gf_loglevel_t loglevel = GF_LOG_ERROR; glusterd_volume_status volume_status = GLUSTERD_STATUS_STOPPED; int flags = 0; this = THIS; if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting the snap name " "failed"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { snprintf (err_str, sizeof (err_str), "Snap %s does not exist.", snapname); ret = -1; goto out; } /*If its activation of snap then fetch the flags*/ if (is_op_activate) { ret = dict_get_int32 (dict, "flags", &flags); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to get flags"); goto out; } } /* TODO : As of now there is only volume in snapshot. * Change this when multiple volume snapshot is introduced */ snap_volinfo = list_entry (snap->volumes.next, glusterd_volinfo_t, vol_list); if (!snap_volinfo) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volinfo"); ret = -1; goto out; } /*TODO: When multiple snapvolume are involved a cummulative * logic is required to tell whether is snapshot is * started/partially started/stopped*/ if (is_op_activate) { volume_status = GLUSTERD_STATUS_STARTED; } if (snap_volinfo->status == volume_status) { if (is_op_activate) { /* if flag is to GF_CLI_FLAG_OP_FORCE * try to start the snap volume, even * if the volume_status is GLUSTERD_STATUS_STARTED. * By doing so we try to bring * back the brick processes that are down*/ if (!(flags & GF_CLI_FLAG_OP_FORCE)) { snprintf (err_str, sizeof (err_str), "Snap %s is already activated.", snapname); ret = -1; } } else { snprintf (err_str, sizeof (err_str), "Snap %s is already deactivated.", snapname); ret = -1; } goto out; } ret = 0; out: if (ret && err_str[0] != '\0') { gf_log (this->name, loglevel, "%s", err_str); *op_errstr = gf_strdup (err_str); } return ret; } /* This is a snapshot remove handler function. This function will be * executed in the originator node. This function is responsible for * calling mgmt v3 framework to do the actual remove on all the bricks * * @param req RPC request object * @param op gluster operation * @param dict dictionary containing snapshot remove request * @param err_str In case of an err this string should be populated * @param len length of err_str buffer * * @return Negative value on Failure and 0 in success */ int glusterd_handle_snapshot_remove (rpcsvc_request_t *req, glusterd_op_t op, dict_t *dict, char *err_str, size_t len) { int ret = -1; int64_t volcount = 0; char *snapname = NULL; char *volname = NULL; char key[PATH_MAX] = ""; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_vol = NULL; glusterd_volinfo_t *tmp = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (req); GF_ASSERT (dict); GF_ASSERT (err_str); ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get snapname"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { snprintf (err_str, len, "Snap (%s) does not exist", snapname); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); ret = -1; goto out; } /* Set volnames in the dict to get mgmt_v3 lock */ list_for_each_entry_safe (snap_vol, tmp, &snap->volumes, vol_list) { volcount++; volname = gf_strdup (snap_vol->parent_volname); if (!volname) { ret = -1; gf_log (this->name, GF_LOG_ERROR, "strdup failed"); goto out; } snprintf (key, sizeof (key), "volname%"PRId64, volcount); ret = dict_set_dynstr (dict, key, volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set " "volume name in dictionary"); GF_FREE (volname); goto out; } volname = NULL; } ret = dict_set_int64 (dict, "volcount", volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set volcount"); goto out; } ret = glusterd_mgmt_v3_initiate_snap_phases (req, op, dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to initiate snap " "phases"); goto out; } ret = 0; out: return ret; } int glusterd_snapshot_remove_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; char *snapname = NULL; xlator_t *this = NULL; glusterd_snap_t *snap = NULL; this = THIS; if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting the snap name " "failed"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "Snap %s does not exist", snapname); ret = -1; goto out; } ret = 0; out: return ret; } int glusterd_snapshot_status_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int ret = -1; char *snapname = NULL; glusterd_conf_t *conf = NULL; xlator_t *this = NULL; int32_t cmd = -1; glusterd_volinfo_t *volinfo = NULL; char *volname = NULL; this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); GF_ASSERT (op_errstr); if (!dict) { gf_log (this->name, GF_LOG_ERROR, "Input dict is NULL"); goto out; } ret = dict_get_int32 (dict, "cmd", &cmd); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not fetch status cmd"); goto out; } switch (cmd) { case GF_SNAP_STATUS_TYPE_ALL: { break; } case GF_SNAP_STATUS_TYPE_SNAP: { ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not fetch snapname"); goto out; } if (!glusterd_find_snap_by_name (snapname)) { ret = gf_asprintf (op_errstr, "Snap (%s) " "not found", snapname); if (ret < 0) { goto out; } ret = -1; gf_log (this->name, GF_LOG_ERROR, "Snap (%s) " "not found", snapname); goto out; } break; } case GF_SNAP_STATUS_TYPE_VOL: { ret = dict_get_str (dict, "volname", &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not fetch volname"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { ret = gf_asprintf (op_errstr, "Volume (%s)" "not found", volname); if (ret < 0) { goto out; } ret = -1; gf_log (this->name, GF_LOG_ERROR, "Volume " "%s not present", volname); goto out; } break; } default: { gf_log (this->name, GF_LOG_ERROR, "Invalid command"); break; } } ret = 0; out: return ret; } int32_t glusterd_snapshot_activate_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; char *snapname = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_volinfo = NULL; xlator_t *this = NULL; int flags = 0; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); GF_ASSERT (op_errstr); if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting the snap name " "failed"); goto out; } ret = dict_get_int32 (dict, "flags", &flags); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to get flags"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "Snap %s does not exist", snapname); ret = -1; goto out; } /* TODO : As of now there is only volume in snapshot. * Change this when multiple volume snapshot is introduced */ snap_volinfo = list_entry (snap->volumes.next, glusterd_volinfo_t, vol_list); if (!snap_volinfo) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volinfo"); ret = -1; goto out; } ret = glusterd_start_volume (snap_volinfo, flags, _gf_true); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to activate snap volume %s of the snap %s", snap_volinfo->volname, snap->snapname); goto out; } ret = 0; out: return ret; } int32_t glusterd_snapshot_deactivate_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; char *snapname = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *snap_volinfo = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); GF_ASSERT (op_errstr); if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting the snap name " "failed"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "Snap %s does not exist", snapname); ret = -1; goto out; } /* TODO : As of now there is only volume in snapshot. * Change this when multiple volume snapshot is introduced */ snap_volinfo = list_entry (snap->volumes.next, glusterd_volinfo_t, vol_list); if (!snap_volinfo) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volinfo"); ret = -1; goto out; } ret = glusterd_stop_volume (snap_volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to deactivate" "snap %s", snapname); goto out; } ret = 0; out: return ret; } int32_t glusterd_snapshot_remove_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; char *snapname = NULL; char *dup_snapname = NULL; glusterd_snap_t *snap = NULL; glusterd_conf_t *priv = NULL; glusterd_volinfo_t *snap_volinfo = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); GF_ASSERT (op_errstr); priv = this->private; GF_ASSERT (priv); if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting the snap name " "failed"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "Snap %s does not exist", snapname); ret = -1; goto out; } if (is_origin_glusterd (dict) == _gf_true) { /* TODO : As of now there is only volume in snapshot. * Change this when multiple volume snapshot is introduced */ snap_volinfo = list_entry (snap->volumes.next, glusterd_volinfo_t, vol_list); if (!snap_volinfo) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snap_volinfo"); ret = -1; goto out; } /* From origin glusterd check if * * any peers with snap bricks is down */ ret = glusterd_find_missed_snap (rsp_dict, snap_volinfo, &priv->peers, GF_SNAP_OPTION_TYPE_DELETE); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to find missed snap deletes"); goto out; } } ret = glusterd_snap_remove (rsp_dict, snap, _gf_true, _gf_false); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to remove snap %s", snapname); goto out; } dup_snapname = gf_strdup (snapname); if (!dup_snapname) { gf_log (this->name, GF_LOG_ERROR, "Strdup failed"); ret = -1; goto out; } ret = dict_set_dynstr (rsp_dict, "snapname", dup_snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set the snapname"); GF_FREE (dup_snapname); goto out; } ret = 0; out: return ret; } int32_t glusterd_do_snap_cleanup (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; char *name = NULL; xlator_t *this = NULL; glusterd_conf_t *conf = NULL; glusterd_volinfo_t *volinfo = NULL; glusterd_snap_t *snap = NULL; this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); if (!dict || !op_errstr) { gf_log (this->name, GF_LOG_ERROR, "input parameters NULL"); goto out; } ret = dict_get_str (dict, "snapname", &name); if (ret) { gf_log (this->name, GF_LOG_ERROR, "getting the snap " "name failed (volume: %s)", volinfo->volname); goto out; } /* If the snapname is not found that means the failure happened at staging, or in commit, before the snap object is created, in which case there is nothing to cleanup. So set ret to 0. */ snap = glusterd_find_snap_by_name (name); if (!snap) { gf_log (this->name, GF_LOG_INFO, "snap %s is not found", name); ret = 0; goto out; } ret = glusterd_snap_remove (rsp_dict, snap, _gf_true, _gf_true); if (ret) { /* Ignore failure as this is a cleanup of half cooked snapshot */ gf_log (this->name, GF_LOG_DEBUG, "removing the snap %s failed", name); ret = 0; } name = NULL; ret = 0; out: return ret; } /* In case of a successful, delete or create operation, during post_validate * * look for missed snap operations and update the missed snap lists */ int32_t glusterd_snapshot_update_snaps_post_validate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t ret = -1; int32_t missed_snap_count = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); GF_ASSERT (op_errstr); ret = dict_get_int32 (dict, "missed_snap_count", &missed_snap_count); if (ret) { gf_log (this->name, GF_LOG_DEBUG, "No missed snaps"); ret = 0; goto out; } ret = glusterd_add_missed_snaps_to_list (dict, missed_snap_count); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to add missed snaps to list"); goto out; } ret = glusterd_store_update_missed_snaps (); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to update missed_snaps_list"); goto out; } out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int glusterd_take_brick_snapshot_task (void *opaque) { int ret = 0; snap_create_args_t *snap_args = NULL; char key[PATH_MAX] = ""; GF_ASSERT (opaque); snap_args = (snap_create_args_t*) opaque; THIS = snap_args->this; ret = glusterd_take_brick_snapshot (snap_args->dict, snap_args->snap_vol, snap_args->brickinfo, snap_args->volcount, snap_args->brickorder); if (ret) { gf_log (THIS->name, GF_LOG_ERROR, "Failed to " "take backend snapshot for brick " "%s:%s volume(%s)", snap_args->brickinfo->hostname, snap_args->brickinfo->path, snap_args->snap_vol->volname); } snprintf (key, sizeof (key), "snap-vol%d.brick%d.status", snap_args->volcount, snap_args->brickorder); if (dict_set_int32 (snap_args->rsp_dict, key, (ret)?0:1)) { gf_log (THIS->name, GF_LOG_ERROR, "failed to " "add %s to dict", key); ret = -1; goto out; } out: return ret; } int32_t glusterd_take_brick_snapshot_cbk (int ret, call_frame_t *frame, void *opaque) { snap_create_args_t *snap_args = NULL; struct syncargs *args = NULL; GF_ASSERT (opaque); snap_args = (snap_create_args_t*) opaque; args = snap_args->args; if (ret) args->op_ret = ret; GF_FREE (opaque); synctask_barrier_wake(args); return 0; } int32_t glusterd_schedule_brick_snapshot (dict_t *dict, dict_t *rsp_dict, glusterd_snap_t *snap) { int ret = -1; int32_t volcount = 0; int32_t brickcount = 0; int32_t brickorder = 0; int32_t taskcount = 0; char key[PATH_MAX] = ""; xlator_t *this = NULL; glusterd_volinfo_t *snap_vol = NULL; glusterd_brickinfo_t *brickinfo = NULL; struct syncargs args = {0}; snap_create_args_t *snap_args = NULL; this = THIS; GF_ASSERT(this); GF_ASSERT(dict); GF_ASSERT(snap); synctask_barrier_init ((&args)); list_for_each_entry (snap_vol, &snap->volumes, vol_list) { volcount++; brickcount = 0; brickorder = 0; list_for_each_entry (brickinfo, &snap_vol->bricks, brick_list) { snprintf (key, sizeof(key) - 1, "snap-vol%d.brick%d.order", volcount, brickcount); ret = dict_set_int32 (rsp_dict, key, brickorder); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set %s", key); goto out; } if ((uuid_compare (brickinfo->uuid, MY_UUID)) || (brickinfo->snap_status == -1)) { if (!uuid_compare (brickinfo->uuid, MY_UUID)) { brickcount++; snprintf (key, sizeof (key), "snap-vol%d.brick%d.status", volcount, brickorder); ret = dict_set_int32 (rsp_dict, key, 0); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to add %s to " "dict", key); goto out; } } brickorder++; continue; } snap_args = GF_CALLOC (1, sizeof (*snap_args), gf_gld_mt_snap_create_args_t); if (!snap_args) { ret = -1; goto out; } snap_args->this = this; snap_args->dict = dict; snap_args->rsp_dict = rsp_dict; snap_args->snap_vol = snap_vol; snap_args->brickinfo = brickinfo; snap_args->volcount = volcount; snap_args->brickcount = brickcount; snap_args->brickorder = brickorder; snap_args->args = &args; ret = synctask_new (this->ctx->env, glusterd_take_brick_snapshot_task, glusterd_take_brick_snapshot_cbk, NULL, snap_args); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "spawn task for snapshot create"); GF_FREE (snap_args); goto out; } taskcount++; brickcount++; brickorder++; } snprintf (key, sizeof (key), "snap-vol%d_brickcount", volcount); ret = dict_set_int64 (rsp_dict, key, brickcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "add %s to dict", key); goto out; } } synctask_barrier_wait ((&args), taskcount); taskcount = 0; if (args.op_ret) gf_log (this->name, GF_LOG_ERROR, "Failed to create snapshot"); ret = args.op_ret; out: if (ret && taskcount) synctask_barrier_wait ((&args), taskcount); return ret; } int32_t glusterd_snapshot_create_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int ret = -1; int64_t i = 0; int64_t volcount = 0; char *snapname = NULL; char *volname = NULL; char *tmp_name = NULL; char key[PATH_MAX] = ""; xlator_t *this = NULL; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *origin_vol = NULL; glusterd_volinfo_t *snap_vol = NULL; glusterd_brickinfo_t *brickinfo = NULL; glusterd_conf_t *priv = NULL; this = THIS; GF_ASSERT(this); GF_ASSERT(dict); GF_ASSERT(op_errstr); GF_ASSERT(rsp_dict); priv = this->private; GF_ASSERT(priv); ret = dict_get_int64 (dict, "volcount", &volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to " "get the volume count"); goto out; } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch snapname"); goto out; } tmp_name = gf_strdup (snapname); if (!tmp_name) { gf_log (this->name, GF_LOG_ERROR, "Out of memory"); ret = -1; goto out; } ret = dict_set_dynstr (rsp_dict, "snapname", tmp_name); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to set snapname in rsp_dict"); GF_FREE (tmp_name); goto out; } tmp_name = NULL; snap = glusterd_create_snap_object (dict, rsp_dict); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "creating the" "snap object %s failed", snapname); ret = -1; goto out; } for (i = 1; i <= volcount; i++) { snprintf (key, sizeof (key), "volname%"PRId64, i); ret = dict_get_str (dict, key, &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get volume name"); goto out; } ret = glusterd_volinfo_find (volname, &origin_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get the volinfo for " "the volume %s", volname); goto out; } snap_vol = glusterd_do_snap_vol (origin_vol, snap, dict, rsp_dict, i); if (!snap_vol) { ret = -1; gf_log (this->name, GF_LOG_WARNING, "taking the " "snapshot of the volume %s failed", volname); goto out; } } ret = dict_set_int64 (rsp_dict, "volcount", volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to set volcount"); goto out; } ret = glusterd_schedule_brick_snapshot (dict, rsp_dict, snap); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to take backend " "snapshot %s", snap->snapname); goto out; } /*TODO: As of now start the bricks as part of snapshot creation op. brick_start releases the big_lock and this can cause regression for bug# 1088355. We need to fix brick_connect not to release big_lock*/ list_for_each_entry (snap_vol, &snap->volumes, vol_list) { list_for_each_entry (brickinfo, &snap_vol->bricks, brick_list) { ret = glusterd_brick_start (snap_vol, brickinfo, _gf_false); if (ret) { gf_log (this->name, GF_LOG_WARNING, "starting " "the brick %s:%s for the snap %s " "(volume: %s) failed", brickinfo->hostname, brickinfo->path, snap_vol->snapshot->snapname, snap_vol->volname); goto out; } } snap_vol->status = GLUSTERD_STATUS_STARTED; ret = glusterd_store_volinfo (snap_vol, GLUSTERD_VOLINFO_VER_AC_INCREMENT); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to store " "snap volinfo %s", snap_vol->volname); goto out; } } out: if (ret) { if (snap) glusterd_snap_remove (rsp_dict, snap, _gf_true, _gf_true); snap = NULL; } gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int snap_max_hard_limit_set_commit (dict_t *dict, uint64_t value, char *volname, char **op_errstr) { char err_str[PATH_MAX] = ""; glusterd_conf_t *conf = NULL; glusterd_volinfo_t *volinfo = NULL; int ret = -1; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); /* TODO: Initiate auto deletion when there is a limit change */ if (!volname) { /* For system limit */ conf->snap_max_hard_limit = value; ret = glusterd_store_global_info (this); if (ret) { snprintf (err_str, PATH_MAX, "Failed to store " "snap-max-hard-limit for system"); goto out; } } else { /* For one volume */ ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { snprintf (err_str, PATH_MAX, "Failed to get the" " volinfo for volume %s", volname); goto out; } volinfo->snap_max_hard_limit = value; ret = glusterd_store_volinfo (volinfo, GLUSTERD_VOLINFO_VER_AC_INCREMENT); if (ret) { snprintf (err_str, PATH_MAX, "Failed to store " "snap-max-hard-limit for volume %s", volname); goto out; } } ret = 0; out: if (ret) { *op_errstr = gf_strdup (err_str); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); } return ret; } int glusterd_snapshot_config_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { char *volname = NULL; xlator_t *this = NULL; int ret = -1; char err_str[PATH_MAX] = {0,}; glusterd_conf_t *conf = NULL; int config_command = 0; uint64_t hard_limit = 0; uint64_t soft_limit = 0; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); ret = dict_get_int32 (dict, "config-command", &config_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get config-command type"); goto out; } /* Ignore the return value of the following dict_get, * as they are optional */ ret = dict_get_str (dict, "volname", &volname); ret = dict_get_uint64 (dict, "snap-max-hard-limit", &hard_limit); ret = dict_get_uint64 (dict, "snap-max-soft-limit", &soft_limit); switch (config_command) { case GF_SNAP_CONFIG_TYPE_SET: if (hard_limit) { /* Commit ops for snap-max-hard-limit */ ret = snap_max_hard_limit_set_commit (dict, hard_limit, volname, op_errstr); if (ret) { gf_log (this->name, GF_LOG_ERROR, "snap-max-hard-limit set " "commit failed."); goto out; } } if (soft_limit) { /* For system limit */ conf->snap_max_soft_limit = soft_limit; ret = glusterd_store_global_info (this); if (ret) { snprintf (err_str, PATH_MAX, "Failed to store " "snap-max-soft-limit for system"); *op_errstr = gf_strdup (err_str); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); goto out; } } break; default: break; } out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } int glusterd_get_brick_lvm_details (dict_t *rsp_dict, glusterd_brickinfo_t *brickinfo, char *volname, char *device, char *key_prefix) { int ret = -1; glusterd_conf_t *priv = NULL; runner_t runner = {0,}; xlator_t *this = NULL; char msg[PATH_MAX] = ""; char buf[PATH_MAX] = ""; char *ptr = NULL; char *token = NULL; char key[PATH_MAX] = ""; char *value = NULL; GF_ASSERT (rsp_dict); GF_ASSERT (brickinfo); GF_ASSERT (volname); this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); device = glusterd_get_brick_mount_device (brickinfo->path); if (!device) { gf_log (this->name, GF_LOG_ERROR, "Getting device name for " "the brick %s:%s failed", brickinfo->hostname, brickinfo->path); goto out; } runinit (&runner); snprintf (msg, sizeof (msg), "running lvs command, " "for getting snap status"); /* Using lvs command fetch the Volume Group name, * Percentage of data filled and Logical Volume size * * "-o" argument is used to get the desired information, * example : "lvs /dev/VolGroup/thin_vol -o vgname,lv_size", * will get us Volume Group name and Logical Volume size. * * Here separator used is ":", * for the above given command with separator ":", * The output will be "vgname:lvsize" */ runner_add_args (&runner, LVS, device, "--noheading", "-o", "vg_name,data_percent,lv_size", "--separator", ":", NULL); runner_redir (&runner, STDOUT_FILENO, RUN_PIPE); runner_log (&runner, "", GF_LOG_DEBUG, msg); ret = runner_start (&runner); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not perform lvs action"); goto end; } do { ptr = fgets (buf, sizeof (buf), runner_chio (&runner, STDOUT_FILENO)); if (ptr == NULL) break; token = strtok (buf, ":"); if (token != NULL) { while (token && token[0] == ' ') token++; if (!token) { ret = -1; gf_log (this->name, GF_LOG_ERROR, "Invalid vg entry"); goto end; } value = gf_strdup (token); if (!value) { ret = -1; goto end; } ret = snprintf (key, sizeof (key), "%s.vgname", key_prefix); if (ret < 0) { goto end; } ret = dict_set_dynstr (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save vgname "); goto end; } } token = strtok (NULL, ":"); if (token != NULL) { value = gf_strdup (token); if (!value) { ret = -1; goto end; } ret = snprintf (key, sizeof (key), "%s.data", key_prefix); if (ret < 0) { goto end; } ret = dict_set_dynstr (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save data percent "); goto end; } } token = strtok (NULL, ":"); if (token != NULL) { value = gf_strdup (token); if (!value) { ret = -1; goto end; } ret = snprintf (key, sizeof (key), "%s.lvsize", key_prefix); if (ret < 0) { goto end; } ret = dict_set_dynstr (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save meta data percent "); goto end; } } } while (ptr != NULL); ret = 0; end: runner_end (&runner); out: if (ret && value) { GF_FREE (value); } return ret; } int glusterd_get_single_brick_status (char **op_errstr, dict_t *rsp_dict, char *keyprefix, int index, glusterd_volinfo_t *snap_volinfo, glusterd_brickinfo_t *brickinfo) { int ret = -1; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; char key[PATH_MAX] = ""; char *device = NULL; char *value = NULL; char brick_path[PATH_MAX] = ""; char pidfile[PATH_MAX] = ""; pid_t pid = -1; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); GF_ASSERT (keyprefix); GF_ASSERT (snap_volinfo); GF_ASSERT (brickinfo); ret = snprintf (key, sizeof (key), "%s.brick%d.path", keyprefix, index); if (ret < 0) { goto out; } ret = snprintf (brick_path, sizeof (brick_path), "%s:%s", brickinfo->hostname, brickinfo->path); if (ret < 0) { goto out; } value = gf_strdup (brick_path); if (!value) { ret = -1; goto out; } ret = dict_set_dynstr (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to store " "brick_path %s", brickinfo->path); goto out; } if (brickinfo->snap_status == -1) { /* Setting vgname as "Pending Snapshot" */ value = gf_strdup ("Pending Snapshot"); if (!value) { ret = -1; goto out; } snprintf (key, sizeof (key), "%s.brick%d.vgname", keyprefix, index); ret = dict_set_dynstr (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save vgname "); goto out; } ret = 0; goto out; } value = NULL; ret = snprintf (key, sizeof (key), "%s.brick%d.status", keyprefix, index); if (ret < 0) { goto out; } if (brickinfo->status == GF_BRICK_STOPPED) { value = gf_strdup ("No"); if (!value) { ret = -1; goto out; } ret = dict_set_str (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save brick status"); goto out; } value = NULL; } else { value = gf_strdup ("Yes"); if (!value) { ret = -1; goto out; } ret = dict_set_str (rsp_dict, key, value); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save brick status"); goto out; } value = NULL; GLUSTERD_GET_BRICK_PIDFILE (pidfile, snap_volinfo, brickinfo, priv); ret = gf_is_service_running (pidfile, &pid); ret = snprintf (key, sizeof (key), "%s.brick%d.pid", keyprefix, index); if (ret < 0) { goto out; } ret = dict_set_int32 (rsp_dict, key, pid); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save pid %d", pid); goto out; } } ret = snprintf (key, sizeof (key), "%s.brick%d", keyprefix, index); if (ret < 0) { goto out; } ret = glusterd_get_brick_lvm_details (rsp_dict, brickinfo, snap_volinfo->volname, device, key); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get " "brick LVM details"); goto out; } out: if (ret && value) { GF_FREE (value); } return ret; } int glusterd_get_single_snap_status (char **op_errstr, dict_t *rsp_dict, char *keyprefix, glusterd_snap_t *snap) { int ret = -1; xlator_t *this = NULL; char key[PATH_MAX] = ""; char brickkey[PATH_MAX] = ""; glusterd_volinfo_t *snap_volinfo = NULL; glusterd_volinfo_t *tmp_volinfo = NULL; glusterd_brickinfo_t *brickinfo = NULL; int volcount = 0; int brickcount = 0; this = THIS; GF_ASSERT (this); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); GF_ASSERT (keyprefix); GF_ASSERT (snap); list_for_each_entry_safe (snap_volinfo, tmp_volinfo, &snap->volumes, vol_list) { ret = snprintf (key, sizeof (key), "%s.vol%d", keyprefix, volcount); if (ret < 0) { goto out; } list_for_each_entry (brickinfo, &snap_volinfo->bricks, brick_list) { if (!glusterd_is_local_brick (this, snap_volinfo, brickinfo)) { brickcount++; continue; } ret = glusterd_get_single_brick_status (op_errstr, rsp_dict, key, brickcount, snap_volinfo, brickinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Getting " "single snap status failed"); goto out; } brickcount++; } ret = snprintf (brickkey, sizeof (brickkey), "%s.brickcount", key); if (ret < 0) { goto out; } ret = dict_set_int32 (rsp_dict, brickkey, brickcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save brick count"); goto out; } volcount++; } ret = snprintf (key, sizeof (key), "%s.volcount", keyprefix); if (ret < 0) { goto out; } ret = dict_set_int32 (rsp_dict, key, volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save volcount"); goto out; } out: return ret; } int glusterd_get_each_snap_object_status (char **op_errstr, dict_t *rsp_dict, glusterd_snap_t *snap, char *keyprefix) { int ret = -1; char key[PATH_MAX] = ""; char *temp = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); GF_ASSERT (snap); GF_ASSERT (keyprefix); /* TODO : Get all the snap volume info present in snap object, * as of now, There will be only one snapvolinfo per snap object */ ret = snprintf (key, sizeof (key), "%s.snapname", keyprefix); if (ret < 0) { goto out; } temp = gf_strdup (snap->snapname); if (temp == NULL) { ret = -1; goto out; } ret = dict_set_dynstr (rsp_dict, key, temp); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save " "snap name"); goto out; } temp = NULL; ret = snprintf (key, sizeof (key), "%s.uuid", keyprefix); if (ret < 0) { goto out; } temp = gf_strdup (uuid_utoa (snap->snap_id)); if (temp == NULL) { ret = -1; goto out; } ret = dict_set_dynstr (rsp_dict, key, temp); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save " "snap UUID"); goto out; } temp = NULL; ret = glusterd_get_single_snap_status (op_errstr, rsp_dict, keyprefix, snap); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not get single snap status"); goto out; } ret = snprintf (key, sizeof (key), "%s.volcount", keyprefix); if (ret < 0) { goto out; } ret = dict_set_int32 (rsp_dict, key, 1); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save volcount"); goto out; } out: if (ret && temp) GF_FREE (temp); return ret; } int glusterd_get_snap_status_of_volume (char **op_errstr, dict_t *rsp_dict, char *volname, char *keyprefix) { int ret = -1; glusterd_volinfo_t *snap_volinfo = NULL; glusterd_volinfo_t *temp_volinfo = NULL; glusterd_volinfo_t *volinfo = NULL; char key[PATH_MAX] = ""; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; int i = 0; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (op_errstr); GF_ASSERT (rsp_dict); GF_ASSERT (volname); GF_ASSERT (keyprefix); ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get volinfo of " "volume %s", volname); goto out; } list_for_each_entry_safe (snap_volinfo, temp_volinfo, &volinfo->snap_volumes, snapvol_list) { ret = snprintf (key, sizeof (key), "status.snap%d", i); if (ret < 0) { goto out; } ret = glusterd_get_each_snap_object_status (op_errstr, rsp_dict, snap_volinfo->snapshot, key); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Function : " "glusterd_get_single_snap_status failed"); goto out; } i++; } ret = dict_set_int32 (rsp_dict, "status.snapcount", i); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to save snapcount"); ret = -1; goto out; } out: return ret; } int glusterd_get_all_snapshot_status (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int32_t i = 0; int ret = -1; char key[PATH_MAX] = ""; glusterd_conf_t *priv = NULL; glusterd_snap_t *snap = NULL; glusterd_snap_t *tmp_snap = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (dict); GF_ASSERT (op_errstr); list_for_each_entry_safe (snap, tmp_snap, &priv->snapshots, snap_list) { ret = snprintf (key, sizeof (key), "status.snap%d", i); if (ret < 0) { goto out; } ret = glusterd_get_each_snap_object_status (op_errstr, rsp_dict, snap, key); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not get " "the details of a snap object: %s", snap->snapname); goto out; } i++; } ret = dict_set_int32 (rsp_dict, "status.snapcount", i); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save snapcount"); goto out; } ret = 0; out: return ret; } int glusterd_snapshot_status_commit (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { xlator_t *this = NULL; int ret = -1; glusterd_conf_t *conf = NULL; char *get_buffer = NULL; int32_t cmd = -1; char *snapname = NULL; glusterd_snap_t *snap = NULL; char *volname = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (op_errstr); conf = this->private; GF_ASSERT (conf); ret = dict_get_int32 (dict, "cmd", &cmd); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to get status cmd type"); goto out; } ret = dict_set_int32 (rsp_dict, "cmd", cmd); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not save status cmd in rsp dictionary"); goto out; } switch (cmd) { case GF_SNAP_STATUS_TYPE_ALL: { ret = glusterd_get_all_snapshot_status (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to " "get snapshot status"); goto out; } break; } case GF_SNAP_STATUS_TYPE_SNAP: { ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to " "get snap name"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { ret = gf_asprintf (op_errstr, "Snap (%s) " "not found", snapname); if (ret < 0) { goto out; } ret = -1; gf_log (this->name, GF_LOG_ERROR, "Unable to " "get snap volinfo"); goto out; } ret = glusterd_get_each_snap_object_status (op_errstr, rsp_dict, snap, "status.snap0"); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to " "get status of snap %s", get_buffer); goto out; } break; } case GF_SNAP_STATUS_TYPE_VOL: { ret = dict_get_str (dict, "volname", &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to" " get volume name"); goto out; } ret = glusterd_get_snap_status_of_volume (op_errstr, rsp_dict, volname, "status.vol0"); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Function :" " glusterd_get_snap_status_of_volume " "failed"); goto out; } } } ret = 0; out: return ret; } int32_t glusterd_handle_snap_limit (dict_t *dict, dict_t *rsp_dict) { int32_t ret = -1; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; uint64_t effective_max_limit = 0; int64_t volcount = 0; int64_t i = 0; char *volname = NULL; char key[PATH_MAX] = {0, }; glusterd_volinfo_t *volinfo = NULL; uint64_t limit = 0; int64_t count = 0; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *tmp_volinfo = NULL; glusterd_volinfo_t *other_volinfo = NULL; int64_t var = 0; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); priv = this->private; GF_ASSERT (priv); ret = dict_get_int64 (dict, "volcount", &volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get the volcount"); goto out; } for (i = 1; i <= volcount; i++) { snprintf (key, sizeof (key), "volname%ld", i); ret = dict_get_str (dict, key, &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get the " "volname"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "volinfo for %s " "not found", volname); goto out; } /* The minimum of the 2 limits i.e system wide limit and volume wide limit will be considered */ if (volinfo->snap_max_hard_limit < priv->snap_max_hard_limit) effective_max_limit = volinfo->snap_max_hard_limit; else effective_max_limit = priv->snap_max_hard_limit; limit = (priv->snap_max_soft_limit * effective_max_limit)/100; count = volinfo->snap_count - limit; if (count <= 0) goto out; list_for_each_entry_safe (tmp_volinfo, other_volinfo, &volinfo->snap_volumes, snapvol_list) { if (var == count) break; snap = tmp_volinfo->snapshot; GF_ASSERT (snap); LOCK (&snap->lock); { snap->snap_status = GD_SNAP_STATUS_DECOMMISSION; ret = glusterd_store_snap (snap); if (ret) { gf_log (this->name, GF_LOG_ERROR, "could " "not store snap object %s", snap->snapname); goto unlock; } ret = glusterd_snap_remove (rsp_dict, snap, _gf_true, _gf_true); if (ret) gf_log (this->name, GF_LOG_WARNING, "failed to remove snap %s", snap->snapname); } unlock: UNLOCK (&snap->lock); var++; } } out: return ret; } int32_t glusterd_snapshot_create_postvalidate (dict_t *dict, int32_t op_ret, char **op_errstr, dict_t *rsp_dict) { xlator_t *this = NULL; glusterd_conf_t *priv = NULL; int ret = -1; int32_t cleanup = 0; glusterd_snap_t *snap = NULL; char *snapname = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); priv = this->private; GF_ASSERT (priv); if (op_ret) { ret = dict_get_int32 (dict, "cleanup", &cleanup); if (!ret && cleanup) { ret = glusterd_do_snap_cleanup (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "cleanup " "operation failed"); goto out; } } } ret = dict_get_str (dict, "snapname", &snapname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch " "snapname"); goto out; } snap = glusterd_find_snap_by_name (snapname); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "unable to find snap " "%s", snapname); goto out; } snap->snap_status = GD_SNAP_STATUS_IN_USE; ret = glusterd_store_snap (snap); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Could not store snap" "object %s", snap->snapname); goto out; } ret = glusterd_snapshot_update_snaps_post_validate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "create snapshot"); goto out; } //ignore the errors of autodelete ret = glusterd_handle_snap_limit (dict, rsp_dict); ret = 0; out: return ret; } int32_t glusterd_snapshot (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { xlator_t *this = NULL; glusterd_conf_t *priv = NULL; int32_t snap_command = 0; int ret = -1; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); priv = this->private; GF_ASSERT (priv); ret = dict_get_int32 (dict, "type", &snap_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "unable to get the type of " "the snapshot command"); goto out; } switch (snap_command) { case (GF_SNAP_OPTION_TYPE_CREATE): ret = glusterd_snapshot_create_commit (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "create snapshot"); goto out; } break; case GF_SNAP_OPTION_TYPE_CONFIG: ret = glusterd_snapshot_config_commit (dict, op_errstr, rsp_dict); break; case GF_SNAP_OPTION_TYPE_DELETE: ret = glusterd_snapshot_remove_commit (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "delete snapshot"); goto out; } break; case GF_SNAP_OPTION_TYPE_RESTORE: ret = glusterd_snapshot_restore (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Failed to " "restore snapshot"); goto out; } break; case GF_SNAP_OPTION_TYPE_ACTIVATE: ret = glusterd_snapshot_activate_commit (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Failed to " "activate snapshot"); goto out; } break; case GF_SNAP_OPTION_TYPE_DEACTIVATE: ret = glusterd_snapshot_deactivate_commit (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Failed to " "deactivate snapshot"); goto out; } break; case GF_SNAP_OPTION_TYPE_STATUS: ret = glusterd_snapshot_status_commit (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "show snapshot status"); goto out; } break; default: gf_log (this->name, GF_LOG_WARNING, "invalid snap command"); goto out; break; } ret = 0; out: return ret; } int glusterd_snapshot_brickop (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int ret = -1; int64_t vol_count = 0; int64_t count = 1; char key[1024] = {0,}; char *volname = NULL; int32_t snap_command = 0; xlator_t *this = NULL; char *op_type = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); ret = dict_get_int32 (dict, "type", &snap_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "unable to get the type of " "the snapshot command"); goto out; } switch (snap_command) { case GF_SNAP_OPTION_TYPE_CREATE: /* op_type with tell us whether its pre-commit operation * or post-commit */ ret = dict_get_str (dict, "operation-type", &op_type); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to fetch " "operation type"); goto out; } if (strcmp (op_type, "pre") == 0) { /* BRICK OP PHASE for enabling barrier, Enable barrier * if its a pre-commit operation */ ret = glusterd_set_barrier_value (dict, "enable"); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "set barrier value as enable in dict"); goto out; } } else if (strcmp (op_type, "post") == 0) { /* BRICK OP PHASE for disabling barrier, Disable barrier * if its a post-commit operation */ ret = glusterd_set_barrier_value (dict, "disable"); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "set barrier value as disable in " "dict"); goto out; } } else { ret = -1; gf_log (this->name, GF_LOG_ERROR, "Invalid op_type"); goto out; } ret = dict_get_int64 (dict, "volcount", &vol_count); if (ret) goto out; while (count <= vol_count) { snprintf (key, 1024, "volname%"PRId64, count); ret = dict_get_str (dict, key, &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to get volname"); goto out; } ret = dict_set_str (dict, "volname", volname); if (ret) goto out; ret = gd_brick_op_phase (GD_OP_SNAP, NULL, dict, op_errstr); if (ret) goto out; volname = NULL; count++; } dict_del (dict, "volname"); ret = 0; break; case GF_SNAP_OPTION_TYPE_DELETE: break; default: break; } out: return ret; } int glusterd_snapshot_prevalidate (dict_t *dict, char **op_errstr, dict_t *rsp_dict) { int snap_command = 0; xlator_t *this = NULL; int ret = -1; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); ret = dict_get_int32 (dict, "type", &snap_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "unable to get the type of " "the snapshot command"); goto out; } switch (snap_command) { case (GF_SNAP_OPTION_TYPE_CREATE): ret = glusterd_snapshot_create_prevalidate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot create " "pre-validation failed"); goto out; } break; case (GF_SNAP_OPTION_TYPE_CONFIG): ret = glusterd_snapshot_config_prevalidate (dict, op_errstr); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot config " "pre-validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_RESTORE: ret = glusterd_snapshot_restore_prevalidate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot restore " "validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_ACTIVATE: ret = glusterd_snapshot_activate_deactivate_prevalidate (dict, op_errstr, rsp_dict, _gf_true); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot activate " "validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_DEACTIVATE: ret = glusterd_snapshot_activate_deactivate_prevalidate (dict, op_errstr, rsp_dict, _gf_false); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot deactivate validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_DELETE: ret = glusterd_snapshot_remove_prevalidate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot remove " "validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_STATUS: ret = glusterd_snapshot_status_prevalidate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot status " "validation failed"); goto out; } break; default: gf_log (this->name, GF_LOG_WARNING, "invalid snap command"); goto out; } ret = 0; out: return ret; } /* This function is called if snapshot restore operation * is successful. It will cleanup the backup files created * during the restore operation. * * @param rsp_dict Response dictionary * @param volinfo volinfo of the volume which is being restored * @param snap snap object * * @return 0 on success or -1 on failure */ int glusterd_snapshot_restore_cleanup (dict_t *rsp_dict, glusterd_volinfo_t *volinfo, glusterd_snap_t *snap) { int ret = -1; char delete_path[PATH_MAX] = {0,}; xlator_t *this = NULL; glusterd_conf_t *priv = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (rsp_dict); GF_ASSERT (volinfo); GF_ASSERT (snap); /* If the volinfo is already restored then we should delete * the backend LVMs */ if (!uuid_is_null (volinfo->restored_from_snap)) { ret = glusterd_lvm_snapshot_remove (rsp_dict, volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to remove " "LVM backend"); goto out; } } snprintf (delete_path, sizeof (delete_path), "%s/"GLUSTERD_TRASH"/vols-%s.deleted", priv->workdir, volinfo->volname); /* Restore is successful therefore delete the original volume's * volinfo. */ ret = glusterd_volinfo_delete (volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to delete volinfo"); goto out; } /* Now delete the snap entry. */ ret = glusterd_snap_remove (rsp_dict, snap, _gf_false, _gf_true); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Failed to delete " "snap %s", snap->snapname); goto out; } /* Delete the backup copy of volume folder */ ret = glusterd_recursive_rmdir (delete_path); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to remove " "backup dir (%s)", delete_path); goto out; } ret = 0; out: return ret; } /* This function is called when the snapshot restore operation failed * for some reasons. In such case we revert the restore operation. * * @param volinfo volinfo of the origin volume * @param restore_from_store Boolean variable which tells whether to * restore the origin from store or not. * * @return 0 on success and -1 on failure */ int glusterd_snapshot_revert_partial_restored_vol (glusterd_volinfo_t *volinfo, gf_boolean_t restore_from_store) { int ret = 0; char pathname [PATH_MAX] = {0,}; char trash_path[PATH_MAX] = {0,}; glusterd_volinfo_t *reverted_vol = NULL; glusterd_conf_t *priv = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); priv = this->private; GF_ASSERT (priv); GF_ASSERT (volinfo); GLUSTERD_GET_VOLUME_DIR (pathname, volinfo, priv); snprintf (trash_path, sizeof (trash_path), "%s/"GLUSTERD_TRASH"/vols-%s.deleted", priv->workdir, volinfo->volname); /* Since snapshot restore failed we cannot rely on the volume * data stored under vols folder. Therefore delete the origin * volume's backend folder.*/ ret = glusterd_recursive_rmdir (pathname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to remove " "%s directory", pathname); goto out; } /* Now move the backup copy of the vols to its original * location.*/ ret = rename (trash_path, pathname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to rename folder " "from %s to %s", trash_path, pathname); goto out; } /* Skip the volinfo retrieval from the store if restore_from_store * is not true. */ if (!restore_from_store) { ret = 0; goto out; } /* Retrieve the volume from the store */ reverted_vol = glusterd_store_retrieve_volume (volinfo->volname, NULL); if (NULL == reverted_vol) { gf_log (this->name, GF_LOG_ERROR, "Failed to load restored " "%s volume", volinfo->volname); goto out; } /* Since we retrieved the volinfo from store now we don't * want the older volinfo. Therefore delete the older volinfo */ ret = glusterd_volinfo_delete (volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to delete volinfo"); goto out; } ret = 0; out: return ret; } /* This function is called when glusterd is started and we need * to revert a failed snapshot restore. * * @param snap snapshot object of the restored snap * * @return 0 on success and -1 on failure */ int glusterd_snapshot_revert_restore_from_snap (glusterd_snap_t *snap) { int ret = -1; char volname [PATH_MAX] = {0,}; glusterd_volinfo_t *snap_volinfo = NULL; glusterd_volinfo_t *volinfo = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (snap); /* TODO : As of now there is only one volume in snapshot. * Change this when multiple volume snapshot is introduced */ snap_volinfo = list_entry (snap->volumes.next, glusterd_volinfo_t, vol_list); strcpy (volname, snap_volinfo->parent_volname); ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not get volinfo of " "%s", snap_volinfo->parent_volname); goto out; } ret = glusterd_snapshot_revert_partial_restored_vol (volinfo, _gf_true); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to revert snapshot " "restore operation for %s volume", volname); goto out; } out: return ret; } /* This function is called from post-validation. Based on the op_ret * it will take a decision on whether to revert the operation or * perform cleanup. * * @param dict dictionary object * @param op_ret return value of the restore operation * @param op_errstr error string * @param rsp_dict Response dictionary * * @return 0 on success and -1 on failure */ int glusterd_snapshot_restore_postop (dict_t *dict, int32_t op_ret, char **op_errstr, dict_t *rsp_dict) { int ret = -1; char *name = NULL; char *volname = NULL; int cleanup = 0; glusterd_snap_t *snap = NULL; glusterd_volinfo_t *volinfo = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); ret = dict_get_str (dict, "snapname", &name); if (ret) { gf_log (this->name, GF_LOG_ERROR, "getting the snap " "name failed (volume: %s)", volinfo->volname); goto out; } snap = glusterd_find_snap_by_name (name); if (!snap) { gf_log (this->name, GF_LOG_ERROR, "snap %s is not found", name); ret = -1; goto out; } /* TODO: fix this when multiple volume support will come */ ret = dict_get_str (dict, "volname1", &volname); if (ret) { gf_log (this->name, GF_LOG_ERROR, "failed to get volume name"); goto out; } ret = glusterd_volinfo_find (volname, &volinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Volume (%s) does not exist ", volname); goto out; } /* On success perform the cleanup operation */ if (0 == op_ret) { ret = glusterd_snapshot_restore_cleanup (rsp_dict, volinfo, snap); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to perform " "snapshot restore cleanup for %s volume", volname); goto out; } } else { /* On failure revert snapshot restore */ ret = dict_get_int32 (dict, "cleanup", &cleanup); /* Perform cleanup only when required */ if (ret || (0 == cleanup)) { ret = 0; goto out; } ret = glusterd_snapshot_revert_partial_restored_vol (volinfo, _gf_false); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to revert " "restore operation for %s volume", volname); goto out; } } ret = 0; out: return ret; } int glusterd_snapshot_postvalidate (dict_t *dict, int32_t op_ret, char **op_errstr, dict_t *rsp_dict) { int snap_command = 0; xlator_t *this = NULL; int ret = -1; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); ret = dict_get_int32 (dict, "type", &snap_command); if (ret) { gf_log (this->name, GF_LOG_ERROR, "unable to get the type of " "the snapshot command"); goto out; } switch (snap_command) { case GF_SNAP_OPTION_TYPE_CREATE: ret = glusterd_snapshot_create_postvalidate (dict, op_ret, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot create " "post-validation failed"); goto out; } break; case GF_SNAP_OPTION_TYPE_DELETE: ret = glusterd_snapshot_update_snaps_post_validate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "update missed snaps list"); goto out; } break; case GF_SNAP_OPTION_TYPE_RESTORE: ret = glusterd_snapshot_update_snaps_post_validate (dict, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "update missed snaps list"); goto out; } ret = glusterd_snapshot_restore_postop (dict, op_ret, op_errstr, rsp_dict); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to " "perform snapshot restore post-op"); goto out; } break; case GF_SNAP_OPTION_TYPE_ACTIVATE: case GF_SNAP_OPTION_TYPE_DEACTIVATE: /*Nothing to be done. But want to * avoid the default case warning*/ ret = 0; break; default: gf_log (this->name, GF_LOG_WARNING, "invalid snap command"); goto out; } ret = 0; out: return ret; } int glusterd_handle_snapshot_fn (rpcsvc_request_t *req) { int32_t ret = 0; dict_t *dict = NULL; gf_cli_req cli_req = {{0},}; glusterd_op_t cli_op = GD_OP_SNAP; int type = 0; glusterd_conf_t *conf = NULL; char *host_uuid = NULL; char err_str[2048] = {0,}; xlator_t *this = NULL; GF_ASSERT (req); this = THIS; GF_ASSERT (this); conf = this->private; GF_ASSERT (conf); ret = xdr_to_generic (req->msg[0], &cli_req, (xdrproc_t)xdr_gf_cli_req); if (ret < 0) { req->rpc_err = GARBAGE_ARGS; goto out; } if (cli_req.dict.dict_len > 0) { dict = dict_new (); if (!dict) goto out; ret = dict_unserialize (cli_req.dict.dict_val, cli_req.dict.dict_len, &dict); if (ret < 0) { gf_log (this->name, GF_LOG_ERROR, "failed to " "unserialize req-buffer to dictionary"); snprintf (err_str, sizeof (err_str), "Unable to decode " "the command"); goto out; } dict->extra_stdfree = cli_req.dict.dict_val; host_uuid = gf_strdup (uuid_utoa(MY_UUID)); if (host_uuid == NULL) { snprintf (err_str, sizeof (err_str), "Failed to get " "the uuid of local glusterd"); ret = -1; goto out; } ret = dict_set_dynstr (dict, "host-uuid", host_uuid); if (ret) { GF_FREE (host_uuid); goto out; } } else { gf_log (this->name, GF_LOG_ERROR, "request dict length is %d", cli_req.dict.dict_len); goto out; } ret = dict_get_int32 (dict, "type", &type); if (ret < 0) { snprintf (err_str, sizeof (err_str), "Command type not found"); gf_log (this->name, GF_LOG_ERROR, "%s", err_str); goto out; } switch (type) { case GF_SNAP_OPTION_TYPE_CREATE: ret = glusterd_handle_snapshot_create (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot create " "failed: %s", err_str); } break; case GF_SNAP_OPTION_TYPE_RESTORE: ret = glusterd_handle_snapshot_restore (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot restore " "failed: %s", err_str); } break; case GF_SNAP_OPTION_TYPE_INFO: ret = glusterd_handle_snapshot_info (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot info " "failed"); } break; case GF_SNAP_OPTION_TYPE_LIST: ret = glusterd_handle_snapshot_list (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot list " "failed"); } break; case GF_SNAP_OPTION_TYPE_CONFIG: ret = glusterd_handle_snapshot_config (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "snapshot config " "failed"); } break; case GF_SNAP_OPTION_TYPE_DELETE: ret = glusterd_handle_snapshot_remove (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot delete " "failed: %s", err_str); } break; case GF_SNAP_OPTION_TYPE_ACTIVATE: ret = glusterd_mgmt_v3_initiate_snap_phases (req, cli_op, dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot activate failed: %s", err_str); } break; case GF_SNAP_OPTION_TYPE_DEACTIVATE: ret = glusterd_mgmt_v3_initiate_snap_phases (req, cli_op, dict); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot deactivate failed: %s", err_str); } break; case GF_SNAP_OPTION_TYPE_STATUS: ret = glusterd_handle_snapshot_status (req, cli_op, dict, err_str, sizeof (err_str)); if (ret) { gf_log (this->name, GF_LOG_WARNING, "Snapshot status " "failed: %s", err_str); } break; default: gf_log (this->name, GF_LOG_ERROR, "Unkown snapshot request " "type (%d)", type); ret = -1; /* Failure */ } out: if (ret) { if (err_str[0] == '\0') snprintf (err_str, sizeof (err_str), "Operation failed"); ret = glusterd_op_send_cli_response (cli_op, ret, 0, req, dict, err_str); } return ret; } int glusterd_handle_snapshot (rpcsvc_request_t *req) { return glusterd_big_locked_handler (req, glusterd_handle_snapshot_fn); } static inline void glusterd_free_snap_op (glusterd_snap_op_t *snap_op) { if (snap_op) { if (snap_op->brick_path) GF_FREE (snap_op->brick_path); GF_FREE (snap_op); } } static inline void glusterd_free_missed_snapinfo (glusterd_missed_snap_info *missed_snapinfo) { glusterd_snap_op_t *snap_opinfo = NULL; glusterd_snap_op_t *tmp = NULL; if (missed_snapinfo) { list_for_each_entry_safe (snap_opinfo, tmp, &missed_snapinfo->snap_ops, snap_ops_list) { glusterd_free_snap_op (snap_opinfo); snap_opinfo = NULL; } if (missed_snapinfo->node_uuid) GF_FREE (missed_snapinfo->node_uuid); if (missed_snapinfo->snap_uuid) GF_FREE (missed_snapinfo->snap_uuid); GF_FREE (missed_snapinfo); } } /* Look for duplicates and accordingly update the list */ int32_t glusterd_update_missed_snap_entry (glusterd_missed_snap_info *missed_snapinfo, glusterd_snap_op_t *missed_snap_op) { int32_t ret = -1; glusterd_snap_op_t *snap_opinfo = NULL; gf_boolean_t match = _gf_false; xlator_t *this = NULL; this = THIS; GF_ASSERT(this); GF_ASSERT(missed_snapinfo); GF_ASSERT(missed_snap_op); list_for_each_entry (snap_opinfo, &missed_snapinfo->snap_ops, snap_ops_list) { /* If the entry is not for the same snap_vol_id * then continue */ if (strcmp (snap_opinfo->snap_vol_id, missed_snap_op->snap_vol_id)) continue; if ((!strcmp (snap_opinfo->brick_path, missed_snap_op->brick_path)) && (snap_opinfo->op == missed_snap_op->op)) { /* If two entries have conflicting status * GD_MISSED_SNAP_DONE takes precedence */ if ((snap_opinfo->status == GD_MISSED_SNAP_PENDING) && (missed_snap_op->status == GD_MISSED_SNAP_DONE)) { snap_opinfo->status = GD_MISSED_SNAP_DONE; gf_log (this->name, GF_LOG_INFO, "Updating missed snap status " "for %s:%s=%s:%d:%s:%d as DONE", missed_snapinfo->node_uuid, missed_snapinfo->snap_uuid, snap_opinfo->snap_vol_id, snap_opinfo->brick_num, snap_opinfo->brick_path, snap_opinfo->op); ret = 0; glusterd_free_snap_op (missed_snap_op); goto out; } match = _gf_true; break; } else if ((snap_opinfo->brick_num == missed_snap_op->brick_num) && (snap_opinfo->op == GF_SNAP_OPTION_TYPE_CREATE) && ((missed_snap_op->op == GF_SNAP_OPTION_TYPE_DELETE) || (missed_snap_op->op == GF_SNAP_OPTION_TYPE_RESTORE))) { /* Optimizing create and delete entries for the same * brick and same node */ gf_log (this->name, GF_LOG_INFO, "Updating missed snap status " "for %s:%s=%s:%d:%s:%d as DONE", missed_snapinfo->node_uuid, missed_snapinfo->snap_uuid, snap_opinfo->snap_vol_id, snap_opinfo->brick_num, snap_opinfo->brick_path, snap_opinfo->op); snap_opinfo->status = GD_MISSED_SNAP_DONE; ret = 0; glusterd_free_snap_op (missed_snap_op); goto out; } } if (match == _gf_true) { gf_log (this->name, GF_LOG_INFO, "Duplicate entry. Not updating"); glusterd_free_snap_op (missed_snap_op); } else { list_add_tail (&missed_snap_op->snap_ops_list, &missed_snapinfo->snap_ops); } ret = 0; out: gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } /* Add new missed snap entry to the missed_snaps list. */ int32_t glusterd_add_new_entry_to_list (char *missed_info, char *snap_vol_id, int32_t brick_num, char *brick_path, int32_t snap_op, int32_t snap_status) { char *buf = NULL; char *save_ptr = NULL; char node_snap_info[PATH_MAX] = ""; int32_t ret = -1; glusterd_missed_snap_info *missed_snapinfo = NULL; glusterd_snap_op_t *missed_snap_op = NULL; glusterd_conf_t *priv = NULL; gf_boolean_t match = _gf_false; gf_boolean_t free_missed_snap_info = _gf_false; xlator_t *this = NULL; this = THIS; GF_ASSERT(this); GF_ASSERT(missed_info); GF_ASSERT(snap_vol_id); GF_ASSERT(brick_path); priv = this->private; GF_ASSERT (priv); /* Create the snap_op object consisting of the * * snap id and the op */ ret = glusterd_missed_snap_op_new (&missed_snap_op); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to create new missed snap object."); ret = -1; goto out; } missed_snap_op->snap_vol_id = gf_strdup(snap_vol_id); if (!missed_snap_op->snap_vol_id) { ret = -1; goto out; } missed_snap_op->brick_path = gf_strdup(brick_path); if (!missed_snap_op->brick_path) { ret = -1; goto out; } missed_snap_op->brick_num = brick_num; missed_snap_op->op = snap_op; missed_snap_op->status = snap_status; /* Look for other entries for the same node and same snap */ list_for_each_entry (missed_snapinfo, &priv->missed_snaps_list, missed_snaps) { snprintf (node_snap_info, sizeof(node_snap_info), "%s:%s", missed_snapinfo->node_uuid, missed_snapinfo->snap_uuid); if (!strcmp (node_snap_info, missed_info)) { /* Found missed snapshot info for * * the same node and same snap */ match = _gf_true; break; } } if (match == _gf_false) { /* First snap op missed for the brick */ ret = glusterd_missed_snapinfo_new (&missed_snapinfo); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to create missed snapinfo"); goto out; } free_missed_snap_info = _gf_true; buf = strtok_r (missed_info, ":", &save_ptr); if (!buf) { ret = -1; goto out; } missed_snapinfo->node_uuid = gf_strdup(buf); if (!missed_snapinfo->node_uuid) { ret = -1; goto out; } buf = strtok_r (NULL, ":", &save_ptr); if (!buf) { ret = -1; goto out; } missed_snapinfo->snap_uuid = gf_strdup(buf); if (!missed_snapinfo->snap_uuid) { ret = -1; goto out; } list_add_tail (&missed_snap_op->snap_ops_list, &missed_snapinfo->snap_ops); list_add_tail (&missed_snapinfo->missed_snaps, &priv->missed_snaps_list); ret = 0; goto out; } else { ret = glusterd_update_missed_snap_entry (missed_snapinfo, missed_snap_op); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to update existing missed snap entry."); goto out; } } out: if (ret) { glusterd_free_snap_op (missed_snap_op); if (missed_snapinfo && (free_missed_snap_info == _gf_true)) glusterd_free_missed_snapinfo (missed_snapinfo); } gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } /* Add missing snap entries to the in-memory conf->missed_snap_list */ int32_t glusterd_add_missed_snaps_to_list (dict_t *dict, int32_t missed_snap_count) { char *buf = NULL; char *tmp = NULL; char *save_ptr = NULL; char *nodeid = NULL; char *snap_uuid = NULL; char *snap_vol_id = NULL; char *brick_path = NULL; char missed_info[PATH_MAX] = ""; char name_buf[PATH_MAX] = ""; int32_t i = -1; int32_t ret = -1; int32_t brick_num = -1; int32_t snap_op = -1; int32_t snap_status = -1; glusterd_conf_t *priv = NULL; xlator_t *this = NULL; this = THIS; GF_ASSERT(this); GF_ASSERT(dict); priv = this->private; GF_ASSERT (priv); /* We can update the missed_snaps_list without acquiring * * any additional locks as big lock will be held. */ for (i = 0; i < missed_snap_count; i++) { snprintf (name_buf, sizeof(name_buf), "missed_snaps_%d", i); ret = dict_get_str (dict, name_buf, &buf); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Unable to fetch %s", name_buf); goto out; } gf_log (this->name, GF_LOG_DEBUG, "missed_snap_entry = %s", buf); /* Need to make a duplicate string coz the same dictionary * * is resent to the non-originator nodes */ tmp = gf_strdup (buf); if (!tmp) { ret = -1; goto out; } /* Fetch the node-id, snap-id, brick_num, * brick_path, snap_op and snap status */ nodeid = strtok_r (tmp, ":", &save_ptr); snap_uuid = strtok_r (NULL, "=", &save_ptr); snap_vol_id = strtok_r (NULL, ":", &save_ptr); brick_num = atoi(strtok_r (NULL, ":", &save_ptr)); brick_path = strtok_r (NULL, ":", &save_ptr); snap_op = atoi(strtok_r (NULL, ":", &save_ptr)); snap_status = atoi(strtok_r (NULL, ":", &save_ptr)); if (!nodeid || !snap_uuid || !brick_path || !snap_vol_id || brick_num < 1 || snap_op < 1 || snap_status < 1) { gf_log (this->name, GF_LOG_ERROR, "Invalid missed_snap_entry"); ret = -1; goto out; } snprintf (missed_info, sizeof(missed_info), "%s:%s", nodeid, snap_uuid); ret = glusterd_add_new_entry_to_list (missed_info, snap_vol_id, brick_num, brick_path, snap_op, snap_status); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to store missed snaps_list"); goto out; } GF_FREE (tmp); tmp = NULL; } ret = 0; out: if (tmp) GF_FREE (tmp); gf_log (this->name, GF_LOG_TRACE, "Returning %d", ret); return ret; } /* This function will restore origin volume to it's snap. * The restore operation will simply replace the Gluster origin * volume with the snap volume. * TODO: Multi-volume delete to be done. * Cleanup in case of restore failure is pending. * * @param orig_vol volinfo of origin volume * @param snap_vol volinfo of snapshot volume * * @return 0 on success and negative value on error */ int gd_restore_snap_volume (dict_t *dict, dict_t *rsp_dict, glusterd_volinfo_t *orig_vol, glusterd_volinfo_t *snap_vol, int32_t volcount) { int ret = -1; glusterd_volinfo_t *new_volinfo = NULL; glusterd_snap_t *snap = NULL; xlator_t *this = NULL; glusterd_conf_t *conf = NULL; glusterd_volinfo_t *temp_volinfo = NULL; glusterd_volinfo_t *voliter = NULL; this = THIS; GF_ASSERT (this); GF_ASSERT (dict); GF_ASSERT (rsp_dict); conf = this->private; GF_ASSERT (conf); GF_VALIDATE_OR_GOTO (this->name, orig_vol, out); GF_VALIDATE_OR_GOTO (this->name, snap_vol, out); snap = snap_vol->snapshot; GF_VALIDATE_OR_GOTO (this->name, snap, out); /* Set the status to under restore so that if the * the node goes down during restore and comes back * the state of the volume can be reverted correctly */ snap->snap_status = GD_SNAP_STATUS_UNDER_RESTORE; /* We need to save this in disk so that if node goes * down the status is in updated state. */ ret = glusterd_store_snap (snap); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Could not store snap " "object for %s snap of %s volume", snap_vol->volname, snap_vol->parent_volname); goto out; } /* Snap volume must be stoped before performing the * restore operation. */ ret = glusterd_stop_volume (snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to stop " "snap volume"); goto out; } /* Create a new volinfo for the restored volume */ ret = glusterd_volinfo_dup (snap_vol, &new_volinfo, _gf_true); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to create volinfo"); goto out; } /* Following entries need to be derived from origin volume. */ strcpy (new_volinfo->volname, orig_vol->volname); uuid_copy (new_volinfo->volume_id, orig_vol->volume_id); new_volinfo->snap_count = orig_vol->snap_count; new_volinfo->snap_max_hard_limit = orig_vol->snap_max_hard_limit; uuid_copy (new_volinfo->restored_from_snap, snap_vol->snapshot->snap_id); /* Bump the version of the restored volume, so that nodes * * which are done can sync during handshake */ new_volinfo->version = orig_vol->version; list_for_each_entry_safe (voliter, temp_volinfo, &orig_vol->snap_volumes, snapvol_list) { list_add_tail (&voliter->snapvol_list, &new_volinfo->snap_volumes); } /* Copy the snap vol info to the new_volinfo.*/ ret = glusterd_snap_volinfo_restore (dict, rsp_dict, new_volinfo, snap_vol, volcount); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to restore snap"); goto out; } ret = glusterd_restore_geo_rep_files (snap_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to restore " "geo-rep files for snap %s", snap_vol->snapshot->snapname); goto out; } ret = glusterd_copy_quota_files (snap_vol, orig_vol); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to restore " "quota files for snap %s", snap_vol->snapshot->snapname); goto out; } /* New volinfo always shows the status as created. Therefore * set the status to the original volume's status. */ glusterd_set_volume_status (new_volinfo, orig_vol->status); list_add_tail (&new_volinfo->vol_list, &conf->volumes); ret = glusterd_store_volinfo (new_volinfo, GLUSTERD_VOLINFO_VER_AC_INCREMENT); if (ret) { gf_log (this->name, GF_LOG_ERROR, "Failed to store volinfo"); goto out; } ret = 0; out: if (ret && NULL != new_volinfo) { /* In case of any failure we should free new_volinfo. Doing * this will also remove the entry we added in conf->volumes * if it was added there. */ (void)glusterd_volinfo_delete (new_volinfo); } return ret; }