// -*- mode:C++; tab-width:8; c-basic-offset:2; indent-tabs-mode:t -*- // vim: ts=8 sw=2 smarttab /* * Ceph - scalable distributed file system * * Copyright (C) 2004-2006 Sage Weil * * This is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License version 2.1, as published by the Free Software * Foundation. See file COPYING. * */ #include #include #include #include #include using namespace std; #include "include/ceph_features.h" #include "common/config.h" #include "common/strtol.h" #include "mon/MonMap.h" #include "mds/MDS.h" #include "mds/Dumper.h" #include "mds/Resetter.h" #include "msg/Messenger.h" #include "common/Timer.h" #include "common/ceph_argparse.h" #include "common/pick_address.h" #include "global/global_init.h" #include "global/signal_handler.h" #include "global/pidfile.h" #include "mon/MonClient.h" #include "auth/KeyRing.h" #include "include/assert.h" #define dout_subsys ceph_subsys_mds void usage() { derr << "usage: ceph-mds -i name [flags] [[--journal_check rank]|[--hot-standby][rank]]\n" << " -m monitorip:port\n" << " connect to monitor at given address\n" << " --debug_mds n\n" << " debug MDS level (e.g. 10)\n" << " --dump-journal rank filename\n" << " dump the MDS journal for rank.\n" << " --journal-check rank\n" << " replay the journal for rank, then exit\n" << " --hot-standby rank\n" << " start up as a hot standby for rank\n" << " --reset-journal rank\n" << " discard the MDS journal for rank, and replace it with a single\n" << " event that updates/resets inotable and sessionmap on replay.\n" << dendl; generic_server_usage(); } static int do_cmds_special_action(const std::string &action, const std::string &dump_file, int rank) { common_init_finish(g_ceph_context); Messenger *messenger = Messenger::create(g_ceph_context, entity_name_t::CLIENT(), "mds", getpid()); int r = messenger->bind(g_conf->public_addr); if (r < 0) return r; MonClient mc(g_ceph_context); if (mc.build_initial_monmap() < 0) return -1; if (action == "dump-journal") { dout(0) << "dumping journal for mds." << rank << " to " << dump_file << dendl; Dumper *journal_dumper = new Dumper(messenger, &mc); journal_dumper->init(rank); journal_dumper->dump(dump_file.c_str()); mc.shutdown(); } else if (action == "undump-journal") { dout(0) << "undumping journal for mds." << rank << " from " << dump_file << dendl; Dumper *journal_dumper = new Dumper(messenger, &mc); journal_dumper->init(rank); journal_dumper->undump(dump_file.c_str()); mc.shutdown(); } else if (action == "reset-journal") { dout(0) << "resetting journal" << dendl; Resetter *jr = new Resetter(messenger, &mc); jr->init(rank); jr->reset(); mc.shutdown(); } else { assert(0); } return 0; } static void set_special_action(std::string &dest, const std::string &act) { if (!dest.empty()) { derr << "Parse error! Can't specify more than one action. You " << "specified both " << act << " and " << dest << "\n" << dendl; usage(); exit(1); } dest = act; } static int parse_rank(const char *opt_name, const std::string &val) { std::string err; int ret = strict_strtol(val.c_str(), 10, &err); if (!err.empty()) { derr << "error parsing " << opt_name << ": failed to parse rank. " << "It must be an int." << "\n" << dendl; usage(); } return ret; } MDS *mds = NULL; static void handle_mds_signal(int signum) { if (mds) mds->handle_signal(signum); } int main(int argc, const char **argv) { vector args; argv_to_vec(argc, argv, args); env_to_vec(args); global_init(NULL, args, CEPH_ENTITY_TYPE_MDS, CODE_ENVIRONMENT_DAEMON, 0); // mds specific args int shadow = 0; int rank = -1; std::string dump_file; std::string val, action; for (std::vector::iterator i = args.begin(); i != args.end(); ) { if (ceph_argparse_double_dash(args, i)) { break; } else if (ceph_argparse_witharg(args, i, &val, "--dump-journal", (char*)NULL)) { set_special_action(action, "dump-journal"); rank = parse_rank("dump-journal", val); if (i == args.end()) { derr << "error parsing --dump-journal: you must give a second " << "dump-journal argument: the filename to dump the journal to. " << "\n" << dendl; usage(); } dump_file = *i++; } else if (ceph_argparse_witharg(args, i, &val, "--undump-journal", (char*)NULL)) { set_special_action(action, "undump-journal"); rank = parse_rank("undump-journal", val); if (i == args.end()) { derr << "error parsing --undump-journal: you must give a second " << "undump-journal argument: the filename to undump the journal from. " << "\n" << dendl; usage(); } dump_file = *i++; } else if (ceph_argparse_witharg(args, i, &val, "--reset-journal", (char*)NULL)) { set_special_action(action, "reset-journal"); rank = parse_rank("reset-journal", val); } else if (ceph_argparse_witharg(args, i, &val, "--journal-check", (char*)NULL)) { int r = parse_rank("journal-check", val); if (shadow) { dout(0) << "Error: can only select one standby state" << dendl; return -1; } dout(0) << "requesting oneshot_replay for mds." << r << dendl; shadow = MDSMap::STATE_ONESHOT_REPLAY; char rb[32]; snprintf(rb, sizeof(rb), "%d", r); g_conf->set_val("mds_standby_for_rank", rb); g_conf->apply_changes(NULL); } else if (ceph_argparse_witharg(args, i, &val, "--hot-standby", (char*)NULL)) { int r = parse_rank("hot-standby", val); if (shadow) { dout(0) << "Error: can only select one standby state" << dendl; return -1; } dout(0) << "requesting standby_replay for mds." << r << dendl; shadow = MDSMap::STATE_STANDBY_REPLAY; char rb[32]; snprintf(rb, sizeof(rb), "%d", r); g_conf->set_val("mds_standby_for_rank", rb); g_conf->apply_changes(NULL); } else { derr << "Error: can't understand argument: " << *i << "\n" << dendl; usage(); } } pick_addresses(g_ceph_context, CEPH_PICK_ADDRESS_PUBLIC); // Check for special actions if (!action.empty()) { return do_cmds_special_action(action, dump_file, rank); } // Normal startup if (g_conf->name.has_default_id()) { derr << "must specify '-i name' with the ceph-mds instance name" << dendl; usage(); } Messenger *messenger = Messenger::create(g_ceph_context, entity_name_t::MDS(-1), "mds", getpid()); messenger->set_cluster_protocol(CEPH_MDS_PROTOCOL); cout << "starting " << g_conf->name << " at " << messenger->get_myaddr() << std::endl; uint64_t supported = CEPH_FEATURE_UID | CEPH_FEATURE_NOSRCADDR | CEPH_FEATURE_DIRLAYOUTHASH | CEPH_FEATURE_PGID64 | CEPH_FEATURE_MSG_AUTH; uint64_t required = CEPH_FEATURE_OSDREPLYMUX; messenger->set_default_policy(Messenger::Policy::lossy_client(supported, required)); messenger->set_policy(entity_name_t::TYPE_MON, Messenger::Policy::lossy_client(supported, CEPH_FEATURE_UID | CEPH_FEATURE_PGID64)); messenger->set_policy(entity_name_t::TYPE_MDS, Messenger::Policy::lossless_peer(supported, CEPH_FEATURE_UID)); messenger->set_policy(entity_name_t::TYPE_CLIENT, Messenger::Policy::stateful_server(supported, 0)); int r = messenger->bind(g_conf->public_addr); if (r < 0) exit(1); if (shadow != MDSMap::STATE_ONESHOT_REPLAY) global_init_daemonize(g_ceph_context, 0); common_init_finish(g_ceph_context); // get monmap MonClient mc(g_ceph_context); if (mc.build_initial_monmap() < 0) return -1; global_init_chdir(g_ceph_context); messenger->start(); // start mds mds = new MDS(g_conf->name.get_id().c_str(), messenger, &mc); // in case we have to respawn... mds->orig_argc = argc; mds->orig_argv = argv; if (shadow) r = mds->init(shadow); else r = mds->init(); if (r < 0) goto shutdown; // set up signal handlers, now that we've daemonized/forked. init_async_signal_handler(); register_async_signal_handler(SIGHUP, sighup_handler); register_async_signal_handler_oneshot(SIGINT, handle_mds_signal); register_async_signal_handler_oneshot(SIGTERM, handle_mds_signal); if (g_conf->inject_early_sigterm) kill(getpid(), SIGTERM); messenger->wait(); unregister_async_signal_handler(SIGHUP, sighup_handler); unregister_async_signal_handler(SIGINT, handle_mds_signal); unregister_async_signal_handler(SIGTERM, handle_mds_signal); shutdown_async_signal_handler(); shutdown: // yuck: grab the mds lock, so we can be sure that whoever in *mds // called shutdown finishes what they were doing. mds->mds_lock.Lock(); mds->mds_lock.Unlock(); pidfile_remove(); // only delete if it was a clean shutdown (to aid memory leak // detection, etc.). don't bother if it was a suicide. if (mds->is_stopped()) delete mds; g_ceph_context->put(); // cd on exit, so that gmon.out (if any) goes into a separate directory for each node. char s[20]; snprintf(s, sizeof(s), "gmon/%d", getpid()); if ((mkdir(s, 0755) == 0) && (chdir(s) == 0)) { cerr << "ceph-mds: gmon.out should be in " << s << std::endl; } return 0; }