lockspace.c 19 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873
  1. /******************************************************************************
  2. *******************************************************************************
  3. **
  4. ** Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
  5. ** Copyright (C) 2004-2011 Red Hat, Inc. All rights reserved.
  6. **
  7. ** This copyrighted material is made available to anyone wishing to use,
  8. ** modify, copy, or redistribute it subject to the terms and conditions
  9. ** of the GNU General Public License v.2.
  10. **
  11. *******************************************************************************
  12. ******************************************************************************/
  13. #include "dlm_internal.h"
  14. #include "lockspace.h"
  15. #include "member.h"
  16. #include "recoverd.h"
  17. #include "dir.h"
  18. #include "lowcomms.h"
  19. #include "config.h"
  20. #include "memory.h"
  21. #include "lock.h"
  22. #include "recover.h"
  23. #include "requestqueue.h"
  24. #include "user.h"
  25. #include "ast.h"
  26. static int ls_count;
  27. static struct mutex ls_lock;
  28. static struct list_head lslist;
  29. static spinlock_t lslist_lock;
  30. static struct task_struct * scand_task;
  31. static ssize_t dlm_control_store(struct dlm_ls *ls, const char *buf, size_t len)
  32. {
  33. ssize_t ret = len;
  34. int n = simple_strtol(buf, NULL, 0);
  35. ls = dlm_find_lockspace_local(ls->ls_local_handle);
  36. if (!ls)
  37. return -EINVAL;
  38. switch (n) {
  39. case 0:
  40. dlm_ls_stop(ls);
  41. break;
  42. case 1:
  43. dlm_ls_start(ls);
  44. break;
  45. default:
  46. ret = -EINVAL;
  47. }
  48. dlm_put_lockspace(ls);
  49. return ret;
  50. }
  51. static ssize_t dlm_event_store(struct dlm_ls *ls, const char *buf, size_t len)
  52. {
  53. ls->ls_uevent_result = simple_strtol(buf, NULL, 0);
  54. set_bit(LSFL_UEVENT_WAIT, &ls->ls_flags);
  55. wake_up(&ls->ls_uevent_wait);
  56. return len;
  57. }
  58. static ssize_t dlm_id_show(struct dlm_ls *ls, char *buf)
  59. {
  60. return snprintf(buf, PAGE_SIZE, "%u\n", ls->ls_global_id);
  61. }
  62. static ssize_t dlm_id_store(struct dlm_ls *ls, const char *buf, size_t len)
  63. {
  64. ls->ls_global_id = simple_strtoul(buf, NULL, 0);
  65. return len;
  66. }
  67. static ssize_t dlm_recover_status_show(struct dlm_ls *ls, char *buf)
  68. {
  69. uint32_t status = dlm_recover_status(ls);
  70. return snprintf(buf, PAGE_SIZE, "%x\n", status);
  71. }
  72. static ssize_t dlm_recover_nodeid_show(struct dlm_ls *ls, char *buf)
  73. {
  74. return snprintf(buf, PAGE_SIZE, "%d\n", ls->ls_recover_nodeid);
  75. }
  76. struct dlm_attr {
  77. struct attribute attr;
  78. ssize_t (*show)(struct dlm_ls *, char *);
  79. ssize_t (*store)(struct dlm_ls *, const char *, size_t);
  80. };
  81. static struct dlm_attr dlm_attr_control = {
  82. .attr = {.name = "control", .mode = S_IWUSR},
  83. .store = dlm_control_store
  84. };
  85. static struct dlm_attr dlm_attr_event = {
  86. .attr = {.name = "event_done", .mode = S_IWUSR},
  87. .store = dlm_event_store
  88. };
  89. static struct dlm_attr dlm_attr_id = {
  90. .attr = {.name = "id", .mode = S_IRUGO | S_IWUSR},
  91. .show = dlm_id_show,
  92. .store = dlm_id_store
  93. };
  94. static struct dlm_attr dlm_attr_recover_status = {
  95. .attr = {.name = "recover_status", .mode = S_IRUGO},
  96. .show = dlm_recover_status_show
  97. };
  98. static struct dlm_attr dlm_attr_recover_nodeid = {
  99. .attr = {.name = "recover_nodeid", .mode = S_IRUGO},
  100. .show = dlm_recover_nodeid_show
  101. };
  102. static struct attribute *dlm_attrs[] = {
  103. &dlm_attr_control.attr,
  104. &dlm_attr_event.attr,
  105. &dlm_attr_id.attr,
  106. &dlm_attr_recover_status.attr,
  107. &dlm_attr_recover_nodeid.attr,
  108. NULL,
  109. };
  110. static ssize_t dlm_attr_show(struct kobject *kobj, struct attribute *attr,
  111. char *buf)
  112. {
  113. struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
  114. struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
  115. return a->show ? a->show(ls, buf) : 0;
  116. }
  117. static ssize_t dlm_attr_store(struct kobject *kobj, struct attribute *attr,
  118. const char *buf, size_t len)
  119. {
  120. struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
  121. struct dlm_attr *a = container_of(attr, struct dlm_attr, attr);
  122. return a->store ? a->store(ls, buf, len) : len;
  123. }
  124. static void lockspace_kobj_release(struct kobject *k)
  125. {
  126. struct dlm_ls *ls = container_of(k, struct dlm_ls, ls_kobj);
  127. kfree(ls);
  128. }
  129. static const struct sysfs_ops dlm_attr_ops = {
  130. .show = dlm_attr_show,
  131. .store = dlm_attr_store,
  132. };
  133. static struct kobj_type dlm_ktype = {
  134. .default_attrs = dlm_attrs,
  135. .sysfs_ops = &dlm_attr_ops,
  136. .release = lockspace_kobj_release,
  137. };
  138. static struct kset *dlm_kset;
  139. static int do_uevent(struct dlm_ls *ls, int in)
  140. {
  141. int error;
  142. if (in)
  143. kobject_uevent(&ls->ls_kobj, KOBJ_ONLINE);
  144. else
  145. kobject_uevent(&ls->ls_kobj, KOBJ_OFFLINE);
  146. log_debug(ls, "%s the lockspace group...", in ? "joining" : "leaving");
  147. /* dlm_controld will see the uevent, do the necessary group management
  148. and then write to sysfs to wake us */
  149. error = wait_event_interruptible(ls->ls_uevent_wait,
  150. test_and_clear_bit(LSFL_UEVENT_WAIT, &ls->ls_flags));
  151. log_debug(ls, "group event done %d %d", error, ls->ls_uevent_result);
  152. if (error)
  153. goto out;
  154. error = ls->ls_uevent_result;
  155. out:
  156. if (error)
  157. log_error(ls, "group %s failed %d %d", in ? "join" : "leave",
  158. error, ls->ls_uevent_result);
  159. return error;
  160. }
  161. static int dlm_uevent(struct kset *kset, struct kobject *kobj,
  162. struct kobj_uevent_env *env)
  163. {
  164. struct dlm_ls *ls = container_of(kobj, struct dlm_ls, ls_kobj);
  165. add_uevent_var(env, "LOCKSPACE=%s", ls->ls_name);
  166. return 0;
  167. }
  168. static struct kset_uevent_ops dlm_uevent_ops = {
  169. .uevent = dlm_uevent,
  170. };
  171. int __init dlm_lockspace_init(void)
  172. {
  173. ls_count = 0;
  174. mutex_init(&ls_lock);
  175. INIT_LIST_HEAD(&lslist);
  176. spin_lock_init(&lslist_lock);
  177. dlm_kset = kset_create_and_add("dlm", &dlm_uevent_ops, kernel_kobj);
  178. if (!dlm_kset) {
  179. printk(KERN_WARNING "%s: can not create kset\n", __func__);
  180. return -ENOMEM;
  181. }
  182. return 0;
  183. }
  184. void dlm_lockspace_exit(void)
  185. {
  186. kset_unregister(dlm_kset);
  187. }
  188. static struct dlm_ls *find_ls_to_scan(void)
  189. {
  190. struct dlm_ls *ls;
  191. spin_lock(&lslist_lock);
  192. list_for_each_entry(ls, &lslist, ls_list) {
  193. if (time_after_eq(jiffies, ls->ls_scan_time +
  194. dlm_config.ci_scan_secs * HZ)) {
  195. spin_unlock(&lslist_lock);
  196. return ls;
  197. }
  198. }
  199. spin_unlock(&lslist_lock);
  200. return NULL;
  201. }
  202. static int dlm_scand(void *data)
  203. {
  204. struct dlm_ls *ls;
  205. while (!kthread_should_stop()) {
  206. ls = find_ls_to_scan();
  207. if (ls) {
  208. if (dlm_lock_recovery_try(ls)) {
  209. ls->ls_scan_time = jiffies;
  210. dlm_scan_rsbs(ls);
  211. dlm_scan_timeout(ls);
  212. dlm_scan_waiters(ls);
  213. dlm_unlock_recovery(ls);
  214. } else {
  215. ls->ls_scan_time += HZ;
  216. }
  217. continue;
  218. }
  219. schedule_timeout_interruptible(dlm_config.ci_scan_secs * HZ);
  220. }
  221. return 0;
  222. }
  223. static int dlm_scand_start(void)
  224. {
  225. struct task_struct *p;
  226. int error = 0;
  227. p = kthread_run(dlm_scand, NULL, "dlm_scand");
  228. if (IS_ERR(p))
  229. error = PTR_ERR(p);
  230. else
  231. scand_task = p;
  232. return error;
  233. }
  234. static void dlm_scand_stop(void)
  235. {
  236. kthread_stop(scand_task);
  237. }
  238. struct dlm_ls *dlm_find_lockspace_global(uint32_t id)
  239. {
  240. struct dlm_ls *ls;
  241. spin_lock(&lslist_lock);
  242. list_for_each_entry(ls, &lslist, ls_list) {
  243. if (ls->ls_global_id == id) {
  244. ls->ls_count++;
  245. goto out;
  246. }
  247. }
  248. ls = NULL;
  249. out:
  250. spin_unlock(&lslist_lock);
  251. return ls;
  252. }
  253. struct dlm_ls *dlm_find_lockspace_local(dlm_lockspace_t *lockspace)
  254. {
  255. struct dlm_ls *ls;
  256. spin_lock(&lslist_lock);
  257. list_for_each_entry(ls, &lslist, ls_list) {
  258. if (ls->ls_local_handle == lockspace) {
  259. ls->ls_count++;
  260. goto out;
  261. }
  262. }
  263. ls = NULL;
  264. out:
  265. spin_unlock(&lslist_lock);
  266. return ls;
  267. }
  268. struct dlm_ls *dlm_find_lockspace_device(int minor)
  269. {
  270. struct dlm_ls *ls;
  271. spin_lock(&lslist_lock);
  272. list_for_each_entry(ls, &lslist, ls_list) {
  273. if (ls->ls_device.minor == minor) {
  274. ls->ls_count++;
  275. goto out;
  276. }
  277. }
  278. ls = NULL;
  279. out:
  280. spin_unlock(&lslist_lock);
  281. return ls;
  282. }
  283. void dlm_put_lockspace(struct dlm_ls *ls)
  284. {
  285. spin_lock(&lslist_lock);
  286. ls->ls_count--;
  287. spin_unlock(&lslist_lock);
  288. }
  289. static void remove_lockspace(struct dlm_ls *ls)
  290. {
  291. for (;;) {
  292. spin_lock(&lslist_lock);
  293. if (ls->ls_count == 0) {
  294. WARN_ON(ls->ls_create_count != 0);
  295. list_del(&ls->ls_list);
  296. spin_unlock(&lslist_lock);
  297. return;
  298. }
  299. spin_unlock(&lslist_lock);
  300. ssleep(1);
  301. }
  302. }
  /*
   * Start dlm_scand and then lowcomms.  If lowcomms fails to start, dlm_scand
   * is stopped again.  Returns 0 on success or the error of the step that
   * failed.
   */
  static int threads_start(void)
  {
      int error = dlm_scand_start();

      if (error) {
          log_print("cannot start dlm_scand thread %d", error);
          return error;
      }

      /* Thread for sending/receiving messages for all lockspace's */
      error = dlm_lowcomms_start();
      if (error) {
          log_print("cannot start dlm lowcomms %d", error);
          dlm_scand_stop();
          return error;
      }

      return 0;
  }
  /* Stop what threads_start() started: dlm_scand first, then lowcomms. */
  static void threads_stop(void)
  {
      dlm_scand_stop();
      dlm_lowcomms_stop();
  }
  328. static int new_lockspace(const char *name, const char *cluster,
  329. uint32_t flags, int lvblen,
  330. const struct dlm_lockspace_ops *ops, void *ops_arg,
  331. int *ops_result, dlm_lockspace_t **lockspace)
  332. {
  333. struct dlm_ls *ls;
  334. int i, size, error;
  335. int do_unreg = 0;
  336. int namelen = strlen(name);
  337. if (namelen > DLM_LOCKSPACE_LEN)
  338. return -EINVAL;
  339. if (!lvblen || (lvblen % 8))
  340. return -EINVAL;
  341. if (!try_module_get(THIS_MODULE))
  342. return -EINVAL;
  343. if (!dlm_user_daemon_available()) {
  344. log_print("dlm user daemon not available");
  345. error = -EUNATCH;
  346. goto out;
  347. }
  348. if (ops && ops_result) {
  349. if (!dlm_config.ci_recover_callbacks)
  350. *ops_result = -EOPNOTSUPP;
  351. else
  352. *ops_result = 0;
  353. }
  354. if (dlm_config.ci_recover_callbacks && cluster &&
  355. strncmp(cluster, dlm_config.ci_cluster_name, DLM_LOCKSPACE_LEN)) {
  356. log_print("dlm cluster name %s mismatch %s",
  357. dlm_config.ci_cluster_name, cluster);
  358. error = -EBADR;
  359. goto out;
  360. }
  361. error = 0;
  362. spin_lock(&lslist_lock);
  363. list_for_each_entry(ls, &lslist, ls_list) {
  364. WARN_ON(ls->ls_create_count <= 0);
  365. if (ls->ls_namelen != namelen)
  366. continue;
  367. if (memcmp(ls->ls_name, name, namelen))
  368. continue;
  369. if (flags & DLM_LSFL_NEWEXCL) {
  370. error = -EEXIST;
  371. break;
  372. }
  373. ls->ls_create_count++;
  374. *lockspace = ls;
  375. error = 1;
  376. break;
  377. }
  378. spin_unlock(&lslist_lock);
  379. if (error)
  380. goto out;
  381. error = -ENOMEM;
  382. ls = kzalloc(sizeof(struct dlm_ls) + namelen, GFP_NOFS);
  383. if (!ls)
  384. goto out;
  385. memcpy(ls->ls_name, name, namelen);
  386. ls->ls_namelen = namelen;
  387. ls->ls_lvblen = lvblen;
  388. ls->ls_count = 0;
  389. ls->ls_flags = 0;
  390. ls->ls_scan_time = jiffies;
  391. if (ops && dlm_config.ci_recover_callbacks) {
  392. ls->ls_ops = ops;
  393. ls->ls_ops_arg = ops_arg;
  394. }
  395. if (flags & DLM_LSFL_TIMEWARN)
  396. set_bit(LSFL_TIMEWARN, &ls->ls_flags);
  397. /* ls_exflags are forced to match among nodes, and we don't
  398. need to require all nodes to have some flags set */
  399. ls->ls_exflags = (flags & ~(DLM_LSFL_TIMEWARN | DLM_LSFL_FS |
  400. DLM_LSFL_NEWEXCL));
  401. size = dlm_config.ci_rsbtbl_size;
  402. ls->ls_rsbtbl_size = size;
  403. ls->ls_rsbtbl = vmalloc(sizeof(struct dlm_rsbtable) * size);
  404. if (!ls->ls_rsbtbl)
  405. goto out_lsfree;
  406. for (i = 0; i < size; i++) {
  407. ls->ls_rsbtbl[i].keep.rb_node = NULL;
  408. ls->ls_rsbtbl[i].toss.rb_node = NULL;
  409. spin_lock_init(&ls->ls_rsbtbl[i].lock);
  410. }
  411. idr_init(&ls->ls_lkbidr);
  412. spin_lock_init(&ls->ls_lkbidr_spin);
  413. size = dlm_config.ci_dirtbl_size;
  414. ls->ls_dirtbl_size = size;
  415. ls->ls_dirtbl = vmalloc(sizeof(struct dlm_dirtable) * size);
  416. if (!ls->ls_dirtbl)
  417. goto out_lkbfree;
  418. for (i = 0; i < size; i++) {
  419. INIT_LIST_HEAD(&ls->ls_dirtbl[i].list);
  420. spin_lock_init(&ls->ls_dirtbl[i].lock);
  421. }
  422. INIT_LIST_HEAD(&ls->ls_waiters);
  423. mutex_init(&ls->ls_waiters_mutex);
  424. INIT_LIST_HEAD(&ls->ls_orphans);
  425. mutex_init(&ls->ls_orphans_mutex);
  426. INIT_LIST_HEAD(&ls->ls_timeout);
  427. mutex_init(&ls->ls_timeout_mutex);
  428. INIT_LIST_HEAD(&ls->ls_new_rsb);
  429. spin_lock_init(&ls->ls_new_rsb_spin);
  430. INIT_LIST_HEAD(&ls->ls_nodes);
  431. INIT_LIST_HEAD(&ls->ls_nodes_gone);
  432. ls->ls_num_nodes = 0;
  433. ls->ls_low_nodeid = 0;
  434. ls->ls_total_weight = 0;
  435. ls->ls_node_array = NULL;
  436. memset(&ls->ls_stub_rsb, 0, sizeof(struct dlm_rsb));
  437. ls->ls_stub_rsb.res_ls = ls;
  438. ls->ls_debug_rsb_dentry = NULL;
  439. ls->ls_debug_waiters_dentry = NULL;
  440. init_waitqueue_head(&ls->ls_uevent_wait);
  441. ls->ls_uevent_result = 0;
  442. init_completion(&ls->ls_members_done);
  443. ls->ls_members_result = -1;
  444. mutex_init(&ls->ls_cb_mutex);
  445. INIT_LIST_HEAD(&ls->ls_cb_delay);
  446. ls->ls_recoverd_task = NULL;
  447. mutex_init(&ls->ls_recoverd_active);
  448. spin_lock_init(&ls->ls_recover_lock);
  449. spin_lock_init(&ls->ls_rcom_spin);
  450. get_random_bytes(&ls->ls_rcom_seq, sizeof(uint64_t));
  451. ls->ls_recover_status = 0;
  452. ls->ls_recover_seq = 0;
  453. ls->ls_recover_args = NULL;
  454. init_rwsem(&ls->ls_in_recovery);
  455. init_rwsem(&ls->ls_recv_active);
  456. INIT_LIST_HEAD(&ls->ls_requestqueue);
  457. mutex_init(&ls->ls_requestqueue_mutex);
  458. mutex_init(&ls->ls_clear_proc_locks);
  459. ls->ls_recover_buf = kmalloc(dlm_config.ci_buffer_size, GFP_NOFS);
  460. if (!ls->ls_recover_buf)
  461. goto out_dirfree;
  462. ls->ls_slot = 0;
  463. ls->ls_num_slots = 0;
  464. ls->ls_slots_size = 0;
  465. ls->ls_slots = NULL;
  466. INIT_LIST_HEAD(&ls->ls_recover_list);
  467. spin_lock_init(&ls->ls_recover_list_lock);
  468. ls->ls_recover_list_count = 0;
  469. ls->ls_local_handle = ls;
  470. init_waitqueue_head(&ls->ls_wait_general);
  471. INIT_LIST_HEAD(&ls->ls_root_list);
  472. init_rwsem(&ls->ls_root_sem);
  473. down_write(&ls->ls_in_recovery);
  474. spin_lock(&lslist_lock);
  475. ls->ls_create_count = 1;
  476. list_add(&ls->ls_list, &lslist);
  477. spin_unlock(&lslist_lock);
  478. if (flags & DLM_LSFL_FS) {
  479. error = dlm_callback_start(ls);
  480. if (error) {
  481. log_error(ls, "can't start dlm_callback %d", error);
  482. goto out_delist;
  483. }
  484. }
  485. /* needs to find ls in lslist */
  486. error = dlm_recoverd_start(ls);
  487. if (error) {
  488. log_error(ls, "can't start dlm_recoverd %d", error);
  489. goto out_callback;
  490. }
  491. ls->ls_kobj.kset = dlm_kset;
  492. error = kobject_init_and_add(&ls->ls_kobj, &dlm_ktype, NULL,
  493. "%s", ls->ls_name);
  494. if (error)
  495. goto out_recoverd;
  496. kobject_uevent(&ls->ls_kobj, KOBJ_ADD);
  497. /* let kobject handle freeing of ls if there's an error */
  498. do_unreg = 1;
  499. /* This uevent triggers dlm_controld in userspace to add us to the
  500. group of nodes that are members of this lockspace (managed by the
  501. cluster infrastructure.) Once it's done that, it tells us who the
  502. current lockspace members are (via configfs) and then tells the
  503. lockspace to start running (via sysfs) in dlm_ls_start(). */
  504. error = do_uevent(ls, 1);
  505. if (error)
  506. goto out_recoverd;
  507. wait_for_completion(&ls->ls_members_done);
  508. error = ls->ls_members_result;
  509. if (error)
  510. goto out_members;
  511. dlm_create_debug_file(ls);
  512. log_debug(ls, "join complete");
  513. *lockspace = ls;
  514. return 0;
  515. out_members:
  516. do_uevent(ls, 0);
  517. dlm_clear_members(ls);
  518. kfree(ls->ls_node_array);
  519. out_recoverd:
  520. dlm_recoverd_stop(ls);
  521. out_callback:
  522. dlm_callback_stop(ls);
  523. out_delist:
  524. spin_lock(&lslist_lock);
  525. list_del(&ls->ls_list);
  526. spin_unlock(&lslist_lock);
  527. kfree(ls->ls_recover_buf);
  528. out_dirfree:
  529. vfree(ls->ls_dirtbl);
  530. out_lkbfree:
  531. idr_destroy(&ls->ls_lkbidr);
  532. vfree(ls->ls_rsbtbl);
  533. out_lsfree:
  534. if (do_unreg)
  535. kobject_put(&ls->ls_kobj);
  536. else
  537. kfree(ls);
  538. out:
  539. module_put(THIS_MODULE);
  540. return error;
  541. }
  542. int dlm_new_lockspace(const char *name, const char *cluster,
  543. uint32_t flags, int lvblen,
  544. const struct dlm_lockspace_ops *ops, void *ops_arg,
  545. int *ops_result, dlm_lockspace_t **lockspace)
  546. {
  547. int error = 0;
  548. mutex_lock(&ls_lock);
  549. if (!ls_count)
  550. error = threads_start();
  551. if (error)
  552. goto out;
  553. error = new_lockspace(name, cluster, flags, lvblen, ops, ops_arg,
  554. ops_result, lockspace);
  555. if (!error)
  556. ls_count++;
  557. if (error > 0)
  558. error = 0;
  559. if (!ls_count)
  560. threads_stop();
  561. out:
  562. mutex_unlock(&ls_lock);
  563. return error;
  564. }
  565. static int lkb_idr_is_local(int id, void *p, void *data)
  566. {
  567. struct dlm_lkb *lkb = p;
  568. if (!lkb->lkb_nodeid)
  569. return 1;
  570. return 0;
  571. }
  /*
   * idr_for_each() callback that reports 1 for every entry, whatever it is.
   * Used by lockspace_busy() for force == 0.
   */
  static int lkb_idr_is_any(int id, void *p, void *data)
  {
      (void)id;
      (void)p;
      (void)data;
      return 1;
  }
  576. static int lkb_idr_free(int id, void *p, void *data)
  577. {
  578. struct dlm_lkb *lkb = p;
  579. if (lkb->lkb_lvbptr && lkb->lkb_flags & DLM_IFL_MSTCPY)
  580. dlm_free_lvb(lkb->lkb_lvbptr);
  581. dlm_free_lkb(lkb);
  582. return 0;
  583. }
  584. /* NOTE: We check the lkbidr here rather than the resource table.
  585. This is because there may be LKBs queued as ASTs that have been unlinked
  586. from their RSBs and are pending deletion once the AST has been delivered */
  587. static int lockspace_busy(struct dlm_ls *ls, int force)
  588. {
  589. int rv;
  590. spin_lock(&ls->ls_lkbidr_spin);
  591. if (force == 0) {
  592. rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_any, ls);
  593. } else if (force == 1) {
  594. rv = idr_for_each(&ls->ls_lkbidr, lkb_idr_is_local, ls);
  595. } else {
  596. rv = 0;
  597. }
  598. spin_unlock(&ls->ls_lkbidr_spin);
  599. return rv;
  600. }
  601. static int release_lockspace(struct dlm_ls *ls, int force)
  602. {
  603. struct dlm_rsb *rsb;
  604. struct rb_node *n;
  605. int i, busy, rv;
  606. busy = lockspace_busy(ls, force);
  607. spin_lock(&lslist_lock);
  608. if (ls->ls_create_count == 1) {
  609. if (busy) {
  610. rv = -EBUSY;
  611. } else {
  612. /* remove_lockspace takes ls off lslist */
  613. ls->ls_create_count = 0;
  614. rv = 0;
  615. }
  616. } else if (ls->ls_create_count > 1) {
  617. rv = --ls->ls_create_count;
  618. } else {
  619. rv = -EINVAL;
  620. }
  621. spin_unlock(&lslist_lock);
  622. if (rv) {
  623. log_debug(ls, "release_lockspace no remove %d", rv);
  624. return rv;
  625. }
  626. dlm_device_deregister(ls);
  627. if (force < 3 && dlm_user_daemon_available())
  628. do_uevent(ls, 0);
  629. dlm_recoverd_stop(ls);
  630. dlm_callback_stop(ls);
  631. remove_lockspace(ls);
  632. dlm_delete_debug_file(ls);
  633. kfree(ls->ls_recover_buf);
  634. /*
  635. * Free direntry structs.
  636. */
  637. dlm_dir_clear(ls);
  638. vfree(ls->ls_dirtbl);
  639. /*
  640. * Free all lkb's in idr
  641. */
  642. idr_for_each(&ls->ls_lkbidr, lkb_idr_free, ls);
  643. idr_remove_all(&ls->ls_lkbidr);
  644. idr_destroy(&ls->ls_lkbidr);
  645. /*
  646. * Free all rsb's on rsbtbl[] lists
  647. */
  648. for (i = 0; i < ls->ls_rsbtbl_size; i++) {
  649. while ((n = rb_first(&ls->ls_rsbtbl[i].keep))) {
  650. rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
  651. rb_erase(n, &ls->ls_rsbtbl[i].keep);
  652. dlm_free_rsb(rsb);
  653. }
  654. while ((n = rb_first(&ls->ls_rsbtbl[i].toss))) {
  655. rsb = rb_entry(n, struct dlm_rsb, res_hashnode);
  656. rb_erase(n, &ls->ls_rsbtbl[i].toss);
  657. dlm_free_rsb(rsb);
  658. }
  659. }
  660. vfree(ls->ls_rsbtbl);
  661. while (!list_empty(&ls->ls_new_rsb)) {
  662. rsb = list_first_entry(&ls->ls_new_rsb, struct dlm_rsb,
  663. res_hashchain);
  664. list_del(&rsb->res_hashchain);
  665. dlm_free_rsb(rsb);
  666. }
  667. /*
  668. * Free structures on any other lists
  669. */
  670. dlm_purge_requestqueue(ls);
  671. kfree(ls->ls_recover_args);
  672. dlm_clear_free_entries(ls);
  673. dlm_clear_members(ls);
  674. dlm_clear_members_gone(ls);
  675. kfree(ls->ls_node_array);
  676. log_debug(ls, "release_lockspace final free");
  677. kobject_put(&ls->ls_kobj);
  678. /* The ls structure will be freed when the kobject is done with */
  679. module_put(THIS_MODULE);
  680. return 0;
  681. }
  682. /*
  683. * Called when a system has released all its locks and is not going to use the
  684. * lockspace any longer. We free everything we're managing for this lockspace.
  685. * Remaining nodes will go through the recovery process as if we'd died. The
  686. * lockspace must continue to function as usual, participating in recoveries,
  687. * until this returns.
  688. *
  689. * Force has 4 possible values:
  690. * 0 - don't destroy locksapce if it has any LKBs
  691. * 1 - destroy lockspace if it has remote LKBs but not if it has local LKBs
  692. * 2 - destroy lockspace regardless of LKBs
  693. * 3 - destroy lockspace as part of a forced shutdown
  694. */
  695. int dlm_release_lockspace(void *lockspace, int force)
  696. {
  697. struct dlm_ls *ls;
  698. int error;
  699. ls = dlm_find_lockspace_local(lockspace);
  700. if (!ls)
  701. return -EINVAL;
  702. dlm_put_lockspace(ls);
  703. mutex_lock(&ls_lock);
  704. error = release_lockspace(ls, force);
  705. if (!error)
  706. ls_count--;
  707. if (!ls_count)
  708. threads_stop();
  709. mutex_unlock(&ls_lock);
  710. return error;
  711. }
  712. void dlm_stop_lockspaces(void)
  713. {
  714. struct dlm_ls *ls;
  715. restart:
  716. spin_lock(&lslist_lock);
  717. list_for_each_entry(ls, &lslist, ls_list) {
  718. if (!test_bit(LSFL_RUNNING, &ls->ls_flags))
  719. continue;
  720. spin_unlock(&lslist_lock);
  721. log_error(ls, "no userland control daemon, stopping lockspace");
  722. dlm_ls_stop(ls);
  723. goto restart;
  724. }
  725. spin_unlock(&lslist_lock);
  726. }