| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 1 | /****************************************************************************** | 
 | 2 | ******************************************************************************* | 
 | 3 | ** | 
 | 4 | **  Copyright (C) 2005 Red Hat, Inc.  All rights reserved. | 
 | 5 | ** | 
 | 6 | **  This copyrighted material is made available to anyone wishing to use, | 
 | 7 | **  modify, copy, or redistribute it subject to the terms and conditions | 
 | 8 | **  of the GNU General Public License v.2. | 
 | 9 | ** | 
 | 10 | ******************************************************************************* | 
 | 11 | ******************************************************************************/ | 
 | 12 |  | 
 | 13 | #include "dlm_internal.h" | 
 | 14 | #include "member.h" | 
 | 15 | #include "lock.h" | 
 | 16 | #include "dir.h" | 
 | 17 | #include "config.h" | 
 | 18 | #include "requestqueue.h" | 
 | 19 |  | 
 | 20 | struct rq_entry { | 
 | 21 | 	struct list_head list; | 
 | 22 | 	int nodeid; | 
 | 23 | 	char request[1]; | 
 | 24 | }; | 
 | 25 |  | 
 | 26 | /* | 
 | 27 |  * Requests received while the lockspace is in recovery get added to the | 
 | 28 |  * request queue and processed when recovery is complete.  This happens when | 
 | 29 |  * the lockspace is suspended on some nodes before it is on others, or the | 
 | 30 |  * lockspace is enabled on some while still suspended on others. | 
 | 31 |  */ | 
 | 32 |  | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 33 | int dlm_add_requestqueue(struct dlm_ls *ls, int nodeid, struct dlm_header *hd) | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 34 | { | 
 | 35 | 	struct rq_entry *e; | 
 | 36 | 	int length = hd->h_length; | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 37 | 	int rv = 0; | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 38 |  | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 39 | 	e = kmalloc(sizeof(struct rq_entry) + length, GFP_KERNEL); | 
 | 40 | 	if (!e) { | 
 | 41 | 		log_print("dlm_add_requestqueue: out of memory\n"); | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 42 | 		return 0; | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 43 | 	} | 
 | 44 |  | 
 | 45 | 	e->nodeid = nodeid; | 
 | 46 | 	memcpy(e->request, hd, length); | 
 | 47 |  | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 48 | 	/* We need to check dlm_locking_stopped() after taking the mutex to | 
 | 49 | 	   avoid a race where dlm_recoverd enables locking and runs | 
 | 50 | 	   process_requestqueue between our earlier dlm_locking_stopped check | 
 | 51 | 	   and this addition to the requestqueue. */ | 
 | 52 |  | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 53 | 	mutex_lock(&ls->ls_requestqueue_mutex); | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 54 | 	if (dlm_locking_stopped(ls)) | 
 | 55 | 		list_add_tail(&e->list, &ls->ls_requestqueue); | 
 | 56 | 	else { | 
 | 57 | 		log_debug(ls, "dlm_add_requestqueue skip from %d", nodeid); | 
 | 58 | 		kfree(e); | 
 | 59 | 		rv = -EAGAIN; | 
 | 60 | 	} | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 61 | 	mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | d440015 | 2006-10-31 11:55:56 -0600 | [diff] [blame] | 62 | 	return rv; | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 63 | } | 
 | 64 |  | 
 | 65 | int dlm_process_requestqueue(struct dlm_ls *ls) | 
 | 66 | { | 
 | 67 | 	struct rq_entry *e; | 
 | 68 | 	struct dlm_header *hd; | 
 | 69 | 	int error = 0; | 
 | 70 |  | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 71 | 	mutex_lock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 72 |  | 
 | 73 | 	for (;;) { | 
 | 74 | 		if (list_empty(&ls->ls_requestqueue)) { | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 75 | 			mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 76 | 			error = 0; | 
 | 77 | 			break; | 
 | 78 | 		} | 
 | 79 | 		e = list_entry(ls->ls_requestqueue.next, struct rq_entry, list); | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 80 | 		mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 81 |  | 
 | 82 | 		hd = (struct dlm_header *) e->request; | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 83 | 		error = dlm_receive_message(hd, e->nodeid, 1); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 84 |  | 
 | 85 | 		if (error == -EINTR) { | 
 | 86 | 			/* entry is left on requestqueue */ | 
 | 87 | 			log_debug(ls, "process_requestqueue abort eintr"); | 
 | 88 | 			break; | 
 | 89 | 		} | 
 | 90 |  | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 91 | 		mutex_lock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 92 | 		list_del(&e->list); | 
 | 93 | 		kfree(e); | 
 | 94 |  | 
 | 95 | 		if (dlm_locking_stopped(ls)) { | 
 | 96 | 			log_debug(ls, "process_requestqueue abort running"); | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 97 | 			mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 98 | 			error = -EINTR; | 
 | 99 | 			break; | 
 | 100 | 		} | 
 | 101 | 		schedule(); | 
 | 102 | 	} | 
 | 103 |  | 
 | 104 | 	return error; | 
 | 105 | } | 
 | 106 |  | 
 | 107 | /* | 
 | 108 |  * After recovery is done, locking is resumed and dlm_recoverd takes all the | 
 | 109 |  * saved requests and processes them as they would have been by dlm_recvd.  At | 
 | 110 |  * the same time, dlm_recvd will start receiving new requests from remote | 
 | 111 |  * nodes.  We want to delay dlm_recvd processing new requests until | 
 | 112 |  * dlm_recoverd has finished processing the old saved requests. | 
 | 113 |  */ | 
 | 114 |  | 
 | 115 | void dlm_wait_requestqueue(struct dlm_ls *ls) | 
 | 116 | { | 
 | 117 | 	for (;;) { | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 118 | 		mutex_lock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 119 | 		if (list_empty(&ls->ls_requestqueue)) | 
 | 120 | 			break; | 
 | 121 | 		if (dlm_locking_stopped(ls)) | 
 | 122 | 			break; | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 123 | 		mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 124 | 		schedule(); | 
 | 125 | 	} | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 126 | 	mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 127 | } | 
 | 128 |  | 
 | 129 | static int purge_request(struct dlm_ls *ls, struct dlm_message *ms, int nodeid) | 
 | 130 | { | 
 | 131 | 	uint32_t type = ms->m_type; | 
 | 132 |  | 
| David Teigland | 2896ee3 | 2006-11-27 11:31:22 -0600 | [diff] [blame] | 133 | 	/* the ls is being cleaned up and freed by release_lockspace */ | 
 | 134 | 	if (!ls->ls_count) | 
 | 135 | 		return 1; | 
 | 136 |  | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 137 | 	if (dlm_is_removed(ls, nodeid)) | 
 | 138 | 		return 1; | 
 | 139 |  | 
 | 140 | 	/* directory operations are always purged because the directory is | 
 | 141 | 	   always rebuilt during recovery and the lookups resent */ | 
 | 142 |  | 
 | 143 | 	if (type == DLM_MSG_REMOVE || | 
 | 144 | 	    type == DLM_MSG_LOOKUP || | 
 | 145 | 	    type == DLM_MSG_LOOKUP_REPLY) | 
 | 146 | 		return 1; | 
 | 147 |  | 
 | 148 | 	if (!dlm_no_directory(ls)) | 
 | 149 | 		return 0; | 
 | 150 |  | 
 | 151 | 	/* with no directory, the master is likely to change as a part of | 
 | 152 | 	   recovery; requests to/from the defunct master need to be purged */ | 
 | 153 |  | 
 | 154 | 	switch (type) { | 
 | 155 | 	case DLM_MSG_REQUEST: | 
 | 156 | 	case DLM_MSG_CONVERT: | 
 | 157 | 	case DLM_MSG_UNLOCK: | 
 | 158 | 	case DLM_MSG_CANCEL: | 
 | 159 | 		/* we're no longer the master of this resource, the sender | 
 | 160 | 		   will resend to the new master (see waiter_needs_recovery) */ | 
 | 161 |  | 
 | 162 | 		if (dlm_hash2nodeid(ls, ms->m_hash) != dlm_our_nodeid()) | 
 | 163 | 			return 1; | 
 | 164 | 		break; | 
 | 165 |  | 
 | 166 | 	case DLM_MSG_REQUEST_REPLY: | 
 | 167 | 	case DLM_MSG_CONVERT_REPLY: | 
 | 168 | 	case DLM_MSG_UNLOCK_REPLY: | 
 | 169 | 	case DLM_MSG_CANCEL_REPLY: | 
 | 170 | 	case DLM_MSG_GRANT: | 
 | 171 | 		/* this reply is from the former master of the resource, | 
 | 172 | 		   we'll resend to the new master if needed */ | 
 | 173 |  | 
 | 174 | 		if (dlm_hash2nodeid(ls, ms->m_hash) != nodeid) | 
 | 175 | 			return 1; | 
 | 176 | 		break; | 
 | 177 | 	} | 
 | 178 |  | 
 | 179 | 	return 0; | 
 | 180 | } | 
 | 181 |  | 
 | 182 | void dlm_purge_requestqueue(struct dlm_ls *ls) | 
 | 183 | { | 
 | 184 | 	struct dlm_message *ms; | 
 | 185 | 	struct rq_entry *e, *safe; | 
 | 186 |  | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 187 | 	mutex_lock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 188 | 	list_for_each_entry_safe(e, safe, &ls->ls_requestqueue, list) { | 
 | 189 | 		ms = (struct dlm_message *) e->request; | 
 | 190 |  | 
 | 191 | 		if (purge_request(ls, ms, e->nodeid)) { | 
 | 192 | 			list_del(&e->list); | 
 | 193 | 			kfree(e); | 
 | 194 | 		} | 
 | 195 | 	} | 
| David Teigland | 9013592 | 2006-01-20 08:47:07 +0000 | [diff] [blame] | 196 | 	mutex_unlock(&ls->ls_requestqueue_mutex); | 
| David Teigland | e7fd417 | 2006-01-18 09:30:29 +0000 | [diff] [blame] | 197 | } | 
 | 198 |  |