Use cluster-aware procid_is_me instead of comparing pid's
[nivanova/samba-autobuild/.git] / source3 / smbd / oplock.c
1 /* 
2    Unix SMB/CIFS implementation.
3    oplock processing
4    Copyright (C) Andrew Tridgell 1992-1998
5    Copyright (C) Jeremy Allison 1998 - 2001
6    Copyright (C) Volker Lendecke 2005
7    
8    This program is free software; you can redistribute it and/or modify
9    it under the terms of the GNU General Public License as published by
10    the Free Software Foundation; either version 3 of the License, or
11    (at your option) any later version.
12    
13    This program is distributed in the hope that it will be useful,
14    but WITHOUT ANY WARRANTY; without even the implied warranty of
15    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16    GNU General Public License for more details.
17    
18    You should have received a copy of the GNU General Public License
19    along with this program.  If not, see <http://www.gnu.org/licenses/>.
20 */
21
22 #define DBGC_CLASS DBGC_LOCKING
23 #include "includes.h"
24 #include "smbd/globals.h"
25
26 /****************************************************************************
27  Get the number of current exclusive oplocks.
28 ****************************************************************************/
29
30 int32 get_number_of_exclusive_open_oplocks(void)
31 {
32   return exclusive_oplocks_open;
33 }
34
35 /*
36  * helper function used by the kernel oplock backends to post the break message
37  */
38 void break_kernel_oplock(struct messaging_context *msg_ctx, files_struct *fsp)
39 {
40         uint8_t msg[MSG_SMB_KERNEL_BREAK_SIZE];
41
42         /* Put the kernel break info into the message. */
43         push_file_id_24((char *)msg, &fsp->file_id);
44         SIVAL(msg,24,fsp->fh->gen_id);
45
46         /* Don't need to be root here as we're only ever
47            sending to ourselves. */
48
49         messaging_send_buf(msg_ctx, procid_self(),
50                            MSG_SMB_KERNEL_BREAK,
51                            msg, MSG_SMB_KERNEL_BREAK_SIZE);
52 }
53
54 /****************************************************************************
55  Attempt to set an oplock on a file. Always succeeds if kernel oplocks are
56  disabled (just sets flags). Returns True if oplock set.
57 ****************************************************************************/
58
59 bool set_file_oplock(files_struct *fsp, int oplock_type)
60 {
61         if ((fsp->oplock_type != NO_OPLOCK) &&
62             (fsp->oplock_type != FAKE_LEVEL_II_OPLOCK) &&
63             koplocks &&
64             !koplocks->ops->set_oplock(koplocks, fsp, oplock_type)) {
65                 return False;
66         }
67
68         fsp->oplock_type = oplock_type;
69         fsp->sent_oplock_break = NO_BREAK_SENT;
70         if (oplock_type == LEVEL_II_OPLOCK) {
71                 level_II_oplocks_open++;
72         } else if (EXCLUSIVE_OPLOCK_TYPE(fsp->oplock_type)) {
73                 exclusive_oplocks_open++;
74         }
75
76         DEBUG(5,("set_file_oplock: granted oplock on file %s, %s/%lu, "
77                     "tv_sec = %x, tv_usec = %x\n",
78                  fsp->fsp_name, file_id_string_tos(&fsp->file_id),
79                  fsp->fh->gen_id, (int)fsp->open_time.tv_sec,
80                  (int)fsp->open_time.tv_usec ));
81
82         return True;
83 }
84
85 /****************************************************************************
86  Attempt to release an oplock on a file. Decrements oplock count.
87 ****************************************************************************/
88
89 void release_file_oplock(files_struct *fsp)
90 {
91         if ((fsp->oplock_type != NO_OPLOCK) &&
92             (fsp->oplock_type != FAKE_LEVEL_II_OPLOCK) &&
93             koplocks) {
94                 koplocks->ops->release_oplock(koplocks, fsp, NO_OPLOCK);
95         }
96
97         if (fsp->oplock_type == LEVEL_II_OPLOCK) {
98                 level_II_oplocks_open--;
99         } else if (EXCLUSIVE_OPLOCK_TYPE(fsp->oplock_type)) {
100                 exclusive_oplocks_open--;
101         }
102
103         SMB_ASSERT(exclusive_oplocks_open>=0);
104         SMB_ASSERT(level_II_oplocks_open>=0);
105
106         if (EXCLUSIVE_OPLOCK_TYPE(fsp->oplock_type)) {
107                 /* This doesn't matter for close. */
108                 fsp->oplock_type = FAKE_LEVEL_II_OPLOCK;
109         } else {
110                 fsp->oplock_type = NO_OPLOCK;
111         }
112         fsp->sent_oplock_break = NO_BREAK_SENT;
113
114         flush_write_cache(fsp, OPLOCK_RELEASE_FLUSH);
115
116         TALLOC_FREE(fsp->oplock_timeout);
117 }
118
119 /****************************************************************************
120  Attempt to downgrade an oplock on a file. Doesn't decrement oplock count.
121 ****************************************************************************/
122
123 static void downgrade_file_oplock(files_struct *fsp)
124 {
125         if (!EXCLUSIVE_OPLOCK_TYPE(fsp->oplock_type)) {
126                 DEBUG(0, ("trying to downgrade an already-downgraded oplock!\n"));
127                 return;
128         }
129
130         if (koplocks) {
131                 koplocks->ops->release_oplock(koplocks, fsp, LEVEL_II_OPLOCK);
132         }
133         fsp->oplock_type = LEVEL_II_OPLOCK;
134         exclusive_oplocks_open--;
135         level_II_oplocks_open++;
136         fsp->sent_oplock_break = NO_BREAK_SENT;
137 }
138
139 /****************************************************************************
140  Remove a file oplock. Copes with level II and exclusive.
141  Locks then unlocks the share mode lock. Client can decide to go directly
142  to none even if a "break-to-level II" was sent.
143 ****************************************************************************/
144
145 bool remove_oplock(files_struct *fsp)
146 {
147         bool ret;
148         struct share_mode_lock *lck;
149
150         /* Remove the oplock flag from the sharemode. */
151         lck = get_share_mode_lock(talloc_tos(), fsp->file_id, NULL, NULL,
152                                   NULL);
153         if (lck == NULL) {
154                 DEBUG(0,("remove_oplock: failed to lock share entry for "
155                          "file %s\n", fsp->fsp_name ));
156                 return False;
157         }
158         ret = remove_share_oplock(lck, fsp);
159         if (!ret) {
160                 DEBUG(0,("remove_oplock: failed to remove share oplock for "
161                          "file %s fnum %d, %s\n",
162                          fsp->fsp_name, fsp->fnum, file_id_string_tos(&fsp->file_id)));
163         }
164         release_file_oplock(fsp);
165         TALLOC_FREE(lck);
166         return ret;
167 }
168
169 /*
170  * Deal with a reply when a break-to-level II was sent.
171  */
172 bool downgrade_oplock(files_struct *fsp)
173 {
174         bool ret;
175         struct share_mode_lock *lck;
176
177         lck = get_share_mode_lock(talloc_tos(), fsp->file_id, NULL, NULL,
178                                   NULL);
179         if (lck == NULL) {
180                 DEBUG(0,("downgrade_oplock: failed to lock share entry for "
181                          "file %s\n", fsp->fsp_name ));
182                 return False;
183         }
184         ret = downgrade_share_oplock(lck, fsp);
185         if (!ret) {
186                 DEBUG(0,("downgrade_oplock: failed to downgrade share oplock "
187                          "for file %s fnum %d, file_id %s\n",
188                          fsp->fsp_name, fsp->fnum, file_id_string_tos(&fsp->file_id)));
189         }
190
191         downgrade_file_oplock(fsp);
192         TALLOC_FREE(lck);
193         return ret;
194 }
195
196 /*
197  * Some kernel oplock implementations handle the notification themselves.
198  */
199 bool should_notify_deferred_opens()
200 {
201         return !(koplocks &&
202                 (koplocks->flags & KOPLOCKS_DEFERRED_OPEN_NOTIFICATION));
203 }
204
205 /****************************************************************************
206  Set up an oplock break message.
207 ****************************************************************************/
208
209 static char *new_break_smb_message(TALLOC_CTX *mem_ctx,
210                                    files_struct *fsp, uint8 cmd)
211 {
212         char *result = TALLOC_ARRAY(mem_ctx, char, smb_size + 8*2 + 0);
213
214         if (result == NULL) {
215                 DEBUG(0, ("talloc failed\n"));
216                 return NULL;
217         }
218
219         memset(result,'\0',smb_size);
220         srv_set_message(result,8,0,true);
221         SCVAL(result,smb_com,SMBlockingX);
222         SSVAL(result,smb_tid,fsp->conn->cnum);
223         SSVAL(result,smb_pid,0xFFFF);
224         SSVAL(result,smb_uid,0);
225         SSVAL(result,smb_mid,0xFFFF);
226         SCVAL(result,smb_vwv0,0xFF);
227         SSVAL(result,smb_vwv2,fsp->fnum);
228         SCVAL(result,smb_vwv3,LOCKING_ANDX_OPLOCK_RELEASE);
229         SCVAL(result,smb_vwv3+1,cmd);
230         return result;
231 }
232
/****************************************************************************
 Pause before a locally triggered break is sent to the client.

 Sleeps for the configured lp_oplock_break_wait_time() via smb_msleep();
 a configured value of zero means no pause at all.
****************************************************************************/

static void wait_before_sending_break(void)
{
        const long delay = (long)lp_oplock_break_wait_time();

        if (delay == 0) {
                return;
        }

        smb_msleep(delay);
}
245
246 /****************************************************************************
247  Ensure that we have a valid oplock.
248 ****************************************************************************/
249
250 static files_struct *initial_break_processing(struct file_id id, unsigned long file_id)
251 {
252         files_struct *fsp = NULL;
253
254         if( DEBUGLVL( 3 ) ) {
255                 dbgtext( "initial_break_processing: called for %s/%u\n",
256                          file_id_string_tos(&id), (int)file_id);
257                 dbgtext( "Current oplocks_open (exclusive = %d, levelII = %d)\n",
258                         exclusive_oplocks_open, level_II_oplocks_open );
259         }
260
261         /*
262          * We need to search the file open table for the
263          * entry containing this dev and inode, and ensure
264          * we have an oplock on it.
265          */
266
267         fsp = file_find_dif(id, file_id);
268
269         if(fsp == NULL) {
270                 /* The file could have been closed in the meantime - return success. */
271                 if( DEBUGLVL( 3 ) ) {
272                         dbgtext( "initial_break_processing: cannot find open file with " );
273                         dbgtext( "file_id %s gen_id = %lu", file_id_string_tos(&id), file_id);
274                         dbgtext( "allowing break to succeed.\n" );
275                 }
276                 return NULL;
277         }
278
279         /* Ensure we have an oplock on the file */
280
281         /*
282          * There is a potential race condition in that an oplock could
283          * have been broken due to another udp request, and yet there are
284          * still oplock break messages being sent in the udp message
285          * queue for this file. So return true if we don't have an oplock,
286          * as we may have just freed it.
287          */
288
289         if(fsp->oplock_type == NO_OPLOCK) {
290                 if( DEBUGLVL( 3 ) ) {
291                         dbgtext( "initial_break_processing: file %s ", fsp->fsp_name );
292                         dbgtext( "(file_id = %s gen_id = %lu) has no oplock.\n",
293                                  file_id_string_tos(&id), fsp->fh->gen_id );
294                         dbgtext( "Allowing break to succeed regardless.\n" );
295                 }
296                 return NULL;
297         }
298
299         return fsp;
300 }
301
302 static void oplock_timeout_handler(struct event_context *ctx,
303                                    struct timed_event *te,
304                                    struct timeval now,
305                                    void *private_data)
306 {
307         files_struct *fsp = (files_struct *)private_data;
308
309         /* Remove the timed event handler. */
310         TALLOC_FREE(fsp->oplock_timeout);
311         DEBUG(0, ("Oplock break failed for file %s -- replying anyway\n", fsp->fsp_name));
312         global_client_failed_oplock_break = True;
313         remove_oplock(fsp);
314         reply_to_oplock_break_requests(fsp);
315 }
316
317 /*******************************************************************
318  Add a timeout handler waiting for the client reply.
319 *******************************************************************/
320
321 static void add_oplock_timeout_handler(files_struct *fsp)
322 {
323         /*
324          * If kernel oplocks already notifies smbds when an oplock break times
325          * out, just return.
326          */
327         if (koplocks &&
328             (koplocks->flags & KOPLOCKS_TIMEOUT_NOTIFICATION)) {
329                 return;
330         }
331
332         if (fsp->oplock_timeout != NULL) {
333                 DEBUG(0, ("Logic problem -- have an oplock event hanging "
334                           "around\n"));
335         }
336
337         fsp->oplock_timeout =
338                 event_add_timed(smbd_event_context(), NULL,
339                                 timeval_current_ofs(OPLOCK_BREAK_TIMEOUT, 0),
340                                 oplock_timeout_handler, fsp);
341
342         if (fsp->oplock_timeout == NULL) {
343                 DEBUG(0, ("Could not add oplock timeout handler\n"));
344         }
345 }
346
347 /*******************************************************************
348  This handles the case of a write triggering a break to none
349  message on a level2 oplock.
350  When we get this message we may be in any of three states :
351  NO_OPLOCK, LEVEL_II, FAKE_LEVEL2. We only send a message to
352  the client for LEVEL2.
353 *******************************************************************/
354
355 void process_oplock_async_level2_break_message(struct messaging_context *msg_ctx,
356                                                       void *private_data,
357                                                       uint32_t msg_type,
358                                                       struct server_id src,
359                                                       DATA_BLOB *data)
360 {
361         struct share_mode_entry msg;
362         files_struct *fsp;
363         char *break_msg;
364
365         if (data->data == NULL) {
366                 DEBUG(0, ("Got NULL buffer\n"));
367                 return;
368         }
369
370         if (data->length != MSG_SMB_SHARE_MODE_ENTRY_SIZE) {
371                 DEBUG(0, ("Got invalid msg len %d\n", (int)data->length));
372                 return;
373         }
374
375         /* De-linearize incoming message. */
376         message_to_share_mode_entry(&msg, (char *)data->data);
377
378         DEBUG(10, ("Got oplock async level 2 break message from pid %s: "
379                    "%s/%lu\n", procid_str(debug_ctx(), &src),
380                    file_id_string_tos(&msg.id), msg.share_file_id));
381
382         fsp = initial_break_processing(msg.id, msg.share_file_id);
383
384         if (fsp == NULL) {
385                 /* We hit a race here. Break messages are sent, and before we
386                  * get to process this message, we have closed the file. 
387                  * No need to reply as this is an async message. */
388                 DEBUG(3, ("process_oplock_async_level2_break_message: Did not find fsp, ignoring\n"));
389                 return;
390         }
391
392         if (fsp->oplock_type == NO_OPLOCK) {
393                 /* We already got a "break to none" message and we've handled it.
394                  * just ignore. */
395                 DEBUG(3, ("process_oplock_async_level2_break_message: already broken to none, ignoring.\n"));
396                 return;
397         }
398
399         if (fsp->oplock_type == FAKE_LEVEL_II_OPLOCK) {
400                 /* Don't tell the client, just downgrade. */
401                 DEBUG(3, ("process_oplock_async_level2_break_message: downgrading fake level 2 oplock.\n"));
402                 remove_oplock(fsp);
403                 return;
404         }
405
406         /* Ensure we're really at level2 state. */
407         SMB_ASSERT(fsp->oplock_type == LEVEL_II_OPLOCK);
408
409         DEBUG(10,("process_oplock_async_level2_break_message: sending break to "
410                 "none message for fid %d, file %s\n",
411                 fsp->fnum,
412                 fsp->fsp_name));
413
414         /* Now send a break to none message to our client. */
415
416         break_msg = new_break_smb_message(NULL, fsp, OPLOCKLEVEL_NONE);
417         if (break_msg == NULL) {
418                 exit_server("Could not talloc break_msg\n");
419         }
420
421         /* Need to wait before sending a break message if we sent ourselves this message. */
422         if (procid_is_me(&src)) {
423                 wait_before_sending_break();
424         }
425
426         show_msg(break_msg);
427         if (!srv_send_smb(smbd_server_fd(),
428                         break_msg, false, 0,
429                         IS_CONN_ENCRYPTED(fsp->conn),
430                         NULL)) {
431                 exit_server_cleanly("oplock_break: srv_send_smb failed.");
432         }
433
434         TALLOC_FREE(break_msg);
435
436         /* Async level2 request, don't send a reply, just remove the oplock. */
437         remove_oplock(fsp);
438 }
439
440 /*******************************************************************
441  This handles the generic oplock break message from another smbd.
442 *******************************************************************/
443
444 static void process_oplock_break_message(struct messaging_context *msg_ctx,
445                                          void *private_data,
446                                          uint32_t msg_type,
447                                          struct server_id src,
448                                          DATA_BLOB *data)
449 {
450         struct share_mode_entry msg;
451         files_struct *fsp;
452         char *break_msg;
453         bool break_to_level2 = False;
454
455         if (data->data == NULL) {
456                 DEBUG(0, ("Got NULL buffer\n"));
457                 return;
458         }
459
460         if (data->length != MSG_SMB_SHARE_MODE_ENTRY_SIZE) {
461                 DEBUG(0, ("Got invalid msg len %d\n", (int)data->length));
462                 return;
463         }
464
465         /* De-linearize incoming message. */
466         message_to_share_mode_entry(&msg, (char *)data->data);
467
468         DEBUG(10, ("Got oplock break message from pid %s: %s/%lu\n",
469                    procid_str(debug_ctx(), &src), file_id_string_tos(&msg.id),
470                    msg.share_file_id));
471
472         fsp = initial_break_processing(msg.id, msg.share_file_id);
473
474         if (fsp == NULL) {
475                 /* a We hit race here. Break messages are sent, and before we
476                  * get to process this message, we have closed the file. Reply
477                  * with 'ok, oplock broken' */
478                 DEBUG(3, ("Did not find fsp\n"));
479
480                 /* We just send the same message back. */
481                 messaging_send_buf(msg_ctx, src, MSG_SMB_BREAK_RESPONSE,
482                                    (uint8 *)data->data,
483                                    MSG_SMB_SHARE_MODE_ENTRY_SIZE);
484                 return;
485         }
486
487         if (fsp->sent_oplock_break != NO_BREAK_SENT) {
488                 /* Remember we have to inform the requesting PID when the
489                  * client replies */
490                 msg.pid = src;
491                 ADD_TO_ARRAY(NULL, struct share_mode_entry, msg,
492                              &fsp->pending_break_messages,
493                              &fsp->num_pending_break_messages);
494                 return;
495         }
496
497         if (EXCLUSIVE_OPLOCK_TYPE(msg.op_type) &&
498             !EXCLUSIVE_OPLOCK_TYPE(fsp->oplock_type)) {
499                 DEBUG(3, ("Already downgraded oplock on %s: %s\n",
500                           file_id_string_tos(&fsp->file_id),
501                           fsp->fsp_name));
502                 /* We just send the same message back. */
503                 messaging_send_buf(msg_ctx, src, MSG_SMB_BREAK_RESPONSE,
504                                    (uint8 *)data->data,
505                                    MSG_SMB_SHARE_MODE_ENTRY_SIZE);
506                 return;
507         }
508
509         if ((global_client_caps & CAP_LEVEL_II_OPLOCKS) && 
510             !(msg.op_type & FORCE_OPLOCK_BREAK_TO_NONE) &&
511             !(koplocks && !(koplocks->flags & KOPLOCKS_LEVEL2_SUPPORTED)) &&
512             lp_level2_oplocks(SNUM(fsp->conn))) {
513                 break_to_level2 = True;
514         }
515
516         break_msg = new_break_smb_message(NULL, fsp, break_to_level2 ?
517                                           OPLOCKLEVEL_II : OPLOCKLEVEL_NONE);
518         if (break_msg == NULL) {
519                 exit_server("Could not talloc break_msg\n");
520         }
521
522         /* Need to wait before sending a break message if we sent ourselves this message. */
523         if (procid_is_me(&src)) {
524                 wait_before_sending_break();
525         }
526
527         show_msg(break_msg);
528         if (!srv_send_smb(smbd_server_fd(),
529                         break_msg, false, 0,
530                         IS_CONN_ENCRYPTED(fsp->conn),
531                         NULL)) {
532                 exit_server_cleanly("oplock_break: srv_send_smb failed.");
533         }
534
535         TALLOC_FREE(break_msg);
536
537         fsp->sent_oplock_break = break_to_level2 ? LEVEL_II_BREAK_SENT:BREAK_TO_NONE_SENT;
538
539         msg.pid = src;
540         ADD_TO_ARRAY(NULL, struct share_mode_entry, msg,
541                      &fsp->pending_break_messages,
542                      &fsp->num_pending_break_messages);
543
544         add_oplock_timeout_handler(fsp);
545 }
546
547 /*******************************************************************
548  This handles the kernel oplock break message.
549 *******************************************************************/
550
551 static void process_kernel_oplock_break(struct messaging_context *msg_ctx,
552                                         void *private_data,
553                                         uint32_t msg_type,
554                                         struct server_id src,
555                                         DATA_BLOB *data)
556 {
557         struct file_id id;
558         unsigned long file_id;
559         files_struct *fsp;
560         char *break_msg;
561
562         if (data->data == NULL) {
563                 DEBUG(0, ("Got NULL buffer\n"));
564                 return;
565         }
566
567         if (data->length != MSG_SMB_KERNEL_BREAK_SIZE) {
568                 DEBUG(0, ("Got invalid msg len %d\n", (int)data->length));
569                 return;
570         }
571
572         /* Pull the data from the message. */
573         pull_file_id_24((char *)data->data, &id);
574         file_id = (unsigned long)IVAL(data->data, 24);
575
576         DEBUG(10, ("Got kernel oplock break message from pid %s: %s/%u\n",
577                    procid_str(debug_ctx(), &src), file_id_string_tos(&id),
578                    (unsigned int)file_id));
579
580         fsp = initial_break_processing(id, file_id);
581
582         if (fsp == NULL) {
583                 DEBUG(3, ("Got a kernel oplock break message for a file "
584                           "I don't know about\n"));
585                 return;
586         }
587
588         if (fsp->sent_oplock_break != NO_BREAK_SENT) {
589                 /* This is ok, kernel oplocks come in completely async */
590                 DEBUG(3, ("Got a kernel oplock request while waiting for a "
591                           "break reply\n"));
592                 return;
593         }
594
595         break_msg = new_break_smb_message(NULL, fsp, OPLOCKLEVEL_NONE);
596         if (break_msg == NULL) {
597                 exit_server("Could not talloc break_msg\n");
598         }
599
600         show_msg(break_msg);
601         if (!srv_send_smb(smbd_server_fd(),
602                         break_msg, false, 0,
603                         IS_CONN_ENCRYPTED(fsp->conn),
604                         NULL)) {
605                 exit_server_cleanly("oplock_break: srv_send_smb failed.");
606         }
607
608         TALLOC_FREE(break_msg);
609
610         fsp->sent_oplock_break = BREAK_TO_NONE_SENT;
611
612         add_oplock_timeout_handler(fsp);
613 }
614
615 void reply_to_oplock_break_requests(files_struct *fsp)
616 {
617         int i;
618
619         /*
620          * If kernel oplocks already notifies smbds when oplocks are
621          * broken/removed, just return.
622          */
623         if (koplocks &&
624             (koplocks->flags & KOPLOCKS_OPLOCK_BROKEN_NOTIFICATION)) {
625                 return;
626         }
627
628         for (i=0; i<fsp->num_pending_break_messages; i++) {
629                 struct share_mode_entry *e = &fsp->pending_break_messages[i];
630                 char msg[MSG_SMB_SHARE_MODE_ENTRY_SIZE];
631
632                 share_mode_entry_to_message(msg, e);
633
634                 messaging_send_buf(smbd_messaging_context(), e->pid,
635                                    MSG_SMB_BREAK_RESPONSE,
636                                    (uint8 *)msg,
637                                    MSG_SMB_SHARE_MODE_ENTRY_SIZE);
638         }
639
640         SAFE_FREE(fsp->pending_break_messages);
641         fsp->num_pending_break_messages = 0;
642         if (fsp->oplock_timeout != NULL) {
643                 /* Remove the timed event handler. */
644                 TALLOC_FREE(fsp->oplock_timeout);
645                 fsp->oplock_timeout = NULL;
646         }
647         return;
648 }
649
650 static void process_oplock_break_response(struct messaging_context *msg_ctx,
651                                           void *private_data,
652                                           uint32_t msg_type,
653                                           struct server_id src,
654                                           DATA_BLOB *data)
655 {
656         struct share_mode_entry msg;
657
658         if (data->data == NULL) {
659                 DEBUG(0, ("Got NULL buffer\n"));
660                 return;
661         }
662
663         if (data->length != MSG_SMB_SHARE_MODE_ENTRY_SIZE) {
664                 DEBUG(0, ("Got invalid msg len %u\n",
665                           (unsigned int)data->length));
666                 return;
667         }
668
669         /* De-linearize incoming message. */
670         message_to_share_mode_entry(&msg, (char *)data->data);
671
672         DEBUG(10, ("Got oplock break response from pid %s: %s/%lu mid %u\n",
673                    procid_str(debug_ctx(), &src), file_id_string_tos(&msg.id),
674                    msg.share_file_id, (unsigned int)msg.op_mid));
675
676         /* Here's the hack from open.c, store the mid in the 'port' field */
677         schedule_deferred_open_smb_message(msg.op_mid);
678 }
679
680 static void process_open_retry_message(struct messaging_context *msg_ctx,
681                                        void *private_data,
682                                        uint32_t msg_type,
683                                        struct server_id src,
684                                        DATA_BLOB *data)
685 {
686         struct share_mode_entry msg;
687         
688         if (data->data == NULL) {
689                 DEBUG(0, ("Got NULL buffer\n"));
690                 return;
691         }
692
693         if (data->length != MSG_SMB_SHARE_MODE_ENTRY_SIZE) {
694                 DEBUG(0, ("Got invalid msg len %d\n", (int)data->length));
695                 return;
696         }
697
698         /* De-linearize incoming message. */
699         message_to_share_mode_entry(&msg, (char *)data->data);
700
701         DEBUG(10, ("Got open retry msg from pid %s: %s mid %u\n",
702                    procid_str(debug_ctx(), &src), file_id_string_tos(&msg.id),
703                    (unsigned int)msg.op_mid));
704
705         schedule_deferred_open_smb_message(msg.op_mid);
706 }
707
708 /****************************************************************************
709  This function is called on any file modification or lock request. If a file
710  is level 2 oplocked then it must tell all other level 2 holders to break to
711  none.
712 ****************************************************************************/
713
714 static void contend_level2_oplocks_begin_default(files_struct *fsp,
715                                               enum level2_contention_type type)
716 {
717         int i;
718         struct share_mode_lock *lck;
719
720         /*
721          * If this file is level II oplocked then we need
722          * to grab the shared memory lock and inform all
723          * other files with a level II lock that they need
724          * to flush their read caches. We keep the lock over
725          * the shared memory area whilst doing this.
726          */
727
728         if (!LEVEL_II_OPLOCK_TYPE(fsp->oplock_type))
729                 return;
730
731         lck = get_share_mode_lock(talloc_tos(), fsp->file_id, NULL, NULL,
732                                   NULL);
733         if (lck == NULL) {
734                 DEBUG(0,("release_level_2_oplocks_on_change: failed to lock "
735                          "share mode entry for file %s.\n", fsp->fsp_name ));
736                 return;
737         }
738
739         DEBUG(10,("release_level_2_oplocks_on_change: num_share_modes = %d\n", 
740                   lck->num_share_modes ));
741
742         for(i = 0; i < lck->num_share_modes; i++) {
743                 struct share_mode_entry *share_entry = &lck->share_modes[i];
744                 char msg[MSG_SMB_SHARE_MODE_ENTRY_SIZE];
745
746                 if (!is_valid_share_mode_entry(share_entry)) {
747                         continue;
748                 }
749
750                 /*
751                  * As there could have been multiple writes waiting at the
752                  * lock_share_entry gate we may not be the first to
753                  * enter. Hence the state of the op_types in the share mode
754                  * entries may be partly NO_OPLOCK and partly LEVEL_II or FAKE_LEVEL_II
755                  * oplock. It will do no harm to re-send break messages to
756                  * those smbd's that are still waiting their turn to remove
757                  * their LEVEL_II state, and also no harm to ignore existing
758                  * NO_OPLOCK states. JRA.
759                  */
760
761                 DEBUG(10,("release_level_2_oplocks_on_change: "
762                           "share_entry[%i]->op_type == %d\n",
763                           i, share_entry->op_type ));
764
765                 if (share_entry->op_type == NO_OPLOCK) {
766                         continue;
767                 }
768
769                 /* Paranoia .... */
770                 if (EXCLUSIVE_OPLOCK_TYPE(share_entry->op_type)) {
771                         DEBUG(0,("release_level_2_oplocks_on_change: PANIC. "
772                                  "share mode entry %d is an exlusive "
773                                  "oplock !\n", i ));
774                         TALLOC_FREE(lck);
775                         abort();
776                 }
777
778                 share_mode_entry_to_message(msg, share_entry);
779
780                 /*
781                  * Deal with a race condition when breaking level2
782                  * oplocks. Don't send all the messages and release
783                  * the lock, this allows someone else to come in and
784                  * get a level2 lock before any of the messages are
785                  * processed, and thus miss getting a break message.
786                  * Ensure at least one entry (the one we're breaking)
787                  * is processed immediately under the lock and becomes
788                  * set as NO_OPLOCK to stop any waiter getting a level2.
789                  * Bugid #5980.
790                  */
791
792                 if (procid_is_me(&share_entry->pid)) {
793                         DATA_BLOB blob = data_blob_const(msg,
794                                         MSG_SMB_SHARE_MODE_ENTRY_SIZE);
795                         process_oplock_async_level2_break_message(smbd_messaging_context(),
796                                                 NULL,
797                                                 MSG_SMB_ASYNC_LEVEL2_BREAK,
798                                                 share_entry->pid,
799                                                 &blob);
800                 } else {
801                         messaging_send_buf(smbd_messaging_context(),
802                                         share_entry->pid,
803                                         MSG_SMB_ASYNC_LEVEL2_BREAK,
804                                         (uint8 *)msg,
805                                         MSG_SMB_SHARE_MODE_ENTRY_SIZE);
806                 }
807         }
808
809         /* We let the message receivers handle removing the oplock state
810            in the share mode lock db. */
811
812         TALLOC_FREE(lck);
813 }
814
815 void contend_level2_oplocks_begin(files_struct *fsp,
816                                   enum level2_contention_type type)
817 {
818         if (koplocks && koplocks->ops->contend_level2_oplocks_begin) {
819                 koplocks->ops->contend_level2_oplocks_begin(fsp, type);
820                 return;
821         }
822
823         contend_level2_oplocks_begin_default(fsp, type);
824 }
825
826 void contend_level2_oplocks_end(files_struct *fsp,
827                                 enum level2_contention_type type)
828 {
829         /* Only kernel oplocks implement this so far */
830         if (koplocks && koplocks->ops->contend_level2_oplocks_end) {
831                 koplocks->ops->contend_level2_oplocks_end(fsp, type);
832         }
833 }
834
835 /****************************************************************************
836  Linearize a share mode entry struct to an internal oplock break message.
837 ****************************************************************************/
838
839 void share_mode_entry_to_message(char *msg, const struct share_mode_entry *e)
840 {
841         SIVAL(msg,0,(uint32)e->pid.pid);
842         SSVAL(msg,4,e->op_mid);
843         SSVAL(msg,6,e->op_type);
844         SIVAL(msg,8,e->access_mask);
845         SIVAL(msg,12,e->share_access);
846         SIVAL(msg,16,e->private_options);
847         SIVAL(msg,20,(uint32)e->time.tv_sec);
848         SIVAL(msg,24,(uint32)e->time.tv_usec);
849         push_file_id_24(msg+28, &e->id);
850         SIVAL(msg,52,e->share_file_id);
851         SIVAL(msg,56,e->uid);
852         SSVAL(msg,60,e->flags);
853 #ifdef CLUSTER_SUPPORT
854         SIVAL(msg,62,e->pid.vnn);
855 #endif
856 }
857
858 /****************************************************************************
859  De-linearize an internal oplock break message to a share mode entry struct.
860 ****************************************************************************/
861
862 void message_to_share_mode_entry(struct share_mode_entry *e, char *msg)
863 {
864         e->pid.pid = (pid_t)IVAL(msg,0);
865         e->op_mid = SVAL(msg,4);
866         e->op_type = SVAL(msg,6);
867         e->access_mask = IVAL(msg,8);
868         e->share_access = IVAL(msg,12);
869         e->private_options = IVAL(msg,16);
870         e->time.tv_sec = (time_t)IVAL(msg,20);
871         e->time.tv_usec = (int)IVAL(msg,24);
872         pull_file_id_24(msg+28, &e->id);
873         e->share_file_id = (unsigned long)IVAL(msg,52);
874         e->uid = (uint32)IVAL(msg,56);
875         e->flags = (uint16)SVAL(msg,60);
876 #ifdef CLUSTER_SUPPORT
877         e->pid.vnn = IVAL(msg,62);
878 #endif
879 }
880
881 /****************************************************************************
882  Setup oplocks for this process.
883 ****************************************************************************/
884
885 bool init_oplocks(struct messaging_context *msg_ctx)
886 {
887         DEBUG(3,("init_oplocks: initializing messages.\n"));
888
889         messaging_register(msg_ctx, NULL, MSG_SMB_BREAK_REQUEST,
890                            process_oplock_break_message);
891         messaging_register(msg_ctx, NULL, MSG_SMB_ASYNC_LEVEL2_BREAK,
892                            process_oplock_async_level2_break_message);
893         messaging_register(msg_ctx, NULL, MSG_SMB_BREAK_RESPONSE,
894                            process_oplock_break_response);
895         messaging_register(msg_ctx, NULL, MSG_SMB_KERNEL_BREAK,
896                            process_kernel_oplock_break);
897         messaging_register(msg_ctx, NULL, MSG_SMB_OPEN_RETRY,
898                            process_open_retry_message);
899
900         if (lp_kernel_oplocks()) {
901 #if HAVE_KERNEL_OPLOCKS_IRIX
902                 koplocks = irix_init_kernel_oplocks(talloc_autofree_context());
903 #elif HAVE_KERNEL_OPLOCKS_LINUX
904                 koplocks = linux_init_kernel_oplocks(talloc_autofree_context());
905 #elif HAVE_ONEFS
906                 koplocks = onefs_init_kernel_oplocks(talloc_autofree_context());
907 #endif
908         }
909
910         return True;
911 }