From boyang - ensure we never "return" from a forked child, always _exit().
[jra/samba/.git] / source3 / winbindd / winbindd_cm.c
index adb631b57b85b930ac6fee5b9c3d2ff9f25e446a..962b6e6d1b7257c768fb40fafaf5beec18cee5e6 100644 (file)
@@ -8,17 +8,17 @@
    Copyright (C) Gerald (Jerry) Carter     2003-2005.
    Copyright (C) Volker Lendecke           2004-2005
    Copyright (C) Jeremy Allison                   2006
-   
+
    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 3 of the License, or
    (at your option) any later version.
-   
+
    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.         See the
    GNU General Public License for more details.
-   
+
    You should have received a copy of the GNU General Public License
    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */
    We need to manage connections to domain controllers without having to
    mess up the main winbindd code with other issues.  The aim of the
    connection manager is to:
-  
+
        - make connections to domain controllers and cache them
        - re-establish connections when networks or servers go down
        - centralise the policy on connection timeouts, domain controller
         selection etc
        - manage re-entrancy for when winbindd becomes able to handle
         multiple outstanding rpc requests
-  
+
    Why not have connection management as part of the rpc layer like tng?
    Good question.  This code may morph into libsmb/rpc_cache.c or something
    like that but at the moment it's simply staying as part of winbind. I
@@ -171,20 +171,34 @@ static bool fork_child_dc_connect(struct winbindd_domain *domain)
        struct dc_name_ip *dcs = NULL;
        int num_dcs = 0;
        TALLOC_CTX *mem_ctx = NULL;
-       pid_t child_pid;
        pid_t parent_pid = sys_getpid();
+       char *lfile = NULL;
 
        /* Stop zombies */
        CatchChild();
 
-       child_pid = sys_fork();
+       if (domain->dc_probe_pid != (pid_t)-1) {
+               /*
+                * We might already have a DC probe
+                * child working, check.
+                */
+               if (process_exists_by_pid(domain->dc_probe_pid)) {
+                       DEBUG(10,("fork_child_dc_connect: pid %u already "
+                               "checking for DC's.\n",
+                               (unsigned int)domain->dc_probe_pid));
+                       return true;
+               }
+               domain->dc_probe_pid = (pid_t)-1;
+       }
 
-       if (child_pid == -1) {
+       domain->dc_probe_pid = sys_fork();
+
+       if (domain->dc_probe_pid == (pid_t)-1) {
                DEBUG(0, ("fork_child_dc_connect: Could not fork: %s\n", strerror(errno)));
                return False;
        }
 
-       if (child_pid != 0) {
+       if (domain->dc_probe_pid != (pid_t)0) {
                /* Parent */
                messaging_register(winbind_messaging_context(), NULL,
                                   MSG_WINBIND_TRY_TO_GO_ONLINE,
@@ -199,27 +213,32 @@ static bool fork_child_dc_connect(struct winbindd_domain *domain)
 
        /* Leave messages blocked - we will never process one. */
 
-       /* tdb needs special fork handling */
-       if (tdb_reopen_all(1) == -1) {
-               DEBUG(0,("tdb_reopen_all failed.\n"));
-               _exit(0);
-       }
-
-       close_conns_after_fork();
-
        if (!override_logfile) {
-               char *logfile;
-               if (asprintf(&logfile, "%s/log.winbindd-dc-connect", get_dyn_LOGFILEBASE()) > 0) {
-                       lp_set_logfile(logfile);
-                       SAFE_FREE(logfile);
-                       reopen_logs();
+               if (asprintf(&lfile, "%s/log.winbindd-dc-connect", get_dyn_LOGFILEBASE()) == -1) {
+                       DEBUG(0, ("fork_child_dc_connect: out of memory.\n"));
+                       _exit(1);
                }
        }
 
+       if (!winbindd_reinit_after_fork(lfile)) {
+               messaging_send_buf(winbind_messaging_context(),
+                                  pid_to_procid(parent_pid),
+                                  MSG_WINBIND_FAILED_TO_GO_ONLINE,
+                                  (uint8 *)domain->name,
+                                  strlen(domain->name)+1);
+               _exit(1);
+       }
+       SAFE_FREE(lfile);
+
        mem_ctx = talloc_init("fork_child_dc_connect");
        if (!mem_ctx) {
                DEBUG(0,("talloc_init failed.\n"));
-               _exit(0);
+               messaging_send_buf(winbind_messaging_context(),
+                                  pid_to_procid(parent_pid),
+                                  MSG_WINBIND_FAILED_TO_GO_ONLINE,
+                                  (uint8 *)domain->name,
+                                  strlen(domain->name)+1);
+               _exit(1);
        }
 
        if ((!get_dcs(mem_ctx, domain, &dcs, &num_dcs)) || (num_dcs == 0)) {
@@ -249,7 +268,7 @@ static bool fork_child_dc_connect(struct winbindd_domain *domain)
 
 static void check_domain_online_handler(struct event_context *ctx,
                                        struct timed_event *te,
-                                       const struct timeval *now,
+                                       struct timeval now,
                                        void *private_data)
 {
         struct winbindd_domain *domain =
@@ -263,7 +282,7 @@ static void check_domain_online_handler(struct event_context *ctx,
 
        /* Are we still in "startup" mode ? */
 
-       if (domain->startup && (now->tv_sec > domain->startup_time + 30)) {
+       if (domain->startup && (now.tv_sec > domain->startup_time + 30)) {
                /* No longer in "startup" mode. */
                DEBUG(10,("check_domain_online_handler: domain %s no longer in 'startup' mode.\n",
                        domain->name ));
@@ -292,12 +311,12 @@ static void check_domain_online_handler(struct event_context *ctx,
 
 static void calc_new_online_timeout_check(struct winbindd_domain *domain)
 {
-       int wbc = lp_winbind_cache_time();
+       int wbr = lp_winbind_reconnect_delay();
 
        if (domain->startup) {
                domain->check_online_timeout = 10;
-       } else if (domain->check_online_timeout < wbc) {
-               domain->check_online_timeout = wbc;
+       } else if (domain->check_online_timeout < wbr) {
+               domain->check_online_timeout = wbr;
        }
 }
 
@@ -337,14 +356,13 @@ void set_domain_offline(struct winbindd_domain *domain)
        }
 
        /* If we're in statup mode, check again in 10 seconds, not in
-          lp_winbind_cache_time() seconds (which is 5 mins by default). */
+          lp_winbind_reconnect_delay() seconds (which is 30 seconds by default). */
 
        calc_new_online_timeout_check(domain);
 
        domain->check_online_event = event_add_timed(winbind_event_context(),
                                                NULL,
                                                timeval_current_ofs(domain->check_online_timeout,0),
-                                               "check_domain_online_handler",
                                                check_domain_online_handler,
                                                domain);
 
@@ -361,7 +379,7 @@ void set_domain_offline(struct winbindd_domain *domain)
 
        if ( domain->primary ) {
                struct winbindd_child *idmap = idmap_child();
-               
+
                if ( idmap->pid != 0 ) {
                        messaging_send_buf(winbind_messaging_context(),
                                           pid_to_procid(idmap->pid), 
@@ -380,8 +398,6 @@ void set_domain_offline(struct winbindd_domain *domain)
 
 static void set_domain_online(struct winbindd_domain *domain)
 {
-       struct timeval now;
-
        DEBUG(10,("set_domain_online: called for domain %s\n",
                domain->name ));
 
@@ -400,9 +416,7 @@ static void set_domain_online(struct winbindd_domain *domain)
        winbindd_set_locator_kdc_envs(domain);
 
        /* If we are waiting to get a krb5 ticket, trigger immediately. */
-       GetTimeOfDay(&now);
-       set_event_dispatch_time(winbind_event_context(),
-                               "krb5_ticket_gain_handler", now);
+       ccache_regain_all_now();
 
        /* Ok, we're out of any startup mode now... */
        domain->startup = False;
@@ -440,7 +454,7 @@ static void set_domain_online(struct winbindd_domain *domain)
 
        if ( domain->primary ) {
                struct winbindd_child *idmap = idmap_child();
-               
+
                if ( idmap->pid != 0 ) {
                        messaging_send_buf(winbind_messaging_context(),
                                           pid_to_procid(idmap->pid), 
@@ -475,6 +489,15 @@ void set_domain_online_request(struct winbindd_domain *domain)
           because network manager seems to lie.
           Wait at least 5 seconds. Heuristics suck... */
 
+
+       GetTimeOfDay(&tev);
+
+       /* Go into "startup" mode again. */
+       domain->startup_time = tev.tv_sec;
+       domain->startup = True;
+
+       tev.tv_sec += 5;
+
        if (!domain->check_online_event) {
                /* If we've come from being globally offline we
                   don't have a check online event handler set.
@@ -483,29 +506,20 @@ void set_domain_online_request(struct winbindd_domain *domain)
 
                DEBUG(10,("set_domain_online_request: domain %s was globally offline.\n",
                        domain->name ));
-
-               domain->check_online_event = event_add_timed(winbind_event_context(),
-                                                               NULL,
-                                                               timeval_current_ofs(5, 0),
-                                                               "check_domain_online_handler",
-                                                               check_domain_online_handler,
-                                                               domain);
-
-               /* The above *has* to succeed for winbindd to work. */
-               if (!domain->check_online_event) {
-                       smb_panic("set_domain_online_request: failed to add online handler");
-               }
        }
 
-       GetTimeOfDay(&tev);
-
-       /* Go into "startup" mode again. */
-       domain->startup_time = tev.tv_sec;
-       domain->startup = True;
+       TALLOC_FREE(domain->check_online_event);
 
-       tev.tv_sec += 5;
+       domain->check_online_event = event_add_timed(winbind_event_context(),
+                                                    NULL,
+                                                    tev,
+                                                    check_domain_online_handler,
+                                                    domain);
 
-       set_event_dispatch_time(winbind_event_context(), "check_domain_online_handler", tev);
+       /* The above *has* to succeed for winbindd to work. */
+       if (!domain->check_online_event) {
+               smb_panic("set_domain_online_request: failed to add online handler");
+       }
 }
 
 /****************************************************************
@@ -531,7 +545,7 @@ void winbind_add_failed_connection_entry(const struct winbindd_domain *domain,
    an authenticated connection if DCs have the RestrictAnonymous registry
    entry set > 0, or the "Additional restrictions for anonymous
    connections" set in the win2k Local Security Policy. 
-   
+
    Caller to free() result in domain, username, password
 */
 
@@ -540,12 +554,12 @@ static void cm_get_ipc_userpass(char **username, char **domain, char **password)
        *username = (char *)secrets_fetch(SECRETS_AUTH_USER, NULL);
        *domain = (char *)secrets_fetch(SECRETS_AUTH_DOMAIN, NULL);
        *password = (char *)secrets_fetch(SECRETS_AUTH_PASSWORD, NULL);
-       
+
        if (*username && **username) {
 
                if (!*domain || !**domain)
                        *domain = smb_xstrdup(lp_workgroup());
-               
+
                if (!*password || !**password)
                        *password = smb_xstrdup("");
 
@@ -599,7 +613,7 @@ static bool get_dc_name_via_netlogon(struct winbindd_domain *domain,
        /* This call can take a long time - allow the server to time out.
           35 seconds should do it. */
 
-       orig_timeout = cli_set_timeout(netlogon_pipe->cli, 35000);
+       orig_timeout = rpccli_set_timeout(netlogon_pipe, 35000);
 
        if (our_domain->active_directory) {
                struct netr_DsRGetDCNameInfo *domain_info = NULL;
@@ -639,7 +653,7 @@ static bool get_dc_name_via_netlogon(struct winbindd_domain *domain,
        }
 
        /* And restore our original timeout. */
-       cli_set_timeout(netlogon_pipe->cli, orig_timeout);
+       rpccli_set_timeout(netlogon_pipe, orig_timeout);
 
        if (!NT_STATUS_IS_OK(result)) {
                DEBUG(10,("rpccli_netr_GetAnyDCName failed: %s\n",
@@ -650,19 +664,13 @@ static bool get_dc_name_via_netlogon(struct winbindd_domain *domain,
 
        if (!W_ERROR_IS_OK(werr)) {
                DEBUG(10,("rpccli_netr_GetAnyDCName failed: %s\n",
-                          dos_errstr(werr)));
+                          win_errstr(werr)));
                talloc_destroy(mem_ctx);
                return false;
        }
 
        /* rpccli_netr_GetAnyDCName gives us a name with \\ */
-       p = tmp;
-       if (*p == '\\') {
-               p+=1;
-       }
-       if (*p == '\\') {
-               p+=1;
-       }
+       p = strip_hostname(tmp);
 
        fstrcpy(dcname, p);
 
@@ -687,7 +695,7 @@ static NTSTATUS get_trust_creds(const struct winbindd_domain *domain,
 {
        const char *account_name;
        const char *name = NULL;
-       
+
        /* If we are a DC and this is not our own domain */
 
        if (IS_DC) {
@@ -697,10 +705,10 @@ static NTSTATUS get_trust_creds(const struct winbindd_domain *domain,
 
                if (!our_domain)
                        return NT_STATUS_INVALID_SERVER_STATE;          
-               
+
                name = our_domain->name;                
        }       
-       
+
        if (!get_trust_pw_clear(name, machine_password,
                                &account_name, NULL))
        {
@@ -713,12 +721,18 @@ static NTSTATUS get_trust_creds(const struct winbindd_domain *domain,
                return NT_STATUS_NO_MEMORY;
        }
 
-       /* this is at least correct when domain is our domain,
-        * which is the only case, when this is currently used: */
+       /* For now assume our machine account only exists in our domain */
+
        if (machine_krb5_principal != NULL)
        {
+               struct winbindd_domain *our_domain = find_our_domain();
+
+               if (!our_domain) {
+                       return NT_STATUS_CANT_ACCESS_DOMAIN_INFO;                       
+               }
+
                if (asprintf(machine_krb5_principal, "%s$@%s",
-                            account_name, domain->alt_name) == -1)
+                            account_name, our_domain->alt_name) == -1)
                {
                        return NT_STATUS_NO_MEMORY;
                }
@@ -809,13 +823,14 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
 
        cli_setup_signing_state(*cli, Undefined);
 
-       if (!cli_negprot(*cli)) {
-               DEBUG(1, ("cli_negprot failed\n"));
-               result = NT_STATUS_UNSUCCESSFUL;
+       result = cli_negprot(*cli);
+
+       if (!NT_STATUS_IS_OK(result)) {
+               DEBUG(1, ("cli_negprot failed: %s\n", nt_errstr(result)));
                goto done;
        }
 
-       if (!is_trusted_domain_situation(domain->name) &&
+       if (!is_dc_trusted_domain_situation(domain->name) &&
            (*cli)->protocol >= PROTOCOL_NT1 &&
            (*cli)->capabilities & CAP_EXTENDED_SECURITY)
        {
@@ -834,14 +849,15 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
 
                        (*cli)->use_kerberos = True;
                        DEBUG(5, ("connecting to %s from %s with kerberos principal "
-                                 "[%s]\n", controller, global_myname(),
-                                 machine_krb5_principal));
+                                 "[%s] and realm [%s]\n", controller, global_myname(),
+                                 machine_krb5_principal, domain->alt_name));
 
                        winbindd_set_locator_kdc_envs(domain);
 
                        ads_status = cli_session_setup_spnego(*cli,
                                                              machine_krb5_principal, 
-                                                             machine_password, 
+                                                             machine_password,
+                                                             lp_workgroup(),
                                                              domain->name);
 
                        if (!ADS_ERR_OK(ads_status)) {
@@ -852,7 +868,7 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
                        result = ads_ntstatus(ads_status);
                        if (NT_STATUS_IS_OK(result)) {
                                /* Ensure creds are stored for NTLMSSP authenticated pipe access. */
-                               cli_init_creds(*cli, machine_account, domain->name, machine_password);
+                               cli_init_creds(*cli, machine_account, lp_workgroup(), machine_password);
                                goto session_setup_done;
                        }
                }
@@ -862,12 +878,13 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
 
                DEBUG(5, ("connecting to %s from %s with username "
                          "[%s]\\[%s]\n",  controller, global_myname(),
-                         domain->name, machine_account));
+                         lp_workgroup(), machine_account));
 
                ads_status = cli_session_setup_spnego(*cli,
                                                      machine_account, 
                                                      machine_password, 
-                                                     domain->name);
+                                                     lp_workgroup(),
+                                                     NULL);
                if (!ADS_ERR_OK(ads_status)) {
                        DEBUG(4, ("authenticated session setup failed with %s\n",
                                ads_errstr(ads_status)));
@@ -876,7 +893,7 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
                result = ads_ntstatus(ads_status);
                if (NT_STATUS_IS_OK(result)) {
                        /* Ensure creds are stored for NTLMSSP authenticated pipe access. */
-                       cli_init_creds(*cli, machine_account, domain->name, machine_password);
+                       cli_init_creds(*cli, machine_account, lp_workgroup(), machine_password);
                        goto session_setup_done;
                }
        }
@@ -913,6 +930,9 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
  anon_fallback:
 
        /* Fall back to anonymous connection, this might fail later */
+       DEBUG(10,("cm_prepare_connection: falling back to anonymous "
+               "connection for DC %s\n",
+               controller ));
 
        if (NT_STATUS_IS_OK(cli_session_setup(*cli, "", NULL, 0,
                                              NULL, 0, ""))) {
@@ -983,15 +1003,37 @@ static NTSTATUS cm_prepare_connection(const struct winbindd_domain *domain,
        return result;
 }
 
+/*******************************************************************
+ Add a dcname and sockaddr_storage pair to the end of a dc_name_ip
+ array.
+
+ Keeps the list unique by not adding duplicate entries.
+
+ @param[in] mem_ctx talloc memory context to allocate from
+ @param[in] domain_name domain of the DC
+ @param[in] dcname name of the DC to add to the list
+ @param[in] pss Internet address and port pair to add to the list
+ @param[in,out] dcs array of dc_name_ip structures to add to
+ @param[in,out] num number of entries currently in the dcs array
+ @return true if the list was added to, false otherwise
+*******************************************************************/
+
 static bool add_one_dc_unique(TALLOC_CTX *mem_ctx, const char *domain_name,
                              const char *dcname, struct sockaddr_storage *pss,
                              struct dc_name_ip **dcs, int *num)
 {
+       int i = 0;
+
        if (!NT_STATUS_IS_OK(check_negative_conn_cache(domain_name, dcname))) {
                DEBUG(10, ("DC %s was in the negative conn cache\n", dcname));
                return False;
        }
 
+       /* Make sure there's no duplicates in the list */
+       for (i=0; i<*num; i++)
+               if (sockaddr_equal((struct sockaddr *)&(*dcs)[i].ss, (struct sockaddr *)pss))
+                       return False;
+
        *dcs = TALLOC_REALLOC_ARRAY(mem_ctx, *dcs, struct dc_name_ip, (*num)+1);
 
        if (*dcs == NULL)
@@ -1015,7 +1057,7 @@ static bool add_sockaddr_to_array(TALLOC_CTX *mem_ctx,
        }
 
        (*addrs)[*num] = *pss;
-       set_sockaddr_port(&(*addrs)[*num], port);
+       set_sockaddr_port((struct sockaddr *)&(*addrs)[*num], port);
 
        *num += 1;
        return True;
@@ -1025,11 +1067,13 @@ static bool add_sockaddr_to_array(TALLOC_CTX *mem_ctx,
  convert an ip to a name
 *******************************************************************/
 
-static bool dcip_to_name(const struct winbindd_domain *domain,
+static bool dcip_to_name(TALLOC_CTX *mem_ctx,
+               const struct winbindd_domain *domain,
                struct sockaddr_storage *pss,
                fstring name )
 {
        struct ip_service ip_list;
+       uint32_t nt_version = NETLOGON_NT_VERSION_1;
 
        ip_list.ss = *pss;
        ip_list.port = 0;
@@ -1040,21 +1084,23 @@ static bool dcip_to_name(const struct winbindd_domain *domain,
 
        if (lp_security() == SEC_ADS) {
                ADS_STRUCT *ads;
+               ADS_STATUS ads_status;
                char addr[INET6_ADDRSTRLEN];
 
                print_sockaddr(addr, sizeof(addr), pss);
 
-               ads = ads_init(domain->alt_name, domain->name, NULL);
+               ads = ads_init(domain->alt_name, domain->name, addr);
                ads->auth.flags |= ADS_AUTH_NO_BIND;
 
-               if (ads_try_connect(ads, addr)) {
+               ads_status = ads_connect(ads);
+               if (ADS_ERR_OK(ads_status)) {
                        /* We got a cldap packet. */
                        fstrcpy(name, ads->config.ldap_server_name);
                        namecache_store(name, 0x20, 1, &ip_list);
 
                        DEBUG(10,("dcip_to_name: flags = 0x%x\n", (unsigned int)ads->config.flags));
 
-                       if (domain->primary && (ads->config.flags & ADS_KDC)) {
+                       if (domain->primary && (ads->config.flags & NBT_SERVER_KDC)) {
                                if (ads_closest_dc(ads)) {
                                        char *sitename = sitename_fetch(ads->config.realm);
 
@@ -1092,12 +1138,17 @@ static bool dcip_to_name(const struct winbindd_domain *domain,
 
        /* try GETDC requests next */
 
-       if (send_getdc_request(winbind_messaging_context(),
-                              pss, domain->name, &domain->sid)) {
+       if (send_getdc_request(mem_ctx, winbind_messaging_context(),
+                              pss, domain->name, &domain->sid,
+                              nt_version)) {
+               const char *dc_name = NULL;
                int i;
                smb_msleep(100);
                for (i=0; i<5; i++) {
-                       if (receive_getdc_response(pss, domain->name, name)) {
+                       if (receive_getdc_response(mem_ctx, pss, domain->name,
+                                                  &nt_version,
+                                                  &dc_name, NULL)) {
+                               fstrcpy(name, dc_name);
                                namecache_store(name, 0x20, 1, &ip_list);
                                return True;
                        }
@@ -1115,8 +1166,15 @@ static bool dcip_to_name(const struct winbindd_domain *domain,
 }
 
 /*******************************************************************
- Retreive a list of IP address for domain controllers.  Fill in 
- the dcs[]  with results.
+ Retrieve a list of IP addresses for domain controllers.
+
+ The array is sorted in the preferred connection order.
+
+ @param[in] mem_ctx talloc memory context to allocate from
+ @param[in] domain domain to retrieve DCs for
+ @param[out] dcs array of dcs that will be returned
+ @param[out] num_dcs number of dcs returned in the dcs array
+ @return always true
 *******************************************************************/
 
 static bool get_dcs(TALLOC_CTX *mem_ctx, struct winbindd_domain *domain,
@@ -1132,9 +1190,11 @@ static bool get_dcs(TALLOC_CTX *mem_ctx, struct winbindd_domain *domain,
 
        is_our_domain = strequal(domain->name, lp_workgroup());
 
+       /* If not our domain, get the preferred DC, by asking our primary DC */
        if ( !is_our_domain
                && get_dc_name_via_netlogon(domain, dcname, &ss)
-               && add_one_dc_unique(mem_ctx, domain->name, dcname, &ss, dcs, num_dcs) )
+               && add_one_dc_unique(mem_ctx, domain->name, dcname, &ss, dcs,
+                      num_dcs) )
        {
                char addr[INET6_ADDRSTRLEN];
                print_sockaddr(addr, sizeof(addr), &ss);
@@ -1161,8 +1221,13 @@ static bool get_dcs(TALLOC_CTX *mem_ctx, struct winbindd_domain *domain,
                if (sitename) {
 
                        /* Do the site-specific AD dns lookup first. */
-                       get_sorted_dc_list(domain->alt_name, sitename, &ip_list, &iplist_size, True);
+                       get_sorted_dc_list(domain->alt_name, sitename, &ip_list,
+                              &iplist_size, True);
 
+                       /* Add ips to the DC array.  We don't look up the name
+                          of the DC in this function, but we fill in the char*
+                          of the ip now to make the failed connection cache
+                          work */
                        for ( i=0; i<iplist_size; i++ ) {
                                char addr[INET6_ADDRSTRLEN];
                                print_sockaddr(addr, sizeof(addr),
@@ -1180,8 +1245,9 @@ static bool get_dcs(TALLOC_CTX *mem_ctx, struct winbindd_domain *domain,
                        iplist_size = 0;
                }
 
-               /* Now we add DCs from the main AD dns lookup. */
-               get_sorted_dc_list(domain->alt_name, NULL, &ip_list, &iplist_size, True);
+               /* Now we add DCs from the main AD DNS lookup. */
+               get_sorted_dc_list(domain->alt_name, NULL, &ip_list,
+                       &iplist_size, True);
 
                for ( i=0; i<iplist_size; i++ ) {
                        char addr[INET6_ADDRSTRLEN];
@@ -1194,33 +1260,46 @@ static bool get_dcs(TALLOC_CTX *mem_ctx, struct winbindd_domain *domain,
                                        dcs,
                                        num_dcs);
                }
-        }
-
-       /* try standard netbios queries if no ADS */
 
-       if (iplist_size==0) {
-               get_sorted_dc_list(domain->name, NULL, &ip_list, &iplist_size, False);
-       }
+               SAFE_FREE(ip_list);
+               iplist_size = 0;
+        }
 
-       /* FIXME!! this is where we should re-insert the GETDC requests --jerry */
+       /* Try standard netbios queries if no ADS */
+       if (*num_dcs == 0) {
+               get_sorted_dc_list(domain->name, NULL, &ip_list, &iplist_size,
+                      False);
 
-       /* now add to the dc array.  We'll wait until the last minute 
-          to look up the name of the DC.  But we fill in the char* for 
-          the ip now in to make the failed connection cache work */
+               for ( i=0; i<iplist_size; i++ ) {
+                       char addr[INET6_ADDRSTRLEN];
+                       print_sockaddr(addr, sizeof(addr),
+                                       &ip_list[i].ss);
+                       add_one_dc_unique(mem_ctx,
+                                       domain->name,
+                                       addr,
+                                       &ip_list[i].ss,
+                                       dcs,
+                                       num_dcs);
+               }
 
-       for ( i=0; i<iplist_size; i++ ) {
-               char addr[INET6_ADDRSTRLEN];
-               print_sockaddr(addr, sizeof(addr),
-                               &ip_list[i].ss);
-               add_one_dc_unique(mem_ctx, domain->name, addr,
-                       &ip_list[i].ss, dcs, num_dcs);
+               SAFE_FREE(ip_list);
+               iplist_size = 0;
        }
 
-       SAFE_FREE( ip_list );
-
        return True;
 }
 
+/*******************************************************************
+ Find and make a connection to a DC in the given domain.
+
+ @param[in] mem_ctx talloc memory context to allocate from
+ @param[in] domain domain to find a dc in
+ @param[out] dcname NetBIOS or FQDN of DC that's connected to
+ @param[out] pss DC Internet address and port
+ @param[out] fd fd of the open socket connected to the newly found dc
+ @return true when a DC connection is made, false otherwise
+*******************************************************************/
+
 static bool find_new_dc(TALLOC_CTX *mem_ctx,
                        struct winbindd_domain *domain,
                        fstring dcname, struct sockaddr_storage *pss, int *fd)
@@ -1236,6 +1315,8 @@ static bool find_new_dc(TALLOC_CTX *mem_ctx,
 
        int i, fd_index;
 
+       *fd = -1;
+
  again:
        if (!get_dcs(mem_ctx, domain, &dcs, &num_dcs) || (num_dcs == 0))
                return False;
@@ -1290,13 +1371,27 @@ static bool find_new_dc(TALLOC_CTX *mem_ctx,
        }
 
        /* Try to figure out the name */
-       if (dcip_to_name(domain, pss, dcname)) {
+       if (dcip_to_name(mem_ctx, domain, pss, dcname)) {
                return True;
        }
 
        /* We can not continue without the DC's name */
        winbind_add_failed_connection_entry(domain, dcs[fd_index].name,
                                    NT_STATUS_UNSUCCESSFUL);
+
+       /* Throw away all arrays as we're doing this again. */
+       TALLOC_FREE(dcs);
+       num_dcs = 0;
+
+       TALLOC_FREE(dcnames);
+       num_dcnames = 0;
+
+       TALLOC_FREE(addrs);
+       num_addrs = 0;
+
+       close(*fd);
+       *fd = -1;
+
        goto again;
 }
 
@@ -1316,7 +1411,7 @@ static NTSTATUS cm_open_connection(struct winbindd_domain *domain,
 
        /* we have to check the server affinity cache here since 
           later we selecte a DC based on response time and not preference */
-          
+
        /* Check the negative connection cache
           before talking to it. It going down may have
           triggered the reconnection. */
@@ -1335,7 +1430,7 @@ static NTSTATUS cm_open_connection(struct winbindd_domain *domain,
                                                AI_NUMERICHOST)) {
                                return NT_STATUS_UNSUCCESSFUL;
                        }
-                       if (dcip_to_name( domain, &ss, saf_name )) {
+                       if (dcip_to_name(mem_ctx, domain, &ss, saf_name )) {
                                fstrcpy( domain->dcname, saf_name );
                        } else {
                                winbind_add_failed_connection_entry(
@@ -1433,33 +1528,27 @@ void invalidate_cm_connection(struct winbindd_cm_conn *conn)
        }
 
        if (conn->samr_pipe != NULL) {
-               if (!cli_rpc_pipe_close(conn->samr_pipe)) {
-                       /* Ok, it must be dead. Drop timeout to 0.5 sec. */
-                       if (conn->cli) {
-                               cli_set_timeout(conn->cli, 500);
-                       }
+               TALLOC_FREE(conn->samr_pipe);
+               /* Ok, it must be dead. Drop timeout to 0.5 sec. */
+               if (conn->cli) {
+                       cli_set_timeout(conn->cli, 500);
                }
-               conn->samr_pipe = NULL;
        }
 
        if (conn->lsa_pipe != NULL) {
-               if (!cli_rpc_pipe_close(conn->lsa_pipe)) {
-                       /* Ok, it must be dead. Drop timeout to 0.5 sec. */
-                       if (conn->cli) {
-                               cli_set_timeout(conn->cli, 500);
-                       }
+               TALLOC_FREE(conn->lsa_pipe);
+               /* Ok, it must be dead. Drop timeout to 0.5 sec. */
+               if (conn->cli) {
+                       cli_set_timeout(conn->cli, 500);
                }
-               conn->lsa_pipe = NULL;
        }
 
        if (conn->netlogon_pipe != NULL) {
-               if (!cli_rpc_pipe_close(conn->netlogon_pipe)) {
-                       /* Ok, it must be dead. Drop timeout to 0.5 sec. */
-                       if (conn->cli) {
-                               cli_set_timeout(conn->cli, 500);
-                       }
+               TALLOC_FREE(conn->netlogon_pipe);
+               /* Ok, it must be dead. Drop timeout to 0.5 sec. */
+               if (conn->cli) {
+                       cli_set_timeout(conn->cli, 500);
                }
-               conn->netlogon_pipe = NULL;
        }
 
        if (conn->cli) {
@@ -1572,26 +1661,26 @@ static bool set_dc_type_and_flags_trustinfo( struct winbindd_domain *domain )
        TALLOC_CTX *mem_ctx = NULL;
 
        DEBUG(5, ("set_dc_type_and_flags_trustinfo: domain %s\n", domain->name ));
-       
+
        /* Our primary domain doesn't need to worry about trust flags.
           Force it to go through the network setup */
        if ( domain->primary ) {                
                return False;           
        }
-       
+
        our_domain = find_our_domain();
-       
+
        if ( !connection_ok(our_domain) ) {
                DEBUG(3,("set_dc_type_and_flags_trustinfo: No connection to our domain!\n"));           
                return False;
        }
 
        /* This won't work unless our domain is AD */
-        
+
        if ( !our_domain->active_directory ) {
                return False;
        }
-       
+
        /* Use DsEnumerateDomainTrusts to get us the trust direction
           and type */
 
@@ -1610,7 +1699,7 @@ static bool set_dc_type_and_flags_trustinfo( struct winbindd_domain *domain )
        }       
 
        result = rpccli_netr_DsrEnumerateDomainTrusts(cli, mem_ctx,
-                                                     cli->cli->desthost,
+                                                     cli->desthost,
                                                      flags,
                                                      &trusts,
                                                      NULL);
@@ -1652,13 +1741,13 @@ static bool set_dc_type_and_flags_trustinfo( struct winbindd_domain *domain )
 
                        if ( !winbindd_can_contact_domain( domain) )
                                domain->internal = True;
-                       
+
                        break;
                }               
        }
-       
+
        talloc_destroy( mem_ctx );
-       
+
        return domain->initialized;     
 }
 
@@ -1693,10 +1782,11 @@ static void set_dc_type_and_flags_connect( struct winbindd_domain *domain )
 
        DEBUG(5, ("set_dc_type_and_flags_connect: domain %s\n", domain->name ));
 
-       cli = cli_rpc_pipe_open_noauth(domain->conn.cli, PI_DSSETUP,
-                                      &result);
+       result = cli_rpc_pipe_open_noauth(domain->conn.cli,
+                                         &ndr_table_dssetup.syntax_id,
+                                         &cli);
 
-       if (cli == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(5, ("set_dc_type_and_flags_connect: Could not bind to "
                          "PI_DSSETUP on domain %s: (%s)\n",
                          domain->name, nt_errstr(result)));
@@ -1712,7 +1802,7 @@ static void set_dc_type_and_flags_connect( struct winbindd_domain *domain )
                                                                  DS_ROLE_BASIC_INFORMATION,
                                                                  &info,
                                                                  &werr);
-       cli_rpc_pipe_close(cli);
+       TALLOC_FREE(cli);
 
        if (!NT_STATUS_IS_OK(result)) {
                DEBUG(5, ("set_dc_type_and_flags_connect: rpccli_ds_getprimarydominfo "
@@ -1740,20 +1830,21 @@ static void set_dc_type_and_flags_connect( struct winbindd_domain *domain )
        }
 
 no_dssetup:
-       cli = cli_rpc_pipe_open_noauth(domain->conn.cli, PI_LSARPC, &result);
+       result = cli_rpc_pipe_open_noauth(domain->conn.cli,
+                                         &ndr_table_lsarpc.syntax_id, &cli);
 
-       if (cli == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(5, ("set_dc_type_and_flags_connect: Could not bind to "
                          "PI_LSARPC on domain %s: (%s)\n",
                          domain->name, nt_errstr(result)));
-               cli_rpc_pipe_close(cli);
+               TALLOC_FREE(cli);
                TALLOC_FREE(mem_ctx);
                return;
        }
 
        result = rpccli_lsa_open_policy2(cli, mem_ctx, True, 
                                         SEC_RIGHTS_MAXIMUM_ALLOWED, &pol);
-               
+
        if (NT_STATUS_IS_OK(result)) {
                /* This particular query is exactly what Win2k clients use 
                   to determine that the DC is active directory */
@@ -1826,7 +1917,7 @@ done:
        DEBUG(5,("set_dc_type_and_flags_connect: domain %s is %srunning active directory.\n",
                  domain->name, domain->active_directory ? "" : "NOT "));
 
-       cli_rpc_pipe_close(cli);
+       TALLOC_FREE(cli);
 
        TALLOC_FREE(mem_ctx);
 
@@ -1882,6 +1973,10 @@ static bool cm_get_schannel_dcinfo(struct winbindd_domain *domain,
        /* Return a pointer to the struct dcinfo from the
           netlogon pipe. */
 
+       if (!domain->conn.netlogon_pipe->dc) {
+               return false;
+       }
+
        *ppdc = domain->conn.netlogon_pipe->dc;
        return True;
 }
@@ -1908,6 +2003,7 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
                goto done;
        }
 
+
        /*
         * No SAMR pipe yet. Attempt to get an NTLMSSP SPNEGO authenticated
         * sign and sealed pipe using the machine account password by
@@ -1941,14 +2037,15 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
 
        /* We have an authenticated connection. Use a NTLMSSP SPNEGO
           authenticated SAMR pipe with sign & seal. */
-       conn->samr_pipe =
-               cli_rpc_pipe_open_spnego_ntlmssp(conn->cli, PI_SAMR,
-                                                PIPE_AUTH_LEVEL_PRIVACY,
-                                                domain_name,
-                                                machine_account,
-                                                machine_password, &result);
-
-       if (conn->samr_pipe == NULL) {
+       result = cli_rpc_pipe_open_spnego_ntlmssp(conn->cli,
+                                                 &ndr_table_samr.syntax_id,
+                                                 PIPE_AUTH_LEVEL_PRIVACY,
+                                                 domain_name,
+                                                 machine_account,
+                                                 machine_password,
+                                                 &conn->samr_pipe);
+
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(10,("cm_connect_sam: failed to connect to SAMR "
                          "pipe for domain %s using NTLMSSP "
                          "authenticated pipe: user %s\\%s. Error was "
@@ -1963,7 +2060,7 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
                  domain_name, machine_account));
 
        result = rpccli_samr_Connect2(conn->samr_pipe, mem_ctx,
-                                     conn->samr_pipe->cli->desthost,
+                                     conn->samr_pipe->desthost,
                                      SEC_RIGHTS_MAXIMUM_ALLOWED,
                                      &conn->sam_connect_handle);
        if (NT_STATUS_IS_OK(result)) {
@@ -1972,7 +2069,7 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
        DEBUG(10,("cm_connect_sam: ntlmssp-sealed rpccli_samr_Connect2 "
                  "failed for domain %s, error was %s. Trying schannel\n",
                  domain->name, nt_errstr(result) ));
-       cli_rpc_pipe_close(conn->samr_pipe);
+       TALLOC_FREE(conn->samr_pipe);
 
  schannel:
 
@@ -1984,11 +2081,11 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
                           "for domain %s, trying anon\n", domain->name));
                goto anonymous;
        }
-       conn->samr_pipe = cli_rpc_pipe_open_schannel_with_key
-               (conn->cli, PI_SAMR, PIPE_AUTH_LEVEL_PRIVACY,
-                domain->name, p_dcinfo, &result);
+       result = cli_rpc_pipe_open_schannel_with_key
+               (conn->cli, &ndr_table_samr.syntax_id, PIPE_AUTH_LEVEL_PRIVACY,
+                domain->name, p_dcinfo, &conn->samr_pipe);
 
-       if (conn->samr_pipe == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(10,("cm_connect_sam: failed to connect to SAMR pipe for "
                          "domain %s using schannel. Error was %s\n",
                          domain->name, nt_errstr(result) ));
@@ -1998,7 +2095,7 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
                  "schannel.\n", domain->name ));
 
        result = rpccli_samr_Connect2(conn->samr_pipe, mem_ctx,
-                                     conn->samr_pipe->cli->desthost,
+                                     conn->samr_pipe->desthost,
                                      SEC_RIGHTS_MAXIMUM_ALLOWED,
                                      &conn->sam_connect_handle);
        if (NT_STATUS_IS_OK(result)) {
@@ -2007,21 +2104,20 @@ NTSTATUS cm_connect_sam(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
        DEBUG(10,("cm_connect_sam: schannel-sealed rpccli_samr_Connect2 failed "
                  "for domain %s, error was %s. Trying anonymous\n",
                  domain->name, nt_errstr(result) ));
-       cli_rpc_pipe_close(conn->samr_pipe);
+       TALLOC_FREE(conn->samr_pipe);
 
  anonymous:
 
        /* Finally fall back to anonymous. */
-       conn->samr_pipe = cli_rpc_pipe_open_noauth(conn->cli, PI_SAMR,
-                                                  &result);
+       result = cli_rpc_pipe_open_noauth(conn->cli, &ndr_table_samr.syntax_id,
+                                         &conn->samr_pipe);
 
-       if (conn->samr_pipe == NULL) {
-               result = NT_STATUS_PIPE_NOT_AVAILABLE;
+       if (!NT_STATUS_IS_OK(result)) {
                goto done;
        }
 
        result = rpccli_samr_Connect2(conn->samr_pipe, mem_ctx,
-                                     conn->samr_pipe->cli->desthost,
+                                     conn->samr_pipe->desthost,
                                      SEC_RIGHTS_MAXIMUM_ALLOWED,
                                      &conn->sam_connect_handle);
        if (!NT_STATUS_IS_OK(result)) {
@@ -2082,11 +2178,13 @@ NTSTATUS cm_connect_lsa(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
 
        /* We have an authenticated connection. Use a NTLMSSP SPNEGO
         * authenticated LSA pipe with sign & seal. */
-       conn->lsa_pipe = cli_rpc_pipe_open_spnego_ntlmssp
-               (conn->cli, PI_LSARPC, PIPE_AUTH_LEVEL_PRIVACY,
-                conn->cli->domain, conn->cli->user_name, conn_pwd, &result);
+       result = cli_rpc_pipe_open_spnego_ntlmssp
+               (conn->cli, &ndr_table_lsarpc.syntax_id,
+                PIPE_AUTH_LEVEL_PRIVACY,
+                conn->cli->domain, conn->cli->user_name, conn_pwd,
+                &conn->lsa_pipe);
 
-       if (conn->lsa_pipe == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(10,("cm_connect_lsa: failed to connect to LSA pipe for "
                          "domain %s using NTLMSSP authenticated pipe: user "
                          "%s\\%s. Error was %s. Trying schannel.\n",
@@ -2109,7 +2207,7 @@ NTSTATUS cm_connect_lsa(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
        DEBUG(10,("cm_connect_lsa: rpccli_lsa_open_policy failed, trying "
                  "schannel\n"));
 
-       cli_rpc_pipe_close(conn->lsa_pipe);
+       TALLOC_FREE(conn->lsa_pipe);
 
  schannel:
 
@@ -2121,11 +2219,12 @@ NTSTATUS cm_connect_lsa(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
                           "for domain %s, trying anon\n", domain->name));
                goto anonymous;
        }
-       conn->lsa_pipe = cli_rpc_pipe_open_schannel_with_key
-               (conn->cli, PI_LSARPC, PIPE_AUTH_LEVEL_PRIVACY,
-                domain->name, p_dcinfo, &result);
+       result = cli_rpc_pipe_open_schannel_with_key
+               (conn->cli, &ndr_table_lsarpc.syntax_id,
+                PIPE_AUTH_LEVEL_PRIVACY,
+                domain->name, p_dcinfo, &conn->lsa_pipe);
 
-       if (conn->lsa_pipe == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(10,("cm_connect_lsa: failed to connect to LSA pipe for "
                          "domain %s using schannel. Error was %s\n",
                          domain->name, nt_errstr(result) ));
@@ -2144,13 +2243,14 @@ NTSTATUS cm_connect_lsa(struct winbindd_domain *domain, TALLOC_CTX *mem_ctx,
        DEBUG(10,("cm_connect_lsa: rpccli_lsa_open_policy failed, trying "
                  "anonymous\n"));
 
-       cli_rpc_pipe_close(conn->lsa_pipe);
+       TALLOC_FREE(conn->lsa_pipe);
 
  anonymous:
 
-       conn->lsa_pipe = cli_rpc_pipe_open_noauth(conn->cli, PI_LSARPC,
-                                                 &result);
-       if (conn->lsa_pipe == NULL) {
+       result = cli_rpc_pipe_open_noauth(conn->cli,
+                                         &ndr_table_lsarpc.syntax_id,
+                                         &conn->lsa_pipe);
+       if (!NT_STATUS_IS_OK(result)) {
                result = NT_STATUS_PIPE_NOT_AVAILABLE;
                goto done;
        }
@@ -2200,9 +2300,10 @@ NTSTATUS cm_connect_netlogon(struct winbindd_domain *domain,
                return NT_STATUS_OK;
        }
 
-       netlogon_pipe = cli_rpc_pipe_open_noauth(conn->cli, PI_NETLOGON,
-                                                &result);
-       if (netlogon_pipe == NULL) {
+       result = cli_rpc_pipe_open_noauth(conn->cli,
+                                         &ndr_table_netlogon.syntax_id,
+                                         &netlogon_pipe);
+       if (!NT_STATUS_IS_OK(result)) {
                return result;
        }
 
@@ -2219,7 +2320,7 @@ NTSTATUS cm_connect_netlogon(struct winbindd_domain *domain,
        if (!get_trust_pw_hash(domain->name, mach_pwd, &account_name,
                               &sec_chan_type))
        {
-               cli_rpc_pipe_close(netlogon_pipe);
+               TALLOC_FREE(netlogon_pipe);
                return NT_STATUS_CANT_ACCESS_DOMAIN_INFO;
        }
 
@@ -2234,14 +2335,14 @@ NTSTATUS cm_connect_netlogon(struct winbindd_domain *domain,
                 &neg_flags);
 
        if (!NT_STATUS_IS_OK(result)) {
-               cli_rpc_pipe_close(netlogon_pipe);
+               TALLOC_FREE(netlogon_pipe);
                return result;
        }
 
        if ((lp_client_schannel() == True) &&
                        ((neg_flags & NETLOGON_NEG_SCHANNEL) == 0)) {
                DEBUG(3, ("Server did not offer schannel\n"));
-               cli_rpc_pipe_close(netlogon_pipe);
+               TALLOC_FREE(netlogon_pipe);
                return NT_STATUS_ACCESS_DENIED;
        }
 
@@ -2265,21 +2366,18 @@ NTSTATUS cm_connect_netlogon(struct winbindd_domain *domain,
           part of the new pipe auth struct.
        */
 
-       conn->netlogon_pipe =
-               cli_rpc_pipe_open_schannel_with_key(conn->cli,
-                                                   PI_NETLOGON,
-                                                   PIPE_AUTH_LEVEL_PRIVACY,
-                                                   domain->name,
-                                                   netlogon_pipe->dc,
-                                                   &result);
+       result = cli_rpc_pipe_open_schannel_with_key(
+               conn->cli, &ndr_table_netlogon.syntax_id,
+               PIPE_AUTH_LEVEL_PRIVACY, domain->name, netlogon_pipe->dc,
+               &conn->netlogon_pipe);
 
        /* We can now close the initial netlogon pipe. */
-       cli_rpc_pipe_close(netlogon_pipe);
+       TALLOC_FREE(netlogon_pipe);
 
-       if (conn->netlogon_pipe == NULL) {
+       if (!NT_STATUS_IS_OK(result)) {
                DEBUG(3, ("Could not open schannel'ed NETLOGON pipe. Error "
                          "was %s\n", nt_errstr(result)));
-                         
+
                /* make sure we return something besides OK */
                return !NT_STATUS_IS_OK(result) ? result : NT_STATUS_PIPE_NOT_AVAILABLE;
        }