Merge with 0.5
[prosody.git] / core / s2smanager.lua
1 -- Prosody IM
2 -- Copyright (C) 2008-2009 Matthew Wild
3 -- Copyright (C) 2008-2009 Waqas Hussain
4 -- 
5 -- This project is MIT/X11 licensed. Please see the
6 -- COPYING file in the source package for more information.
7 --
8
9
10
11 local hosts = hosts;
12 local sessions = sessions;
13 local core_process_stanza = function(a, b) core_process_stanza(a, b); end
14 local add_task = require "util.timer".add_task;
15 local socket = require "socket";
16 local format = string.format;
17 local t_insert, t_sort = table.insert, table.sort;
18 local get_traceback = debug.traceback;
19 local tostring, pairs, ipairs, getmetatable, newproxy, error, tonumber
20     = tostring, pairs, ipairs, getmetatable, newproxy, error, tonumber;
21
22 local idna_to_ascii = require "util.encodings".idna.to_ascii;
23 local connlisteners_get = require "net.connlisteners".get;
24 local wrapclient = require "net.server".wrapclient;
25 local modulemanager = require "core.modulemanager";
26 local st = require "stanza";
27 local stanza = st.stanza;
28 local nameprep = require "util.encodings".stringprep.nameprep;
29
30 local uuid_gen = require "util.uuid".generate;
31
32 local logger_init = require "util.logger".init;
33
34 local log = logger_init("s2smanager");
35
36 local sha256_hash = require "util.hashes".sha256;
37
38 local dialback_secret = uuid_gen();
39
40 local adns = require "net.adns";
41
42 local dns_timeout = config.get("*", "core", "dns_timeout") or 60;
43
44 incoming_s2s = {};
45 local incoming_s2s = incoming_s2s;
46
47 module "s2smanager"
48
--- Ordering function for SRV records, intended for use with table.sort.
-- A record with a lower `priority` value sorts first. The `weight` field is
-- only consulted when both priorities are equal, in which case the record
-- with the larger weight sorts first (RFC 2782 gives larger weights a higher
-- chance of selection).
-- Comparing weight only on a priority tie keeps this a valid strict ordering:
-- it never reports both a < b and b < a for the same pair.
-- @param a SRV record table with numeric `priority` and `weight` fields
-- @param b SRV record table with numeric `priority` and `weight` fields
-- @return true if `a` should be tried before `b`
local function compare_srv_priorities(a, b)
	if a.priority ~= b.priority then
		return a.priority < b.priority;
	end
	return a.weight > b.weight;
end
50
--- Send error replies for every stanza still queued on a failed outgoing session.
-- Each queue entry is a pair { serialized_stanza, reply_stanza }; only the
-- reply (index 2) is used here. Replies whose xmlns is absent, "jabber:client"
-- or "jabber:server" are turned into a "remote-server-not-found" error and
-- handed to core_process_stanza. The queue is emptied and removed from the
-- session afterwards.
-- @param session the outgoing session whose `sendq` should be bounced
local function bounce_sendq(session)
	local sendq = session.sendq;
	if not sendq then
		return;
	end

	session.log("info", "sending error replies for "..#sendq.." queued stanzas because of failed outgoing connection to "..tostring(session.to_host));

	-- Stand-in origin for the error replies. Nothing should ever reply to an
	-- error reply, so its send() only logs a traceback.
	local dummy = {
		type = "s2sin";
		send = function(s)
			(session.log or log)("error", "Replying to an s2s error reply, please report this! Traceback: %s", get_traceback());
		end;
		dummy = true;
	};

	for i, data in ipairs(sendq) do
		local reply = data[2];
		local xmlns = reply.attr.xmlns;
		if not xmlns or xmlns == "jabber:client" or xmlns == "jabber:server" then
			reply.attr.type = "error";
			reply:tag("error", {type = "cancel"})
				:tag("remote-server-not-found", {xmlns = "urn:ietf:params:xml:ns:xmpp-stanzas"}):up();
			core_process_stanza(dummy, reply);
		end
		sendq[i] = nil;
	end
	session.sendq = nil;
end
76
--- Deliver a stanza from one of our hosts to a remote host.
-- If no outgoing session exists yet, one is created and the stanza is queued
-- on it. If a session exists but is still unauthenticated, the stanza is
-- queued (starting dialback first when it has not begun). Otherwise the
-- stanza is written straight to the session.
-- Queue entries are pairs { serialized_stanza, reply_stanza }.
-- @param from_host name of the local host the stanza is sent from
-- @param to_host name of the remote host
-- @param data the stanza to send
function send_to_host(from_host, to_host, data)
	local session = hosts[from_host].s2sout[to_host];

	if not session then
		log("debug", "opening a new outgoing connection for this stanza");
		local new_session = new_outgoing(from_host, to_host);
		-- Hold the stanza until the connection is usable
		new_session.sendq = { {tostring(data), st.reply(data)} };
		log("debug", "stanza [%s] queued until connection complete", tostring(data.name));
		local in_progress = new_session.connecting or new_session.conn;
		if not in_progress then
			log("warn", "Connection to %s failed already, destroying session...", to_host);
			destroy_session(new_session);
		end
		return;
	end

	-- A session for this host pair already exists.
	-- NOTE(review): bounce_sendq reads the namespace from attr.xmlns, while
	-- this test reads data.xmlns; confirm which field is intended.
	if session.type == "s2sout_unauthed"
	and data.name ~= "db:verify"
	and ((not data.xmlns) or data.xmlns == "jabber:client" or data.xmlns == "jabber:server") then
		(session.log or log)("debug", "trying to send over unauthed s2sout to "..to_host);
		if not session.notopen and not session.dialback_key and session.sends2s then
			session.log("debug", "dialback had not been initiated");
			initiate_dialback(session);
		end

		-- Queue stanza until we are able to send it
		local entry = {tostring(data), st.reply(data)};
		if session.sendq then
			t_insert(session.sendq, entry);
		else
			session.sendq = { entry };
		end
		session.log("debug", "stanza [%s] queued ", data.name);
		return;
	end

	if session.type == "local" or session.type == "component" then
		log("error", "Trying to send a stanza to ourselves??")
		log("error", "Traceback: %s", get_traceback());
		log("error", "Stanza: %s", tostring(data));
		return;
	end

	(session.log or log)("debug", "going to send stanza to "..to_host.." from "..from_host);
	-- FIXME
	if session.from_host ~= from_host then
		log("error", "WARNING! This might, possibly, be a bug, but it might not...");
		log("error", "We are going to send from %s instead of %s", tostring(session.from_host), tostring(from_host));
	end
	session.sends2s(data);
	session.log("debug", "stanza sent over "..session.type);
end
118
119 local open_sessions = 0;
120
--- Create the session object for a newly accepted incoming s2s connection.
-- The session starts as "s2sin_unauthed", is registered in incoming_s2s, and
-- gets its own logger plus a sends2s() writer bound to the connection.
-- @param conn the connection object; its `write` field is used for output
-- @return the new session table
function new_incoming(conn)
	local session = { conn = conn, type = "s2sin_unauthed", direction = "incoming", hosts = {} };

	-- The proxy's __gc handler decrements the counter when the session's
	-- trace object is collected.
	session.trace = newproxy(true);
	getmetatable(session.trace).__gc = function () open_sessions = open_sessions - 1; end;
	open_sessions = open_sessions + 1;

	-- Name the logger after the trailing hex digits of the connection's
	-- string form. %x accepts either letter case, and the fallback avoids
	-- concatenating nil when there is no such suffix at all.
	local conn_id = tostring(conn):match("%x+$") or "";
	local w, log = conn.write, logger_init("s2sin"..conn_id);
	session.log = log;
	session.sends2s = function (t) log("debug", "sending: %s", tostring(t)); w(tostring(t)); end
	incoming_s2s[session] = true;
	return session;
end
134
--- Create and register an outgoing s2s session, then start connecting.
-- The session is stored in hosts[from_host].s2sout[to_host] before the first
-- connection attempt. If no sends2s() has been installed once that attempt
-- returns, a buffering sends2s() is installed which collects data in
-- session.send_buffer.
-- @param from_host name of the local host
-- @param to_host name of the remote host
-- @return the new session table
function new_outgoing(from_host, to_host)
	local session = {
		to_host = to_host;
		from_host = from_host;
		notopen = true;
		type = "s2sout_unauthed";
		direction = "outgoing";
	};
	hosts[from_host].s2sout[to_host] = session;

	-- Per-session logger, named after the table's address suffix
	local suffix = tostring(session):match("[a-f0-9]*$");
	local log = logger_init("s2sout"..suffix);
	session.log = log;

	-- This is the first call, can't fail (the first step is DNS lookup)
	attempt_connection(session);

	if session.sends2s then
		return session;
	end

	-- A sends2s which buffers data (until the stream is opened).
	-- Note that data in this buffer will be sent before the stream is
	-- authed and will not be ack'd in any way, successful or otherwise.
	local pending;
	session.sends2s = function (data)
		if not pending then
			pending = {};
			session.send_buffer = pending;
		end
		log("debug", "Buffering data on unconnected s2sout to %s", to_host);
		pending[#pending+1] = data;
		log("debug", "Buffered item %d: %s", #pending, tostring(data));
	end

	return session;
end
168
169
--- Start, or continue, trying to connect an outgoing session.
-- Without `err` this is the first attempt: an SRV lookup is issued and the
-- connection continues from its callback. With `err` (the reason the previous
-- attempt failed) the next SRV record, if any, is tried.
-- @param host_session the outgoing session
-- @param err nil on the first attempt, otherwise the previous failure reason
-- @return true when the SRV lookup was started; false when there is nothing
--         (left) to try; otherwise whatever try_connect returns
function attempt_connection(host_session, err)
	local to_host = host_session.to_host;
	local connect_host, connect_port = idna_to_ascii(to_host), 5269;
	
	if not err then -- This is our first attempt
		if not connect_host then
			-- Without an ASCII form of the hostname we cannot even build the
			-- SRV query name; bail out instead of concatenating nil below.
			log("warn", "Unable to convert %s to an ASCII hostname, giving up", tostring(to_host));
			return false;
		end
		
		log("debug", "First attempt to connect to %s, starting with SRV lookup...", to_host);
		host_session.connecting = true;
		local handle;
		handle = adns.lookup(function (answer)
			handle = nil;
			host_session.connecting = nil;
			if answer then
				log("debug", to_host.." has SRV records, handling...");
				local srv_hosts = {};
				host_session.srv_hosts = srv_hosts;
				for _, record in ipairs(answer) do
					t_insert(srv_hosts, record.srv);
				end
				t_sort(srv_hosts, compare_srv_priorities);
				
				local srv_choice = srv_hosts[1];
				host_session.srv_choice = 1;
				if srv_choice then
					connect_host, connect_port = srv_choice.target or to_host, srv_choice.port or connect_port;
					log("debug", "Best record found, will connect to %s:%d", connect_host, connect_port);
				end
			else
				log("debug", to_host.." has no SRV records, falling back to A");
			end
			-- Try with SRV, or just the plain hostname if no SRV
			local ok, err = try_connect(host_session, connect_host, connect_port);
			if not ok then
				if not attempt_connection(host_session, err) then
					-- No more attempts will be made
					destroy_session(host_session);
				end
			end
		end, "_xmpp-server._tcp."..connect_host..".", "SRV");
		
		-- Set handler for DNS timeout
		add_task(dns_timeout, function ()
			if handle then
				adns.cancel(handle, true);
			end
		end);
		
		log("debug", "DNS lookup for %s sent, waiting for response before we can connect", to_host);
		return true; -- Attempt in progress
	elseif host_session.srv_hosts and #host_session.srv_hosts > host_session.srv_choice then -- Not our first attempt, and we also have SRV
		host_session.srv_choice = host_session.srv_choice + 1;
		local srv_choice = host_session.srv_hosts[host_session.srv_choice];
		connect_host, connect_port = srv_choice.target or to_host, srv_choice.port or connect_port;
		host_session.log("info", "Connection failed (%s). Attempt #%d: This time to %s:%d", tostring(err), host_session.srv_choice, connect_host, connect_port);
	else
		host_session.log("info", "Out of connection options, can't connect to %s", tostring(host_session.to_host));
		-- We're out of options
		return false;
	end
	
	if not (connect_host and connect_port) then
		-- Likely we couldn't resolve DNS
		log("warn", "Hmm, we're without a host (%s) and port (%s) to connect to for %s, giving up :(", tostring(connect_host), tostring(connect_port), tostring(to_host));
		return false;
	end
	
	return try_connect(host_session, connect_host, connect_port);
end
237
--- Resolve `connect_host` to an address and, once resolved, connect to it.
-- The A lookup is asynchronous; this function only starts it. When the
-- lookup fails, or when make_connect reports failure, the next option is
-- tried through attempt_connection, and the session is destroyed if none
-- is left.
-- @param host_session the outgoing session
-- @param connect_host hostname to resolve
-- @param connect_port port to connect to
-- @return true (the lookup has been started)
function try_connect(host_session, connect_host, connect_port)
	host_session.connecting = true;
	local handle;
	handle = adns.lookup(function (reply)
		handle = nil;
		host_session.connecting = nil;

		local failure;
		if reply and reply[1] and reply[1].a then
			log("debug", "DNS reply for %s gives us %s", connect_host, reply[1].a);
			local ok, connect_err = make_connect(host_session, reply[1].a, connect_port);
			if ok then
				return ok;
			end
			-- make_connect's failure must not be dropped here, otherwise the
			-- session would be left neither connecting nor destroyed.
			failure = connect_err or "connection failed";
		else
			log("debug", "DNS lookup failed to get a response for %s", connect_host);
			failure = "name resolution failed";
		end

		if not attempt_connection(host_session, failure) then -- Retry if we can
			log("debug", "No other records to try for %s - destroying", host_session.to_host);
			destroy_session(host_session); -- End of the line, we can't
		end
	end, connect_host, "A", "IN");

	-- Set handler for DNS timeout
	add_task(dns_timeout, function ()
		if handle then
			adns.cancel(handle, true);
		end
	end);

	return true;
end
265
--- Open a non-blocking TCP connection for an outgoing session and send the
-- opening stream header.
-- On success the wrapped connection is stored in host_session.conn, the
-- session is registered with the "xmppserver" listener, and
-- host_session.sends2s is replaced by a writer bound to the connection.
-- @param host_session the outgoing session
-- @param connect_host address to connect to
-- @param connect_port port to connect to
-- @return true on success; false and an error message on failure
function make_connect(host_session, connect_host, connect_port)
	host_session.log("info", "Beginning new connection attempt to %s (%s:%d)", host_session.to_host, connect_host, connect_port);
	-- Ok, we're going to try to connect
	
	local from_host, to_host = host_session.from_host, host_session.to_host;
	
	local conn, sock_err = socket.tcp();
	if not conn then
		-- socket.tcp() returns nil plus a message when no socket can be created
		log("warn", "s2s socket creation for %s failed: %s", tostring(to_host), tostring(sock_err));
		return false, sock_err;
	end
	
	conn:settimeout(0);
	local success, err = conn:connect(connect_host, connect_port);
	-- With a zero timeout, "timeout" just means the connect is still in progress
	if not success and err ~= "timeout" then
		log("warn", "s2s connect() to %s (%s:%d) failed: %s", host_session.to_host, connect_host, connect_port, err);
		conn:close(); -- don't leak the socket of a failed attempt
		return false, err;
	end
	
	local cl = connlisteners_get("xmppserver");
	conn = wrapclient(conn, connect_host, connect_port, cl, cl.default_mode or 1, hosts[from_host].ssl_ctx, false );
	host_session.conn = conn;
	
	-- Register this outgoing connection so that xmppserver_listener knows about it
	-- otherwise it will assume it is a new incoming connection
	cl.register_outgoing(conn, host_session);
	
	local w = conn.write;
	host_session.sends2s = function (t) log("debug", "sending: %s", tostring(t)); w(tostring(t)); end
	
	conn.write(format([[<stream:stream xmlns='jabber:server' xmlns:db='jabber:server:dialback' xmlns:stream='http://etherx.jabber.org/streams' from='%s' to='%s' version='1.0' xml:lang='en'>]], from_host, to_host));
	log("debug", "Connection attempt in progress...");
	return true;
end
296
--- Handle the opening <stream:stream> tag of an s2s session.
-- Incoming sessions record the (nameprepped) to/from hosts, get a fresh
-- stream id and are sent our stream header; the session is closed with
-- "host-unknown" when the target host is not in `hosts`.
-- Outgoing sessions take their stream id from the response, flush
-- session.send_buffer, and then either start dialback or, when
-- session.dialback_verifying is set, are marked connected straight away.
-- @param session the s2s session the stream was opened on
-- @param attr attributes of the received stream header
function streamopened(session, attr)
	local send = session.sends2s;
	
	-- TODO: #29: SASL/TLS on s2s streams
	session.version = 0; --tonumber(attr.version) or 0;
	
	local has_both_hosts = attr.to and attr.from;
	if session.version >= 1.0 and not has_both_hosts then
		log("warn", (session.to_host or "(unknown)").." failed to specify 'to' or 'from' hostname as per RFC");
	end
	
	if session.direction == "incoming" then
		session.to_host = attr.to and nameprep(attr.to);
		session.from_host = attr.from and nameprep(attr.from);
		session.streamid = uuid_gen();
		
		(session.log or log)("debug", "incoming s2s received <stream:stream>");
		
		-- Send a reply stream header
		send("<?xml version='1.0'?>");
		local header = stanza("stream:stream", {
			xmlns = 'jabber:server';
			["xmlns:db"] = 'jabber:server:dialback';
			["xmlns:stream"] = 'http://etherx.jabber.org/streams';
			id = session.streamid;
			from = session.to_host;
		});
		send(header:top_tag());
		
		if session.to_host and not hosts[session.to_host] then
			-- Attempting to connect to a host we don't serve
			session:close({ condition = "host-unknown"; text = "This host does not serve "..session.to_host });
			return;
		end
		
		if session.version >= 1.0 then
			local features = st.stanza("stream:features")
				:tag("dialback", { xmlns='urn:xmpp:features:dialback' }):tag("optional"):up():up();
			send(features);
		end
	elseif session.direction == "outgoing" then
		-- If we are just using the connection for verifying dialback keys, we won't try and auth it
		if not attr.id then
			error("stream response did not give us a streamid!!!");
		end
		session.streamid = attr.id;
		
		-- Flush the unauthed buffer (stanzas which are fine to send before
		-- dialback). This is *not* the stanza queue, which may only be
		-- sent once auth succeeds.
		local pending = session.send_buffer;
		if pending and #pending > 0 then
			log("debug", "Sending s2s send_buffer now...");
			for index, item in ipairs(pending) do
				session.sends2s(tostring(item));
				pending[index] = nil;
			end
		end
		session.send_buffer = nil;
		
		if session.dialback_verifying then
			mark_connected(session);
		else
			initiate_dialback(session);
		end
	end
	
	session.notopen = nil;
end
354
--- Handle the closing </stream:stream> tag of a session.
-- Answers with our own closing tag when the session can still send, then
-- flags the stream as not open.
-- @param session the s2s session whose stream was closed
function streamclosed(session)
	local logger = session.log or log;
	logger("debug", "</stream:stream>");

	local send = session.sends2s;
	if send then
		send("</stream:stream>");
	end

	session.notopen = true;
end
362
--- Start dialback on an outgoing session.
-- Generates the key for this stream, stores it in session.dialback_key and
-- sends it to the remote host in a <db:result/> element.
-- @param session the outgoing s2s session
function initiate_dialback(session)
	local key = generate_dialback(session.streamid, session.to_host, session.from_host);
	session.dialback_key = key;

	local result = format("<db:result from='%s' to='%s'>%s</db:result>", session.from_host, session.to_host, key);
	session.sends2s(result);

	session.log("info", "sent dialback key on outgoing s2s stream");
end
369
--- Compute the dialback key for a stream.
-- The key is the SHA-256 hash (second argument `true` passed to the hash
-- function) of the stream id, both hostnames and this module's
-- dialback secret, concatenated in that order.
-- @param id the stream id
-- @param to the receiving host
-- @param from the originating host
-- @return the dialback key
function generate_dialback(id, to, from)
	local material = id..to..from..dialback_secret;
	return sha256_hash(material, true);
end
373
--- Check a dialback key against the one we would generate ourselves.
-- @param id the stream id
-- @param to the receiving host
-- @param from the originating host
-- @param key the key to check
-- @return true if `key` equals the key generated for (id, to, from)
function verify_dialback(id, to, from, key)
	local expected = generate_dialback(id, to, from);
	return key == expected;
end
377
--- Promote a session to its authenticated state.
-- "s2sout_unauthed" becomes "s2sout" and "s2sin_unauthed" becomes "s2sin".
-- For incoming sessions, session.hosts[host].authed is set when `host` is
-- given; an already-authenticated "s2sin" session is only accepted together
-- with a `host`. Any other session type is rejected.
-- @param session the s2s session
-- @param host (optional) the remote host that was authenticated
-- @return true after marking the session connected, false if nothing applied
function make_authenticated(session, host)
	local current = session.type;

	if current == "s2sout_unauthed" then
		session.type = "s2sout";
	elseif current == "s2sin_unauthed" or (current == "s2sin" and host) then
		if current == "s2sin_unauthed" then
			session.type = "s2sin";
		end
		if host then
			session.hosts[host].authed = true;
		end
	else
		return false;
	end

	session.log("debug", "connection %s->%s is now authenticated", session.from_host or "(unknown)", session.to_host or "(unknown)");
	mark_connected(session);
	return true;
end
397
--- Finish setting up a session whose connection is complete.
-- Installs session.send, which forwards to send_to_host(to, from, data)
-- using the session's hosts as captured at this point. For outgoing sessions
-- the queued stanzas are then written out (the serialized form, index 1 of
-- each queue entry) and the queue and SRV host list are dropped.
-- @param session the s2s session that is now connected
function mark_connected(session)
	local queue, write = session.sendq, session.sends2s;
	local from, to = session.from_host, session.to_host;

	session.log("info", session.direction.." s2s connection "..from.."->"..to.." complete");

	local route = send_to_host;
	session.send = function (data)
		route(to, from, data);
	end

	if session.direction ~= "outgoing" then
		return;
	end

	if queue then
		session.log("debug", "sending "..#queue.." queued stanzas across new outgoing connection to "..session.to_host);
		for index, entry in ipairs(queue) do
			write(entry[1]);
			queue[index] = nil;
		end
		session.sendq = nil;
	end

	session.srv_hosts = nil;
end
422
--- Tear down an s2s session.
-- Outgoing sessions are removed from their host's s2sout table and have
-- their queued stanzas bounced; incoming sessions are removed from
-- incoming_s2s. Every field of the session table except `trace` is then
-- cleared.
-- @param session the s2s session to destroy
function destroy_session(session)
	local logger = session.log or log;
	logger("info", "Destroying "..tostring(session.direction).." session "..tostring(session.from_host).."->"..tostring(session.to_host));

	local direction = session.direction;
	if direction == "outgoing" then
		hosts[session.from_host].s2sout[session.to_host] = nil;
		bounce_sendq(session);
	elseif direction == "incoming" then
		incoming_s2s[session] = nil;
	end

	-- Wipe the table but keep `trace`
	for field in pairs(session) do
		if field ~= "trace" then
			session[field] = nil;
		end
	end
end
439
440 return _M;