Merge branch 'fixes' of git://git.kernel.org/pub/scm/linux/kernel/git/jesse/openvswitch
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / net / tipc / net.c
CommitLineData
b97bf3fd
PL
1/*
2 * net/tipc/net.c: TIPC network routing code
c4307285 3 *
593a5f22 4 * Copyright (c) 1995-2006, Ericsson AB
9df3b7eb 5 * Copyright (c) 2005, 2010-2011, Wind River Systems
b97bf3fd
PL
6 * All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions are met:
10 *
9ea1fd3c
PL
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. Neither the names of the copyright holders nor the names of its
17 * contributors may be used to endorse or promote products derived from
18 * this software without specific prior written permission.
19 *
20 * Alternatively, this software may be distributed under the terms of the
21 * GNU General Public License ("GPL") version 2 as published by the Free
22 * Software Foundation.
b97bf3fd
PL
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
25 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
28 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
29 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
30 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
31 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
32 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
33 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
34 * POSSIBILITY OF SUCH DAMAGE.
35 */
36
37#include "core.h"
b97bf3fd 38#include "net.h"
b97bf3fd
PL
39#include "name_distr.h"
40#include "subscr.h"
b97bf3fd 41#include "port.h"
672d99e1 42#include "node.h"
b97bf3fd
PL
43#include "config.h"
44
c4307285 45/*
b97bf3fd
PL
46 * The TIPC locking policy is designed to ensure a very fine locking
47 * granularity, permitting complete parallel access to individual
c4307285 48 * port and node/link instances. The code consists of three major
b97bf3fd
PL
49 * locking domains, each protected with their own disjunct set of locks.
50 *
51 * 1: The routing hierarchy.
c4307285
YH
52 * Comprises the structures 'zone', 'cluster', 'node', 'link'
53 * and 'bearer'. The whole hierarchy is protected by a big
54 * read/write lock, tipc_net_lock, to ensure that nothing is added
55 * or removed while code is accessing any of these structures.
56 * This layer must not be called from the two others while they
b97bf3fd
PL
57 * hold any of their own locks.
58 * Neither must it itself do any upcalls to the other two before
4323add6 59 * it has released tipc_net_lock and other protective locks.
b97bf3fd 60 *
c4307285 61 * Within the tipc_net_lock domain there are two sub-domains: 'node' and
b97bf3fd
PL
62 * 'bearer', where local write operations are permitted,
63 * provided that those are protected by individual spin_locks
c4307285 64 * per instance. Code holding tipc_net_lock(read) and a node spin_lock
b97bf3fd 65 * is permitted to poke around in both the node itself and its
c4307285
YH
66 * subordinate links. I.e., it can update link counters and queues,
67 * change link state, send protocol messages, and alter the
68 * "active_links" array in the node; but it can _not_ remove a link
b97bf3fd 69 * or a node from the overall structure.
c4307285
YH
70 * Correspondingly, individual bearers may change status within a
71 * tipc_net_lock(read), protected by an individual spin_lock per bearer
4323add6 72 * instance, but it needs tipc_net_lock(write) to remove/add any bearers.
b97bf3fd 73 *
c4307285
YH
74 *
75 * 2: The transport level of the protocol.
76 * This consists of the structures port, (and its user level
77 * representations, such as user_port and tipc_sock), reference and
78 * tipc_user (port.c, reg.c, socket.c).
b97bf3fd
PL
79 *
80 * This layer has four different locks:
81 * - The tipc_port spin_lock. This is protecting each port instance
c4307285
YH
82 * from parallel data access and removal. Since we can not place
83 * this lock in the port itself, it has been placed in the
b97bf3fd 84 * corresponding reference table entry, which has the same life
c4307285
YH
85 * cycle as the module. This entry is difficult to access from
86 * outside the TIPC core, however, so a pointer to the lock has
87 * been added in the port instance, -to be used for unlocking
b97bf3fd 88 * only.
c4307285
YH
89 * - A read/write lock to protect the reference table itself (ref.c).
90 * (Nobody is using read-only access to this, so it can just as
b97bf3fd
PL
91 * well be changed to a spin_lock)
92 * - A spin lock to protect the registry of kernel/driver users (reg.c)
c4307285 93 * - A global spin_lock (tipc_port_lock), whose only task is to ensure
b97bf3fd
PL
94 * consistency where more than one port is involved in an operation,
95 * i.e., when a port is part of a linked list of ports.
96 * There are two such lists; 'port_list', which is used for management,
97 * and 'wait_list', which is used to queue ports during congestion.
c4307285 98 *
b97bf3fd 99 * 3: The name table (name_table.c, name_distr.c, subscription.c)
c4307285
YH
100 * - There is one big read/write-lock (tipc_nametbl_lock) protecting the
101 * overall name table structure. Nothing must be added/removed to
b97bf3fd
PL
102 * this structure without holding write access to it.
103 * - There is one local spin_lock per sub_sequence, which can be seen
4323add6 104 * as a sub-domain to the tipc_nametbl_lock domain. It is used only
b97bf3fd
PL
105 * for translation operations, and is needed because a translation
106 * steps the root of the 'publication' linked list between each lookup.
4323add6 107 * This is always used within the scope of a tipc_nametbl_lock(read).
b97bf3fd
PL
108 * - A local spin_lock protecting the queue of subscriber events.
109*/
110
/* Read/write lock guarding the routing hierarchy (see locking policy above) */
34af946a 111DEFINE_RWLOCK(tipc_net_lock);
b97bf3fd
PL
112
113static void net_route_named_msg(struct sk_buff *buf)
114{
115 struct tipc_msg *msg = buf_msg(buf);
116 u32 dnode;
117 u32 dport;
118
119 if (!msg_named(msg)) {
5f6d9123 120 kfree_skb(buf);
b97bf3fd
PL
121 return;
122 }
123
124 dnode = addr_domain(msg_lookup_scope(msg));
4323add6 125 dport = tipc_nametbl_translate(msg_nametype(msg), msg_nameinst(msg), &dnode);
b97bf3fd
PL
126 if (dport) {
127 msg_set_destnode(msg, dnode);
128 msg_set_destport(msg, dport);
4323add6 129 tipc_net_route_msg(buf);
b97bf3fd
PL
130 return;
131 }
b97bf3fd
PL
132 tipc_reject_msg(buf, TIPC_ERR_NO_NAME);
133}
134
4323add6 135void tipc_net_route_msg(struct sk_buff *buf)
b97bf3fd
PL
136{
137 struct tipc_msg *msg;
138 u32 dnode;
139
140 if (!buf)
141 return;
142 msg = buf_msg(buf);
143
b97bf3fd
PL
144 /* Handle message for this node */
145 dnode = msg_short(msg) ? tipc_own_addr : msg_destnode(msg);
c68ca7b7 146 if (tipc_in_scope(dnode, tipc_own_addr)) {
b97bf3fd 147 if (msg_isdata(msg)) {
c4307285 148 if (msg_mcast(msg))
4323add6 149 tipc_port_recv_mcast(buf, NULL);
b97bf3fd 150 else if (msg_destport(msg))
4323add6 151 tipc_port_recv_msg(buf);
b97bf3fd
PL
152 else
153 net_route_named_msg(buf);
154 return;
155 }
156 switch (msg_user(msg)) {
b97bf3fd 157 case NAME_DISTRIBUTOR:
4323add6 158 tipc_named_recv(buf);
b97bf3fd
PL
159 break;
160 case CONN_MANAGER:
4323add6 161 tipc_port_recv_proto_msg(buf);
b97bf3fd
PL
162 break;
163 default:
5f6d9123 164 kfree_skb(buf);
b97bf3fd
PL
165 }
166 return;
167 }
168
169 /* Handle message for another node */
b2abd4c0 170 skb_trim(buf, msg_size(msg));
4323add6 171 tipc_link_send(buf, dnode, msg_link_selector(msg));
b97bf3fd
PL
172}
173
379c0456 174void tipc_net_start(u32 addr)
b97bf3fd
PL
175{
176 char addr_string[16];
b97bf3fd 177
974a5a86 178 write_lock_bh(&tipc_net_lock);
03194379 179 tipc_own_addr = addr;
4323add6
PL
180 tipc_named_reinit();
181 tipc_port_reinit();
c47e9b91 182 tipc_bclink_init();
974a5a86 183 write_unlock_bh(&tipc_net_lock);
03194379 184
a2cfd45b 185 tipc_cfg_reinit();
03194379 186
2cf8aa19
EH
187 pr_info("Started in network mode\n");
188 pr_info("Own node address %s, network identity %u\n",
189 tipc_addr_string_fill(addr_string, tipc_own_addr), tipc_net_id);
b97bf3fd
PL
190}
191
4323add6 192void tipc_net_stop(void)
b97bf3fd 193{
34e46258
AS
194 struct tipc_node *node, *t_node;
195
b58343f9 196 if (!tipc_own_addr)
b97bf3fd 197 return;
c4307285 198 write_lock_bh(&tipc_net_lock);
97f1b625 199 tipc_bearer_stop();
4323add6 200 tipc_bclink_stop();
1fa07380 201 list_for_each_entry_safe(node, t_node, &tipc_node_list, list)
34e46258 202 tipc_node_delete(node);
c4307285 203 write_unlock_bh(&tipc_net_lock);
2cf8aa19 204 pr_info("Left network mode\n");
b97bf3fd 205}