gem5 [DEVELOP-FOR-25.0]
Loading...
Searching...
No Matches
tcp_iface.cc
Go to the documentation of this file.
1/*
2 * Copyright (c) 2015 ARM Limited
3 * All rights reserved
4 *
5 * The license below extends only to copyright in the software and shall
6 * not be construed as granting a license to any other intellectual
7 * property including but not limited to intellectual property relating
8 * to a hardware implementation of the functionality of the software
9 * licensed hereunder. You may use the software subject to the license
10 * terms below provided that you ensure that this notice is replicated
11 * unmodified and in its entirety in all distributions of the software,
12 * modified or unmodified, in source code or in binary form.
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions are
16 * met: redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer;
18 * redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution;
21 * neither the name of the copyright holders nor the names of its
22 * contributors may be used to endorse or promote products derived from
23 * this software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
28 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
29 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
30 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
31 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
32 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
33 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
34 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
35 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 */
37
38/* @file
39 * TCP stream socket based interface class implementation for dist-gem5 runs.
40 */
41
42#include "dev/net/tcp_iface.hh"
43
44#include <arpa/inet.h>
45#include <netdb.h>
46#include <netinet/tcp.h>
47#include <sys/socket.h>
48#include <sys/types.h>
49#include <unistd.h>
50
51#include <cerrno>
52#include <cstring>
53#include <vector>
54
55#include "base/compiler.hh"
56#include "base/trace.hh"
57#include "base/types.hh"
58#include "debug/DistEthernet.hh"
59#include "debug/DistEthernetCmd.hh"
60#include "sim/sim_exit.hh"
61
62#if defined(__FreeBSD__)
63#include <netinet/in.h>
64
65#endif
66
67// MSG_NOSIGNAL does not exists on OS X
68#if defined(__APPLE__) || defined(__MACH__)
69#ifndef MSG_NOSIGNAL
70#define MSG_NOSIGNAL SO_NOSIGPIPE
71#endif
72#endif
73
74namespace gem5
75{
76
77std::vector<std::pair<TCPIface::NodeInfo, int> > TCPIface::nodes;
78std::vector<int> TCPIface::sockRegistry;
79int TCPIface::fdStatic = -1;
80bool TCPIface::anyListening = false;
81
82TCPIface::TCPIface(std::string server_name, unsigned server_port,
83 unsigned dist_rank, unsigned dist_size,
84 Tick sync_start, Tick sync_repeat,
85 EventManager *em, bool use_pseudo_op, bool is_switch,
86 int num_nodes) :
87 DistIface(dist_rank, dist_size, sync_start, sync_repeat, em, use_pseudo_op,
88 is_switch, num_nodes), serverName(server_name),
89 serverPort(server_port), isSwitch(is_switch), listening(false)
90{
91 if (is_switch && isPrimary) {
92 while (!listen(serverPort)) {
93 DPRINTF(DistEthernet, "TCPIface(listen): Can't bind port %d\n",
95 serverPort++;
96 }
97 inform("tcp_iface listening on port %d", serverPort);
98 // Now accept the first connection requests from each compute node and
99 // store the node info. The compute nodes will then wait for ack
100 // messages. Ack messages will be sent by initTransport() in the
101 // appropriate order to make sure that every compute node is always
102 // connected to the same switch port.
103 NodeInfo ni;
104 for (int i = 0; i < size; i++) {
105 accept();
106 DPRINTF(DistEthernet, "First connection, waiting for link info\n");
107 if (!recvTCP(sock, &ni, sizeof(ni)))
108 panic("Failed to receive link info");
109 nodes.push_back(std::make_pair(ni, sock));
110 }
111 }
112}
113
114bool
116{
117 if (listening)
118 panic("Socket already listening!");
119
120 struct sockaddr_in sockaddr;
121 int ret;
122
123 fdStatic = socket(PF_INET, SOCK_STREAM, IPPROTO_TCP);
124 panic_if(fdStatic < 0, "socket() failed: %s", strerror(errno));
125
126 sockaddr.sin_family = PF_INET;
127 sockaddr.sin_addr.s_addr = INADDR_ANY;
128 sockaddr.sin_port = htons(port);
129 // finally clear sin_zero
130 memset(&sockaddr.sin_zero, 0, sizeof(sockaddr.sin_zero));
131 ret = ::bind(fdStatic, (struct sockaddr *)&sockaddr, sizeof (sockaddr));
132
133 if (ret != 0) {
134 if (ret == -1 && errno != EADDRINUSE)
135 panic("ListenSocket(listen): bind() failed!");
136 return false;
137 }
138
139 if (::listen(fdStatic, 24) == -1) {
140 if (errno != EADDRINUSE)
141 panic("ListenSocket(listen): listen() failed!");
142
143 return false;
144 }
145
146 listening = true;
147 anyListening = true;
148 return true;
149}
150
151void
153{
154 static unsigned cur_rank = 0;
155 static unsigned cur_id = 0;
156 NodeInfo ni;
157
158 if (isSwitch) {
159 if (cur_id == 0) { // first connection accepted in the ctor already
160 auto const &iface0 =
161 std::find_if(nodes.begin(), nodes.end(),
162 [](const std::pair<NodeInfo, int> &cn) -> bool {
163 return cn.first.rank == cur_rank;
164 });
165 assert(iface0 != nodes.end());
166 assert(iface0->first.distIfaceId == 0);
167 sock = iface0->second;
168 ni = iface0->first;
169 } else { // additional connections from the same compute node
170 accept();
171 DPRINTF(DistEthernet, "Next connection, waiting for link info\n");
172 if (!recvTCP(sock, &ni, sizeof(ni)))
173 panic("Failed to receive link info");
174 assert(ni.rank == cur_rank);
175 assert(ni.distIfaceId == cur_id);
176 }
177 inform("Link okay (iface:%d -> (node:%d, iface:%d))",
178 distIfaceId, ni.rank, ni.distIfaceId);
179 if (ni.distIfaceId < ni.distIfaceNum - 1) {
180 cur_id++;
181 } else {
182 cur_rank++;
183 cur_id = 0;
184 }
185 // send ack
186 ni.distIfaceId = distIfaceId;
187 ni.distIfaceNum = distIfaceNum;
188 sendTCP(sock, &ni, sizeof(ni));
189 } else { // this is not a switch
190 connect();
191 // send link info
192 ni.rank = rank;
193 ni.distIfaceId = distIfaceId;
194 ni.distIfaceNum = distIfaceNum;
195 sendTCP(sock, &ni, sizeof(ni));
196 DPRINTF(DistEthernet, "Connected, waiting for ack (distIfaceId:%d\n",
198 if (!recvTCP(sock, &ni, sizeof(ni)))
199 panic("Failed to receive ack");
200 assert(ni.rank == rank);
201 inform("Link okay (iface:%d -> switch iface:%d)", distIfaceId,
202 ni.distIfaceId);
203 }
204 sockRegistry.push_back(sock);
205}
206
207void
209{
210 struct sockaddr_in sockaddr;
211 socklen_t slen = sizeof (sockaddr);
212 sock = ::accept(fdStatic, (struct sockaddr *)&sockaddr, &slen);
213 if (sock != -1) {
214 int i = 1;
215 if (setsockopt(sock, IPPROTO_TCP, TCP_NODELAY, (char *)&i,
216 sizeof(i)) < 0)
217 warn("ListenSocket(accept): setsockopt() TCP_NODELAY failed!");
218 }
219}
220
221void
223{
224 struct addrinfo addr_hint, *addr_results;
225 int ret;
226
227 std::string port_str = std::to_string(serverPort);
228
229 sock = socket(PF_INET, SOCK_STREAM, IPPROTO_TCP);
230 panic_if(sock < 0, "socket() failed: %s", strerror(errno));
231
232 int fl = 1;
233 if (setsockopt(sock, IPPROTO_TCP, TCP_NODELAY, (char *)&fl, sizeof(fl)) < 0)
234 warn("ConnectSocket(connect): setsockopt() TCP_NODELAY failed!");
235
236 bzero(&addr_hint, sizeof(addr_hint));
237 addr_hint.ai_family = AF_INET;
238 addr_hint.ai_socktype = SOCK_STREAM;
239 addr_hint.ai_protocol = IPPROTO_TCP;
240
241 ret = getaddrinfo(serverName.c_str(), port_str.c_str(),
242 &addr_hint, &addr_results);
243 panic_if(ret < 0, "getaddrinf() failed: %s", strerror(errno));
244
245 DPRINTF(DistEthernet, "Connecting to %s:%s\n",
246 serverName.c_str(), port_str.c_str());
247
248 ret = ::connect(sock, (struct sockaddr *)(addr_results->ai_addr),
249 addr_results->ai_addrlen);
250 panic_if(ret < 0, "connect() failed: %s", strerror(errno));
251
252 freeaddrinfo(addr_results);
253}
254
256{
257 [[maybe_unused]] int ret;
258
259 ret = close(sock);
260 assert(ret == 0);
261}
262
263void
264TCPIface::sendTCP(int sock, const void *buf, unsigned length)
265{
266 ssize_t ret;
267
268 ret = ::send(sock, buf, length, MSG_NOSIGNAL);
269 if (ret < 0) {
270 if (errno == ECONNRESET || errno == EPIPE) {
271 exitSimLoop("Message server closed connection, simulation "
272 "is exiting");
273 } else {
274 panic("send() failed: %s", strerror(errno));
275 }
276 }
277 panic_if(ret != length, "send() failed");
278}
279
280bool
281TCPIface::recvTCP(int sock, void *buf, unsigned length)
282{
283 ssize_t ret;
284
285 ret = ::recv(sock, buf, length, MSG_WAITALL );
286 if (ret < 0) {
287 if (errno == ECONNRESET || errno == EPIPE)
288 inform("recv(): %s", strerror(errno));
289 else if (ret < 0)
290 panic("recv() failed: %s", strerror(errno));
291 } else if (ret == 0) {
292 inform("recv(): Connection closed");
293 } else if (ret != length)
294 panic("recv() failed");
295
296 return (ret == length);
297}
298
299void
301{
302 sendTCP(sock, &header, sizeof(header));
303 sendTCP(sock, packet->data, packet->length);
304}
305
306void
308{
309 DPRINTF(DistEthernetCmd, "TCPIface::sendCmd() type: %d\n",
310 static_cast<int>(header.msgType));
311 // Global commands (i.e. sync request) are always sent by the primary
312 // DistIface. The transfer method is simply implemented as point-to-point
313 // messages for now
314 for (auto s: sockRegistry)
315 sendTCP(s, (void*)&header, sizeof(header));
316}
317
318bool
320{
321 bool ret = recvTCP(sock, &header, sizeof(header));
322 DPRINTF(DistEthernetCmd, "TCPIface::recvHeader() type: %d ret: %d\n",
323 static_cast<int>(header.msgType), ret);
324 return ret;
325}
326
327void
329{
330 packet = std::make_shared<EthPacketData>(header.dataPacketLength);
331 bool ret = recvTCP(sock, packet->data, header.dataPacketLength);
332 panic_if(!ret, "Error while reading socket");
333 packet->simLength = header.simLength;
334 packet->length = header.dataPacketLength;
335}
336
337void
339{
340 // We cannot setup the conections in the constructor because the number
341 // of dist interfaces (per process) is unknown until the (simobject) init
342 // phase. That information is necessary for global connection ordering.
344}
345
346} // namespace gem5
#define DPRINTF(x,...)
Definition trace.hh:209
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,...
unsigned rank
The rank of this process among the gem5 peers.
unsigned distIfaceId
Unique id for the dist link.
static unsigned distIfaceNum
Number of DistIface objects (i.e.
DistHeaderPkt::Header Header
DistIface(unsigned dist_rank, unsigned dist_size, Tick sync_start, Tick sync_repeat, EventManager *em, bool use_pseudo_op, bool is_switch, int num_nodes)
ctor
unsigned size
The number of gem5 processes comprising this dist simulation.
bool listen(int port)
Definition tcp_iface.cc:115
bool recvHeader(Header &header) override
Receive a header (i.e.
Definition tcp_iface.cc:319
static int fdStatic
Definition tcp_iface.hh:77
void initTransport() override
Init hook for the underlaying transport.
Definition tcp_iface.cc:338
std::string serverName
Definition tcp_iface.hh:70
static bool anyListening
Definition tcp_iface.hh:76
static std::vector< int > sockRegistry
Storage for all opened sockets.
Definition tcp_iface.hh:93
static std::vector< std::pair< NodeInfo, int > > nodes
Definition tcp_iface.hh:89
void sendPacket(const Header &header, const EthPacketPtr &packet) override
Send out a data packet to the remote end.
Definition tcp_iface.cc:300
bool recvTCP(int sock, void *buf, unsigned length)
Receive the next incoming message through a TCP stream socket.
Definition tcp_iface.cc:281
void recvPacket(const Header &header, EthPacketPtr &packet) override
Receive a packet from the remote end.
Definition tcp_iface.cc:328
TCPIface(std::string server_name, unsigned server_port, unsigned dist_rank, unsigned dist_size, Tick sync_start, Tick sync_repeat, EventManager *em, bool use_pseudo_op, bool is_switch, int num_nodes)
The ctor creates and connects the stream socket to the server.
Definition tcp_iface.cc:82
int sock
The stream socket to connect to the server.
Definition tcp_iface.hh:68
void establishConnection()
Definition tcp_iface.cc:152
void sendCmd(const Header &header) override
Send out a control command to the remote end.
Definition tcp_iface.cc:307
~TCPIface() override
Definition tcp_iface.cc:255
void sendTCP(int sock, const void *buf, unsigned length)
Send out a message through a TCP stream socket.
Definition tcp_iface.cc:264
STL pair class.
Definition stl.hh:58
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:220
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition logging.hh:246
#define warn(...)
Definition logging.hh:288
#define inform(...)
Definition logging.hh:289
Bitfield< 4 > s
Bitfield< 7 > i
Definition misc_types.hh:67
Bitfield< 3 > ni
Definition misc.hh:104
Bitfield< 2 > em
Definition misc.hh:617
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36
void exitSimLoop(const std::string &message, int exit_code, Tick when, Tick repeat, bool serialize)
The "old style" exitSimLoop functions.
uint64_t Tick
Tick count type.
Definition types.hh:58
std::shared_ptr< EthPacketData > EthPacketPtr
Definition etherpkt.hh:90
output header
Definition nop.cc:36
Compute node info and storage for the very first connection from each node (used by the switch)
Definition tcp_iface.hh:84

Generated on Mon May 26 2025 09:19:10 for gem5 by doxygen 1.13.2