diff --git a/CMakeLists.txt b/CMakeLists.txt index 186e5b670..674c1c158 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -30,7 +30,6 @@ set(PlatformLib platform) include_directories(${CMAKE_SOURCE_DIR}/include) include_directories(${CMAKE_SOURCE_DIR}/include/core) include_directories(${CMAKE_SOURCE_DIR}/include/core/federated) -include_directories(${CMAKE_SOURCE_DIR}/include/core/federated/network) include_directories(${CMAKE_SOURCE_DIR}/include/core/modal_models) include_directories(${CMAKE_SOURCE_DIR}/include/core/platform) include_directories(${CMAKE_SOURCE_DIR}/include/core/threaded) diff --git a/core/CMakeLists.txt b/core/CMakeLists.txt index 6d938ae0c..2d572b4d5 100644 --- a/core/CMakeLists.txt +++ b/core/CMakeLists.txt @@ -18,7 +18,6 @@ list(APPEND REACTORC_SOURCES ${GENERAL_SOURCES}) # Add sources for either threaded or single-threaded runtime if(DEFINED FEDERATED) include(federated/CMakeLists.txt) - include(federated/network/CMakeLists.txt) endif() # Add sources for either threaded or single-threaded runtime @@ -96,10 +95,19 @@ include(${LF_ROOT}/platform/impl/CMakeLists.txt) target_link_libraries(reactor-c PUBLIC lf::platform-api) target_link_libraries(reactor-c PRIVATE lf::platform-impl) +if(DEFINED FEDERATED) + if(NOT DEFINED COMM_TYPE) + set(COMM_TYPE TCP) + endif() + include(${LF_ROOT}/network/api/CMakeLists.txt) + include(${LF_ROOT}/network/impl/CMakeLists.txt) + target_link_libraries(reactor-c PUBLIC lf::network-api) + target_link_libraries(reactor-c PRIVATE lf::network-impl) +endif() + target_include_directories(reactor-c PUBLIC ../include) target_include_directories(reactor-c PUBLIC ../include/core) target_include_directories(reactor-c PUBLIC ../include/core/federated) -target_include_directories(reactor-c PUBLIC ../include/core/federated/network) target_include_directories(reactor-c PUBLIC ../include/core/platform) target_include_directories(reactor-c PUBLIC ../include/core/modal_models) target_include_directories(reactor-c PUBLIC ../include/core/threaded) diff --git a/core/federated/RTI/CMakeLists.txt b/core/federated/RTI/CMakeLists.txt index d9a93c246..8c12ffd6e 100644 --- a/core/federated/RTI/CMakeLists.txt +++ b/core/federated/RTI/CMakeLists.txt @@ -16,8 +16,6 @@ add_library(${RTI_LIB} STATIC ${CoreLib}/utils/util.c ${CoreLib}/tag.c ${CoreLib}/clock.c - ${CoreLib}/federated/network/net_util.c - ${CoreLib}/federated/network/socket_common.c ${CoreLib}/utils/pqueue_base.c ${CoreLib}/utils/pqueue_tag.c ${CoreLib}/utils/pqueue.c @@ -29,7 +27,6 @@ add_executable(${RTI_MAIN} main.c) target_include_directories(${RTI_LIB} PUBLIC ../../../include) target_include_directories(${RTI_LIB} PUBLIC ${IncludeDir}) target_include_directories(${RTI_LIB} PUBLIC ${IncludeDir}/federated) -target_include_directories(${RTI_LIB} PUBLIC ${IncludeDir}/federated/network) target_include_directories(${RTI_LIB} PUBLIC ${IncludeDir}/modal_models) target_include_directories(${RTI_LIB} PUBLIC ${IncludeDir}/utils) @@ -37,6 +34,10 @@ if (NOT DEFINED LOG_LEVEL) set(LOG_LEVEL 0) ENDIF(NOT DEFINED LOG_LEVEL) +if(NOT DEFINED COMM_TYPE) + set(COMM_TYPE TCP) +endif() + IF(CMAKE_BUILD_TYPE MATCHES DEBUG) # Set the LOG_LEVEL to 4 to get DEBUG messages message("-- Building RTI with DEBUG messages enabled") @@ -71,6 +72,12 @@ target_link_libraries(${RTI_LIB} PUBLIC lf::low-level-platform-impl) include(${LF_ROOT}/low_level_platform/api/CMakeLists.txt) target_link_libraries(${RTI_LIB} PUBLIC lf::low-level-platform-api) +include(${LF_ROOT}/network/impl/CMakeLists.txt) +target_link_libraries(${RTI_LIB} PUBLIC lf::network-impl) + +include(${LF_ROOT}/network/api/CMakeLists.txt) +target_link_libraries(${RTI_LIB} PUBLIC lf::network-api) + # Set the STANDALONE_RTI flag to include the rti_remote and rti_common. target_compile_definitions(${RTI_LIB} PUBLIC STANDALONE_RTI=1) @@ -78,6 +85,9 @@ target_compile_definitions(${RTI_LIB} PUBLIC STANDALONE_RTI=1) target_compile_definitions(${RTI_LIB} PUBLIC FEDERATED=1) target_compile_definitions(${RTI_LIB} PUBLIC PLATFORM_${CMAKE_SYSTEM_NAME}) +# Set communication type. +target_compile_definitions(${RTI_LIB} PUBLIC COMM_TYPE_${COMM_TYPE}) + # Set RTI Tracing target_compile_definitions(${RTI_LIB} PUBLIC RTI_TRACE) diff --git a/core/federated/RTI/main.c b/core/federated/RTI/main.c index c08890ac7..8c2869dc4 100644 --- a/core/federated/RTI/main.c +++ b/core/federated/RTI/main.c @@ -80,11 +80,11 @@ static void send_failed_signal(federate_info_t* fed) { if (rti.base.tracing_enabled) { tracepoint_rti_to_federate(send_FAILED, fed->enclave.id, NULL); } - int failed = write_to_socket(fed->socket, bytes_to_write, &(buffer[0])); + int failed = write_to_netchan(fed->fed_netchan, bytes_to_write, &(buffer[0])); if (failed == 0) { LF_PRINT_LOG("RTI has sent failed signal to federate %d due to abnormal termination.", fed->enclave.id); } else { - lf_print_error("RTI failed to send failed signal to federate %d on socket ID %d.", fed->enclave.id, fed->socket); + lf_print_error("RTI failed to send failed signal to federate %d.", fed->enclave.id); } } @@ -234,6 +234,7 @@ int process_args(int argc, const char* argv[]) { rti.base.number_of_scheduling_nodes = (int32_t)num_federates; // FIXME: Loses numbers on 64-bit machines lf_print("RTI: Number of federates: %d", rti.base.number_of_scheduling_nodes); } else if (strcmp(argv[i], "-p") == 0 || strcmp(argv[i], "--port") == 0) { +#ifdef COMM_TYPE_TCP if (argc < i + 2) { lf_print_error("--port needs a short unsigned integer argument ( > 0 and < %d).", UINT16_MAX); usage(argc, argv); @@ -247,6 +248,9 @@ int process_args(int argc, const char* argv[]) { return 0; } rti.user_specified_port = (uint16_t)RTI_port; +#else + lf_print_error("--port is only available for TCP."); +#endif } else if (strcmp(argv[i], "-c") == 0 || strcmp(argv[i], "--clock_sync") == 0) { if (argc < i + 2) { lf_print_error("--clock-sync needs off|init|on."); @@ -327,9 +331,8 @@ int main(int argc, const char* argv[]) { rti.base.scheduling_nodes[i] = (scheduling_node_t*)fed_info; } - int socket_descriptor = start_rti_server(rti.user_specified_port); - if (socket_descriptor >= 0) { - wait_for_federates(socket_descriptor); + if (!start_rti_server()) { + wait_for_federates(); normal_termination = true; if (rti.base.tracing_enabled) { // No need for a mutex lock because all threads have exited. diff --git a/core/federated/RTI/rti_remote.c b/core/federated/RTI/rti_remote.c index b5ca4fe1c..bcb57dbb8 100644 --- a/core/federated/RTI/rti_remote.c +++ b/core/federated/RTI/rti_remote.c @@ -73,9 +73,9 @@ void notify_tag_advance_grant(scheduling_node_t* e, tag_t tag) { tracepoint_rti_to_federate(send_TAG, e->id, &tag); } // This function is called in notify_advance_grant_if_safe(), which is a long - // function. During this call, the socket might close, causing the following write_to_socket + // function. During this call, the network channel might close, causing the following write_to_netchan // to fail. Consider a failure here a soft failure and update the federate's status. - if (write_to_socket(((federate_info_t*)e)->socket, message_length, buffer)) { + if (write_to_netchan(((federate_info_t*)e)->fed_netchan, message_length, buffer)) { lf_print_error("RTI failed to send tag advance grant to federate %d.", e->id); e->state = NOT_CONNECTED; } else { @@ -106,9 +106,9 @@ void notify_provisional_tag_advance_grant(scheduling_node_t* e, tag_t tag) { tracepoint_rti_to_federate(send_PTAG, e->id, &tag); } // This function is called in notify_advance_grant_if_safe(), which is a long - // function. During this call, the socket might close, causing the following write_to_socket + // function. During this call, the network channel might close, causing the following write_to_netchan // to fail. Consider a failure here a soft failure and update the federate's status. - if (write_to_socket(((federate_info_t*)e)->socket, message_length, buffer)) { + if (write_to_netchan(((federate_info_t*)e)->fed_netchan, message_length, buffer)) { lf_print_error("RTI failed to send tag advance grant to federate %d.", e->id); e->state = NOT_CONNECTED; } else { @@ -165,7 +165,7 @@ void notify_downstream_next_event_tag(scheduling_node_t* e, tag_t tag) { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_DNET, e->id, &tag); } - if (write_to_socket(((federate_info_t*)e)->socket, message_length, buffer)) { + if (write_to_netchan(((federate_info_t*)e)->fed_netchan, message_length, buffer)) { lf_print_error("RTI failed to send downstream next event tag to federate %d.", e->id); e->state = NOT_CONNECTED; } else { @@ -187,7 +187,7 @@ void update_federate_next_event_tag_locked(uint16_t federate_id, tag_t next_even void handle_port_absent_message(federate_info_t* sending_federate, unsigned char* buffer) { size_t message_size = sizeof(uint16_t) + sizeof(uint16_t) + sizeof(int64_t) + sizeof(uint32_t); - read_from_socket_fail_on_error(&sending_federate->socket, message_size, &(buffer[1]), NULL, + read_from_netchan_fail_on_error(sending_federate->fed_netchan, message_size, &(buffer[1]), NULL, " RTI failed to read port absent message from federate %u.", sending_federate->enclave.id); @@ -200,7 +200,7 @@ void handle_port_absent_message(federate_info_t* sending_federate, unsigned char } // Need to acquire the mutex lock to ensure that the thread handling - // messages coming from the socket connected to the destination does not + // messages coming from the network channel connected to the destination does not // issue a TAG before this message has been forwarded. LF_MUTEX_LOCK(&rti_mutex); @@ -236,7 +236,7 @@ void handle_port_absent_message(federate_info_t* sending_federate, unsigned char } // Forward the message. - write_to_socket_fail_on_error(&fed->socket, message_size + 1, buffer, &rti_mutex, + write_to_netchan_fail_on_error(fed->fed_netchan, message_size + 1, buffer, &rti_mutex, "RTI failed to forward message to federate %d.", federate_id); LF_MUTEX_UNLOCK(&rti_mutex); @@ -245,7 +245,7 @@ void handle_port_absent_message(federate_info_t* sending_federate, unsigned char void handle_timed_message(federate_info_t* sending_federate, unsigned char* buffer) { size_t header_size = 1 + sizeof(uint16_t) + sizeof(uint16_t) + sizeof(uint32_t) + sizeof(int64_t) + sizeof(uint32_t); // Read the header, minus the first byte which has already been read. - read_from_socket_fail_on_error(&sending_federate->socket, header_size - 1, &(buffer[1]), NULL, + read_from_netchan_fail_on_error(sending_federate->fed_netchan, header_size - 1, &(buffer[1]), NULL, "RTI failed to read the timed message header from remote federate."); // Extract the header information. of the sender uint16_t reactor_port_id; @@ -274,7 +274,7 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff sending_federate->enclave.id, federate_id, reactor_port_id, intended_tag.time - lf_time_start(), intended_tag.microstep); - read_from_socket_fail_on_error(&sending_federate->socket, bytes_to_read, &(buffer[header_size]), NULL, + read_from_netchan_fail_on_error(sending_federate->fed_netchan, bytes_to_read, &(buffer[header_size]), NULL, "RTI failed to read timed message from federate %d.", federate_id); size_t bytes_read = bytes_to_read + header_size; // Following only works for string messages. @@ -285,12 +285,12 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff } // Need to acquire the mutex lock to ensure that the thread handling - // messages coming from the socket connected to the destination does not + // messages coming from the network channel connected to the destination does not // issue a TAG before this message has been forwarded. LF_MUTEX_LOCK(&rti_mutex); // If the destination federate is no longer connected, issue a warning, - // remove the message from the socket and return. + // remove the message from the network channel and return. federate_info_t* fed = GET_FED_INFO(federate_id); if (fed->enclave.state == NOT_CONNECTED) { lf_print_warning("RTI: Destination federate %d is no longer connected. Dropping message.", federate_id); @@ -310,7 +310,7 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff if (bytes_to_read > FED_COM_BUFFER_SIZE) { bytes_to_read = FED_COM_BUFFER_SIZE; } - read_from_socket_fail_on_error(&sending_federate->socket, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(sending_federate->fed_netchan, bytes_to_read, buffer, NULL, "RTI failed to clear message chunks."); total_bytes_read += bytes_to_read; } @@ -332,7 +332,7 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff tracepoint_rti_to_federate(send_TAGGED_MSG, federate_id, &intended_tag); } - write_to_socket_fail_on_error(&fed->socket, bytes_read, buffer, &rti_mutex, + write_to_netchan_fail_on_error(fed->fed_netchan, bytes_read, buffer, &rti_mutex, "RTI failed to forward message to federate %d.", federate_id); // The message length may be longer than the buffer, @@ -344,15 +344,15 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff if (bytes_to_read > FED_COM_BUFFER_SIZE) { bytes_to_read = FED_COM_BUFFER_SIZE; } - read_from_socket_fail_on_error(&sending_federate->socket, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(sending_federate->fed_netchan, bytes_to_read, buffer, NULL, "RTI failed to read message chunks."); total_bytes_read += bytes_to_read; // FIXME: a mutex needs to be held for this so that other threads // do not write to destination_socket and cause interleaving. However, // holding the rti_mutex might be very expensive. Instead, each outgoing - // socket should probably have its own mutex. - write_to_socket_fail_on_error(&fed->socket, bytes_to_read, buffer, &rti_mutex, + // network channel should probably have its own mutex. + write_to_netchan_fail_on_error(fed->fed_netchan, bytes_to_read, buffer, &rti_mutex, "RTI failed to send message chunks."); } @@ -382,7 +382,7 @@ void handle_timed_message(federate_info_t* sending_federate, unsigned char* buff void handle_latest_tag_confirmed(federate_info_t* fed) { unsigned char buffer[sizeof(int64_t) + sizeof(uint32_t)]; - read_from_socket_fail_on_error(&fed->socket, sizeof(int64_t) + sizeof(uint32_t), buffer, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, sizeof(int64_t) + sizeof(uint32_t), buffer, NULL, "RTI failed to read the content of the logical tag complete from federate %d.", fed->enclave.id); tag_t completed = extract_tag(buffer); @@ -400,7 +400,7 @@ void handle_latest_tag_confirmed(federate_info_t* fed) { void handle_next_event_tag(federate_info_t* fed) { unsigned char buffer[sizeof(int64_t) + sizeof(uint32_t)]; - read_from_socket_fail_on_error(&fed->socket, sizeof(int64_t) + sizeof(uint32_t), buffer, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, sizeof(int64_t) + sizeof(uint32_t), buffer, NULL, "RTI failed to read the content of the next event tag from federate %d.", fed->enclave.id); @@ -458,7 +458,7 @@ static void broadcast_stop_time_to_federates_locked() { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_STOP_GRN, fed->enclave.id, &rti_remote->base.max_stop_tag); } - write_to_socket_fail_on_error(&fed->socket, MSG_TYPE_STOP_GRANTED_LENGTH, outgoing_buffer, &rti_mutex, + write_to_netchan_fail_on_error(fed->fed_netchan, MSG_TYPE_STOP_GRANTED_LENGTH, outgoing_buffer, &rti_mutex, "RTI failed to send MSG_TYPE_STOP_GRANTED message to federate %d.", fed->enclave.id); } @@ -511,7 +511,7 @@ void handle_stop_request_message(federate_info_t* fed) { size_t bytes_to_read = MSG_TYPE_STOP_REQUEST_LENGTH - 1; unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&fed->socket, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, bytes_to_read, buffer, NULL, "RTI failed to read the MSG_TYPE_STOP_REQUEST payload from federate %d.", fed->enclave.id); @@ -578,7 +578,7 @@ void handle_stop_request_message(federate_info_t* fed) { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_STOP_REQ, f->enclave.id, &rti_remote->base.max_stop_tag); } - write_to_socket_fail_on_error(&f->socket, MSG_TYPE_STOP_REQUEST_LENGTH, stop_request_buffer, &rti_mutex, + write_to_netchan_fail_on_error(f->fed_netchan, MSG_TYPE_STOP_REQUEST_LENGTH, stop_request_buffer, &rti_mutex, "RTI failed to forward MSG_TYPE_STOP_REQUEST message to federate %d.", f->enclave.id); } @@ -591,7 +591,7 @@ void handle_stop_request_message(federate_info_t* fed) { void handle_stop_request_reply(federate_info_t* fed) { size_t bytes_to_read = MSG_TYPE_STOP_REQUEST_REPLY_LENGTH - 1; unsigned char buffer_stop_time[bytes_to_read]; - read_from_socket_fail_on_error(&fed->socket, bytes_to_read, buffer_stop_time, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, bytes_to_read, buffer_stop_time, NULL, "RTI failed to read the reply to MSG_TYPE_STOP_REQUEST message from federate %d.", fed->enclave.id); @@ -621,7 +621,7 @@ void handle_address_query(uint16_t fed_id) { // Use buffer both for reading and constructing the reply. // The length is what is needed for the reply. unsigned char buffer[1 + sizeof(int32_t)]; - read_from_socket_fail_on_error(&fed->socket, sizeof(uint16_t), (unsigned char*)buffer, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, sizeof(uint16_t), (unsigned char*)buffer, NULL, "Failed to read address query."); uint16_t remote_fed_id = extract_uint16(buffer); @@ -641,20 +641,39 @@ void handle_address_query(uint16_t fed_id) { // Encode the port number. federate_info_t* remote_fed = GET_FED_INFO(remote_fed_id); - // Send the port number (which could be -1). + int32_t server_port; + uint32_t* ip_address; + char* server_host_name; + LF_MUTEX_LOCK(&rti_mutex); - encode_int32(remote_fed->server_port, (unsigned char*)&buffer[1]); - write_to_socket_fail_on_error(&fed->socket, sizeof(int32_t) + 1, (unsigned char*)buffer, &rti_mutex, - "Failed to write port number to socket of federate %d.", fed_id); - - // Send the server IP address to federate. - write_to_socket_fail_on_error(&fed->socket, sizeof(remote_fed->server_ip_addr), - (unsigned char*)&remote_fed->server_ip_addr, &rti_mutex, - "Failed to write ip address to socket of federate %d.", fed_id); + // Check if the RTI has initialized the remote federate's network channel. + if (remote_fed->fed_netchan == NULL) { + // RTI has not set up the remote federate. Respond with -1 to indicate an unknown port number. + server_port = -1; + uint32_t temp = 0; + ip_address = &temp; + server_host_name = "localhost"; + } else { + // The network channel is initialized, but the RTI might still not know the port number. This can happen if the RTI + // has not yet received a MSG_TYPE_ADDRESS_ADVERTISEMENT message from the remote federate. In such cases, the + // returned port number might still be -1. + server_port = get_server_port(remote_fed->fed_netchan); + ip_address = (uint32_t*)get_ip_addr(remote_fed->fed_netchan); + server_host_name = get_server_hostname(remote_fed->fed_netchan); + } + + encode_int32(server_port, (unsigned char*)&buffer[1]); + + // Send the port number (which could be -1) and the server IP address to federate. + write_to_netchan_fail_on_error(fed->fed_netchan, 1 + sizeof(int32_t), (unsigned char*)buffer, &rti_mutex, + "Failed to write port number to network channel of federate %d.", fed_id); + + write_to_netchan_fail_on_error(fed->fed_netchan, sizeof(uint32_t), (unsigned char*)ip_address, &rti_mutex, + "Failed to write ip address to network channel of federate %d.", fed_id); LF_MUTEX_UNLOCK(&rti_mutex); - LF_PRINT_DEBUG("Replied to address query from federate %d with address %s:%d.", fed_id, remote_fed->server_hostname, - remote_fed->server_port); + LF_PRINT_DEBUG("Replied to address query from federate %d with address %s:%d.", fed_id, server_host_name, + server_port); } void handle_address_ad(uint16_t federate_id) { @@ -663,7 +682,7 @@ void handle_address_ad(uint16_t federate_id) { // connections to other federates int32_t server_port = -1; unsigned char buffer[sizeof(int32_t)]; - read_from_socket_fail_on_error(&fed->socket, sizeof(int32_t), (unsigned char*)buffer, NULL, + read_from_netchan_fail_on_error(fed->fed_netchan, sizeof(int32_t), (unsigned char*)buffer, NULL, "Error reading port data from federate %d.", federate_id); server_port = extract_int32(buffer); @@ -671,7 +690,7 @@ void handle_address_ad(uint16_t federate_id) { assert(server_port < 65536); LF_MUTEX_LOCK(&rti_mutex); - fed->server_port = server_port; + set_server_port(fed->fed_netchan, server_port); LF_MUTEX_UNLOCK(&rti_mutex); LF_PRINT_LOG("Received address advertisement with port %d from federate %d.", server_port, federate_id); @@ -682,8 +701,8 @@ void handle_address_ad(uint16_t federate_id) { void handle_timestamp(federate_info_t* my_fed) { unsigned char buffer[sizeof(int64_t)]; - // Read bytes from the socket. We need 8 bytes. - read_from_socket_fail_on_error(&my_fed->socket, sizeof(int64_t), (unsigned char*)&buffer, NULL, + // Read bytes from the network channel. We need 8 bytes. + read_from_netchan_fail_on_error(my_fed->fed_netchan, sizeof(int64_t), (unsigned char*)&buffer, NULL, "ERROR reading timestamp from federate %d.\n", my_fed->enclave.id); int64_t timestamp = swap_bytes_if_big_endian_int64(*((int64_t*)(&buffer))); @@ -725,7 +744,7 @@ void handle_timestamp(federate_info_t* my_fed) { tag_t tag = {.time = start_time, .microstep = 0}; tracepoint_rti_to_federate(send_TIMESTAMP, my_fed->enclave.id, &tag); } - if (write_to_socket(my_fed->socket, MSG_TYPE_TIMESTAMP_LENGTH, start_time_buffer)) { + if (write_to_netchan(my_fed->fed_netchan, MSG_TYPE_TIMESTAMP_LENGTH, start_time_buffer)) { lf_print_error("Failed to send the starting time to federate %d.", my_fed->enclave.id); } @@ -739,9 +758,9 @@ void handle_timestamp(federate_info_t* my_fed) { LF_MUTEX_UNLOCK(&rti_mutex); } -void send_physical_clock(unsigned char message_type, federate_info_t* fed, socket_type_t socket_type) { +void send_physical_clock(unsigned char message_type, federate_info_t* fed, bool use_UDP) { if (fed->enclave.state == NOT_CONNECTED) { - lf_print_warning("Clock sync: RTI failed to send physical time to federate %d. Socket not connected.\n", + lf_print_warning("Clock sync: RTI failed to send physical time to federate %d. network channel not connected.\n", fed->enclave.id); return; } @@ -750,9 +769,8 @@ void send_physical_clock(unsigned char message_type, federate_info_t* fed, socke int64_t current_physical_time = lf_time_physical(); encode_int64(current_physical_time, &(buffer[1])); - // Send the message - if (socket_type == UDP) { - // FIXME: UDP_addr is never initialized. + if (use_UDP) { + // Send using UDP LF_PRINT_DEBUG("Clock sync: RTI sending UDP message type %u.", buffer[0]); ssize_t bytes_written = sendto(rti_remote->socket_descriptor_UDP, buffer, 1 + sizeof(int64_t), 0, (struct sockaddr*)&fed->UDP_addr, sizeof(fed->UDP_addr)); @@ -761,10 +779,11 @@ void send_physical_clock(unsigned char message_type, federate_info_t* fed, socke strerror(errno)); return; } - } else if (socket_type == TCP) { - LF_PRINT_DEBUG("Clock sync: RTI sending TCP message type %u.", buffer[0]); + } else { + // Send using network channel. + LF_PRINT_DEBUG("Clock sync: RTI sending message type %u.", buffer[0]); LF_MUTEX_LOCK(&rti_mutex); - write_to_socket_fail_on_error(&fed->socket, 1 + sizeof(int64_t), buffer, &rti_mutex, + write_to_netchan_fail_on_error(fed->fed_netchan, 1 + sizeof(int64_t), buffer, &rti_mutex, "Clock sync: RTI failed to send physical time to federate %d.", fed->enclave.id); LF_MUTEX_UNLOCK(&rti_mutex); } @@ -772,16 +791,18 @@ void send_physical_clock(unsigned char message_type, federate_info_t* fed, socke current_physical_time, fed->enclave.id); } -void handle_physical_clock_sync_message(federate_info_t* my_fed, socket_type_t socket_type) { +void handle_physical_clock_sync_message(federate_info_t* my_fed, bool use_UDP) { // Lock the mutex to prevent interference between sending the two // coded probe messages. LF_MUTEX_LOCK(&rti_mutex); - // Reply with a T4 type message - send_physical_clock(MSG_TYPE_CLOCK_SYNC_T4, my_fed, socket_type); - // Send the corresponding coded probe immediately after, - // but only if this is a UDP channel. - if (socket_type == UDP) { - send_physical_clock(MSG_TYPE_CLOCK_SYNC_CODED_PROBE, my_fed, socket_type); + if (!use_UDP) { + // Reply with a T4 type message + send_physical_clock(MSG_TYPE_CLOCK_SYNC_T4, my_fed, false); + // Send the corresponding coded probe immediately after, + // but only if this is a UDP channel. + } else { + send_physical_clock(MSG_TYPE_CLOCK_SYNC_T4, my_fed, true); + send_physical_clock(MSG_TYPE_CLOCK_SYNC_CODED_PROBE, my_fed, true); } LF_MUTEX_UNLOCK(&rti_mutex); } @@ -823,7 +844,7 @@ void* clock_synchronization_thread(void* noargs) { // Send the RTI's current physical time to the federate // Send on UDP. LF_PRINT_DEBUG("RTI sending T1 message to initiate clock sync round."); - send_physical_clock(MSG_TYPE_CLOCK_SYNC_T1, fed, UDP); + send_physical_clock(MSG_TYPE_CLOCK_SYNC_T1, fed, true); // Listen for reply message, which should be T3. size_t message_size = 1 + sizeof(uint16_t); @@ -848,7 +869,7 @@ void* clock_synchronization_thread(void* noargs) { continue; } LF_PRINT_DEBUG("Clock sync: RTI received T3 message from federate %d.", fed_id_2); - handle_physical_clock_sync_message(GET_FED_INFO(fed_id_2), UDP); + handle_physical_clock_sync_message(GET_FED_INFO(fed_id_2), true); break; } else { // The message is not a T3 message. Discard the message and @@ -884,7 +905,7 @@ void* clock_synchronization_thread(void* noargs) { * @param my_fed The federate sending a MSG_TYPE_FAILED message. */ static void handle_federate_failed(federate_info_t* my_fed) { - // Nothing more to do. Close the socket and exit. + // Nothing more to do. Close the network channel and exit. LF_MUTEX_LOCK(&rti_mutex); if (rti_remote->base.tracing_enabled) { @@ -900,7 +921,7 @@ static void handle_federate_failed(federate_info_t* my_fed) { // Indicate that there will no further events from this federate. my_fed->enclave.next_event = FOREVER_TAG; - shutdown_socket(&my_fed->socket, false); + shutdown_netchan(my_fed->fed_netchan, false); // Check downstream federates to see whether they should now be granted a TAG. // To handle cycles, need to create a boolean array to keep @@ -919,13 +940,13 @@ static void handle_federate_failed(federate_info_t* my_fed) { * This function assumes the caller does not hold the mutex. * * @note At this point, the RTI might have outgoing messages to the federate. This - * function thus first performs a shutdown on the socket, which sends an EOF. It then - * waits for the remote socket to be closed before closing the socket itself. + * function thus first performs a shutdown on the network channel, which sends an EOF. It then + * waits for the remote network channel to be closed before closing the network channel itself. * * @param my_fed The federate sending a MSG_TYPE_RESIGN message. */ static void handle_federate_resign(federate_info_t* my_fed) { - // Nothing more to do. Close the socket and exit. + // Nothing more to do. Close the network channel and exit. LF_MUTEX_LOCK(&rti_mutex); if (rti_remote->base.tracing_enabled) { @@ -939,7 +960,7 @@ static void handle_federate_resign(federate_info_t* my_fed) { // Indicate that there will no further events from this federate. my_fed->enclave.next_event = FOREVER_TAG; - shutdown_socket(&my_fed->socket, true); + shutdown_netchan(my_fed->fed_netchan, true); // Check downstream federates to see whether they should now be granted a TAG. // To handle cycles, need to create a boolean array to keep @@ -963,14 +984,14 @@ void* federate_info_thread_TCP(void* fed) { // Listen for messages from the federate. while (my_fed->enclave.state != NOT_CONNECTED) { // Read no more than one byte to get the message type. - int read_failed = read_from_socket(my_fed->socket, 1, buffer); + int read_failed = read_from_netchan(my_fed->fed_netchan, 1, buffer); if (read_failed) { - // Socket is closed - lf_print_error("RTI: Socket to federate %d is closed. Exiting the thread.", my_fed->enclave.id); + // network channel is closed + lf_print_error("RTI: network channel to federate %d is closed. Exiting the thread.", my_fed->enclave.id); my_fed->enclave.state = NOT_CONNECTED; - // Nothing more to do. Close the socket and exit. - // Prevent multiple threads from closing the same socket at the same time. - shutdown_socket(&my_fed->socket, false); // from unistd.h + // Nothing more to do. Close the network channel and exit. + // Prevent multiple threads from closing the same network channel at the same time. + shutdown_netchan(my_fed->fed_netchan, false); // FIXME: We need better error handling here, but do not stop execution here. break; } @@ -1023,18 +1044,18 @@ void* federate_info_thread_TCP(void* fed) { return NULL; } -void send_reject(int* socket_id, unsigned char error_code) { +void send_reject(netchan_t chan, unsigned char error_code) { LF_PRINT_DEBUG("RTI sending MSG_TYPE_REJECT."); unsigned char response[2]; response[0] = MSG_TYPE_REJECT; response[1] = error_code; LF_MUTEX_LOCK(&rti_mutex); // NOTE: Ignore errors on this response. - if (write_to_socket(*socket_id, 2, response)) { - lf_print_warning("RTI failed to write MSG_TYPE_REJECT message on the socket."); + if (write_to_netchan(chan, 2, response)) { + lf_print_warning("RTI failed to write MSG_TYPE_REJECT message on the network channel."); } - // Close the socket without reading until EOF. - shutdown_socket(socket_id, false); + // Close the network channel without reading until EOF. + shutdown_netchan(chan, false); LF_MUTEX_UNLOCK(&rti_mutex); } @@ -1043,18 +1064,17 @@ void send_reject(int* socket_id, unsigned char error_code) { * a federate ID and a federation ID. If the federation ID * matches this federation, send an MSG_TYPE_ACK and otherwise send * a MSG_TYPE_REJECT message. - * @param socket_id Pointer to the socket on which to listen. - * @param client_fd The socket address. + * @param fed_netchan Pointer to the network channel on which to listen. * @return The federate ID for success or -1 for failure. */ -static int32_t receive_and_check_fed_id_message(int* socket_id) { +static int32_t receive_and_check_fed_id_message(netchan_t fed_netchan) { // Buffer for message ID, federate ID, and federation ID length. size_t length = 1 + sizeof(uint16_t) + 1; // Message ID, federate ID, length of fedration ID. unsigned char buffer[length]; - // Read bytes from the socket. We need 4 bytes. - if (read_from_socket_close_on_error(socket_id, length, buffer)) { - lf_print_error("RTI failed to read from accepted socket."); + // Read bytes from the network channel. We need 4 bytes. + if (read_from_netchan_close_on_error(fed_netchan, length, buffer)) { + lf_print_error("RTI failed to read from accepted network channel."); return -1; } @@ -1073,12 +1093,12 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { // of the peer they want to connect to from the RTI. // If the connection is a peer-to-peer connection between two // federates, reject the connection with the WRONG_SERVER error. - send_reject(socket_id, WRONG_SERVER); + send_reject(fed_netchan, WRONG_SERVER); } else if (buffer[0] == MSG_TYPE_FED_NONCE) { - send_reject(socket_id, RTI_NOT_EXECUTED_WITH_AUTH); + send_reject(fed_netchan, RTI_NOT_EXECUTED_WITH_AUTH); lf_print_error("RTI not executed with HMAC authentication option using -a or --auth."); } else { - send_reject(socket_id, UNEXPECTED_MESSAGE); + send_reject(fed_netchan, UNEXPECTED_MESSAGE); } lf_print_error("RTI expected a MSG_TYPE_FED_IDS message. Got %u (see net_common.h).", buffer[0]); return -1; @@ -1091,7 +1111,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { size_t federation_id_length = (size_t)buffer[sizeof(uint16_t) + 1]; char federation_id_received[federation_id_length + 1]; // One extra for null terminator. // Next read the actual federation ID. - if (read_from_socket_close_on_error(socket_id, federation_id_length, (unsigned char*)federation_id_received)) { + if (read_from_netchan_close_on_error(fed_netchan, federation_id_length, (unsigned char*)federation_id_received)) { lf_print_error("RTI failed to read federation id from federate %d.", fed_id); return -1; } @@ -1112,7 +1132,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_REJECT, fed_id, NULL); } - send_reject(socket_id, FEDERATION_ID_DOES_NOT_MATCH); + send_reject(fed_netchan, FEDERATION_ID_DOES_NOT_MATCH); return -1; } else { if (fed_id >= rti_remote->base.number_of_scheduling_nodes) { @@ -1121,7 +1141,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_REJECT, fed_id, NULL); } - send_reject(socket_id, FEDERATE_ID_OUT_OF_RANGE); + send_reject(fed_netchan, FEDERATE_ID_OUT_OF_RANGE); return -1; } else { if ((rti_remote->base.scheduling_nodes[fed_id])->state != NOT_CONNECTED) { @@ -1129,7 +1149,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { if (rti_remote->base.tracing_enabled) { tracepoint_rti_to_federate(send_REJECT, fed_id, NULL); } - send_reject(socket_id, FEDERATE_ID_IN_USE); + send_reject(fed_netchan, FEDERATE_ID_IN_USE); return -1; } } @@ -1138,24 +1158,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { federate_info_t* fed = GET_FED_INFO(fed_id); // The MSG_TYPE_FED_IDS message has the right federation ID. - // Get the peer address from the connected socket_id. Then assign it as the federate's socket server. - struct sockaddr_in peer_addr; - socklen_t addr_len = sizeof(peer_addr); - if (getpeername(*socket_id, (struct sockaddr*)&peer_addr, &addr_len) != 0) { - lf_print_error("RTI failed to get peer address."); - } - fed->server_ip_addr = peer_addr.sin_addr; - -#if LOG_LEVEL >= LOG_LEVEL_DEBUG - // Create the human readable format and copy that into - // the .server_hostname field of the federate. - char str[INET_ADDRSTRLEN + 1]; - inet_ntop(AF_INET, &fed->server_ip_addr, str, INET_ADDRSTRLEN); - strncpy(fed->server_hostname, str, INET_ADDRSTRLEN); - - LF_PRINT_DEBUG("RTI got address %s from federate %d.", fed->server_hostname, fed_id); -#endif - fed->socket = *socket_id; + fed->fed_netchan = fed_netchan; // Set the federate's state as pending // because it is waiting for the start time to be @@ -1169,7 +1172,7 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { tracepoint_rti_to_federate(send_ACK, fed_id, NULL); } LF_MUTEX_LOCK(&rti_mutex); - if (write_to_socket_close_on_error(&fed->socket, 1, &ack_message)) { + if (write_to_netchan_close_on_error(fed->fed_netchan, 1, &ack_message)) { LF_MUTEX_UNLOCK(&rti_mutex); lf_print_error("RTI failed to write MSG_TYPE_ACK message to federate %d.", fed_id); return -1; @@ -1186,10 +1189,10 @@ static int32_t receive_and_check_fed_id_message(int* socket_id) { * out the relevant information in the federate's struct. * @return 1 on success and 0 on failure. */ -static int receive_connection_information(int* socket_id, uint16_t fed_id) { +static int receive_connection_information(netchan_t fed_netchan, uint16_t fed_id) { LF_PRINT_DEBUG("RTI waiting for MSG_TYPE_NEIGHBOR_STRUCTURE from federate %d.", fed_id); unsigned char connection_info_header[MSG_TYPE_NEIGHBOR_STRUCTURE_HEADER_SIZE]; - read_from_socket_fail_on_error(socket_id, MSG_TYPE_NEIGHBOR_STRUCTURE_HEADER_SIZE, connection_info_header, NULL, + read_from_netchan_fail_on_error(fed_netchan, MSG_TYPE_NEIGHBOR_STRUCTURE_HEADER_SIZE, connection_info_header, NULL, "RTI failed to read MSG_TYPE_NEIGHBOR_STRUCTURE message header from federate %d.", fed_id); @@ -1197,7 +1200,7 @@ static int receive_connection_information(int* socket_id, uint16_t fed_id) { lf_print_error("RTI was expecting a MSG_TYPE_UDP_PORT message from federate %d. Got %u instead. " "Rejecting federate.", fed_id, connection_info_header[0]); - send_reject(socket_id, UNEXPECTED_MESSAGE); + send_reject(fed_netchan, UNEXPECTED_MESSAGE); return 0; } else { federate_info_t* fed = GET_FED_INFO(fed_id); @@ -1229,7 +1232,7 @@ static int receive_connection_information(int* socket_id, uint16_t fed_id) { if (connections_info_body_size > 0) { connections_info_body = (unsigned char*)malloc(connections_info_body_size); LF_ASSERT_NON_NULL(connections_info_body); - read_from_socket_fail_on_error(socket_id, connections_info_body_size, connections_info_body, NULL, + read_from_netchan_fail_on_error(fed_netchan, connections_info_body_size, connections_info_body, NULL, "RTI failed to read MSG_TYPE_NEIGHBOR_STRUCTURE message body from federate %d.", fed_id); // Keep track of where we are in the buffer @@ -1263,23 +1266,23 @@ static int receive_connection_information(int* socket_id, uint16_t fed_id) { * up to perform runtime clock synchronization using the UDP port number * specified in the payload to communicate with the federate's clock * synchronization logic. - * @param socket_id The socket on which to listen. + * @param fed_netchan The network channel on which to listen. * @param fed_id The federate ID. * @return 1 for success, 0 for failure. */ -static int receive_udp_message_and_set_up_clock_sync(int* socket_id, uint16_t fed_id) { +static int receive_udp_message_and_set_up_clock_sync(netchan_t fed_netchan, uint16_t fed_id) { // Read the MSG_TYPE_UDP_PORT message from the federate regardless of the status of // clock synchronization. This message will tell the RTI whether the federate // is doing clock synchronization, and if it is, what port to use for UDP. LF_PRINT_DEBUG("RTI waiting for MSG_TYPE_UDP_PORT from federate %d.", fed_id); unsigned char response[1 + sizeof(uint16_t)]; - read_from_socket_fail_on_error(socket_id, 1 + sizeof(uint16_t), response, NULL, + read_from_netchan_fail_on_error(fed_netchan, 1 + sizeof(uint16_t), response, NULL, "RTI failed to read MSG_TYPE_UDP_PORT message from federate %d.", fed_id); if (response[0] != MSG_TYPE_UDP_PORT) { lf_print_error("RTI was expecting a MSG_TYPE_UDP_PORT message from federate %d. Got %u instead. " "Rejecting federate.", fed_id, response[0]); - send_reject(socket_id, UNEXPECTED_MESSAGE); + send_reject(fed_netchan, UNEXPECTED_MESSAGE); return 0; } else { federate_info_t* fed = GET_FED_INFO(fed_id); @@ -1295,20 +1298,20 @@ static int receive_udp_message_and_set_up_clock_sync(int* socket_id, uint16_t fe // Send the required number of messages for clock synchronization for (int i = 0; i < rti_remote->clock_sync_exchanges_per_interval; i++) { // Send the RTI's current physical time T1 to the federate. - send_physical_clock(MSG_TYPE_CLOCK_SYNC_T1, fed, TCP); + send_physical_clock(MSG_TYPE_CLOCK_SYNC_T1, fed, false); // Listen for reply message, which should be T3. size_t message_size = 1 + sizeof(uint16_t); unsigned char buffer[message_size]; - read_from_socket_fail_on_error(socket_id, message_size, buffer, NULL, - "Socket to federate %d unexpectedly closed.", fed_id); + read_from_netchan_fail_on_error(fed_netchan, message_size, buffer, NULL, + "network channel to federate %d unexpectedly closed.", fed_id); if (buffer[0] == MSG_TYPE_CLOCK_SYNC_T3) { uint16_t fed_id = extract_uint16(&(buffer[1])); LF_PRINT_DEBUG("RTI received T3 clock sync message from federate %d.", fed_id); - handle_physical_clock_sync_message(fed, TCP); + handle_physical_clock_sync_message(fed, false); } else { lf_print_error("Unexpected message %u from federate %d.", buffer[0], fed_id); - send_reject(socket_id, UNEXPECTED_MESSAGE); + send_reject(fed_netchan, UNEXPECTED_MESSAGE); return 0; } } @@ -1320,7 +1323,7 @@ static int receive_udp_message_and_set_up_clock_sync(int* socket_id, uint16_t fe // Initialize the UDP_addr field of the federate struct fed->UDP_addr.sin_family = AF_INET; fed->UDP_addr.sin_port = htons(federate_UDP_port_number); - fed->UDP_addr.sin_addr = fed->server_ip_addr; + fed->UDP_addr.sin_addr = *get_ip_addr(fed_netchan); } } else { // Disable clock sync after initial round. @@ -1343,14 +1346,14 @@ static int receive_udp_message_and_set_up_clock_sync(int* socket_id, uint16_t fe /** * Authenticate incoming federate by performing HMAC-based authentication. * - * @param socket Socket for the incoming federate tryting to authenticate. + * @param fed_netchan network channel for the incoming federate tryting to authenticate. * @return True if authentication is successful and false otherwise. */ -static bool authenticate_federate(int* socket) { +static bool authenticate_federate(netchan_t fed_netchan) { // Wait for MSG_TYPE_FED_NONCE from federate. size_t fed_id_length = sizeof(uint16_t); unsigned char buffer[1 + fed_id_length + NONCE_LENGTH]; - read_from_socket_fail_on_error(socket, 1 + fed_id_length + NONCE_LENGTH, buffer, NULL, + read_from_netchan_fail_on_error(fed_netchan, 1 + fed_id_length + NONCE_LENGTH, buffer, NULL, "Failed to read MSG_TYPE_FED_NONCE"); if (buffer[0] != MSG_TYPE_FED_NONCE) { lf_print_error_and_exit("Received unexpected response %u from the FED (see net_common.h).", buffer[0]); @@ -1375,13 +1378,13 @@ static bool authenticate_federate(int* socket) { RAND_bytes(rti_nonce, NONCE_LENGTH); memcpy(&sender[1], rti_nonce, NONCE_LENGTH); memcpy(&sender[1 + NONCE_LENGTH], hmac_tag, hmac_length); - if (write_to_socket(*socket, 1 + NONCE_LENGTH + hmac_length, sender)) { + if (write_to_netchan(fed_netchan, 1 + NONCE_LENGTH + hmac_length, sender)) { lf_print_error("Failed to send nonce to federate."); } // Wait for MSG_TYPE_FED_RESPONSE unsigned char received[1 + hmac_length]; - read_from_socket_fail_on_error(socket, 1 + hmac_length, received, NULL, "Failed to read federate response."); + read_from_netchan_fail_on_error(fed_netchan, 1 + hmac_length, received, NULL, "Failed to read federate response."); if (received[0] != MSG_TYPE_FED_RESPONSE) { lf_print_error_and_exit("Received unexpected response %u from the federate (see net_common.h).", received[0]); return false; @@ -1400,7 +1403,7 @@ static bool authenticate_federate(int* socket) { if (memcmp(&received[1], rti_tag, hmac_length) != 0) { // Federation IDs do not match. Send back a HMAC_DOES_NOT_MATCH message. lf_print_warning("HMAC authentication failed. Rejecting the federate."); - send_reject(socket, HMAC_DOES_NOT_MATCH); + send_reject(fed_netchan, HMAC_DOES_NOT_MATCH); return false; } else { LF_PRINT_LOG("Federate's HMAC verified."); @@ -1409,16 +1412,20 @@ static bool authenticate_federate(int* socket) { } #endif -void lf_connect_to_federates(int socket_descriptor) { +void lf_connect_to_federates(netchan_t rti_netchan) { for (int i = 0; i < rti_remote->base.number_of_scheduling_nodes; i++) { - int socket_id = accept_socket(rti_remote->socket_descriptor_TCP, -1); + netchan_t fed_netchan = accept_netchan(rti_netchan, NULL); + if (fed_netchan == NULL) { + lf_print_warning("RTI failed to accept the federate."); + return; + } // Wait for the first message from the federate when RTI -a option is on. #ifdef __RTI_AUTH__ if (rti_remote->authentication_enabled) { - if (!authenticate_federate(&socket_id)) { + if (!authenticate_federate(fed_netchan)) { lf_print_warning("RTI failed to authenticate the incoming federate."); - // Close the socket without reading until EOF. - shutdown_socket(&socket_id, false); + // Close the network channel without reading until EOF. + shutdown_netchan(fed_netchan, false); // Ignore the federate that failed authentication. i--; continue; @@ -1427,9 +1434,9 @@ void lf_connect_to_federates(int socket_descriptor) { #endif // The first message from the federate should contain its ID and the federation ID. - int32_t fed_id = receive_and_check_fed_id_message(&socket_id); - if (fed_id >= 0 && socket_id >= 0 && receive_connection_information(&socket_id, (uint16_t)fed_id) && - receive_udp_message_and_set_up_clock_sync(&socket_id, (uint16_t)fed_id)) { + int32_t fed_id = receive_and_check_fed_id_message(fed_netchan); + if (fed_id >= 0 && receive_connection_information(fed_netchan, (uint16_t)fed_id) && + receive_udp_message_and_set_up_clock_sync(fed_netchan, (uint16_t)fed_id)) { // Create a thread to communicate with the federate. // This has to be done after clock synchronization is finished @@ -1468,9 +1475,9 @@ void* respond_to_erroneous_connections(void* nothing) { while (true) { // Wait for an incoming connection request. // The following will block until either a federate attempts to connect - // or shutdown_socket(rti->socket_descriptor_TCP) is called. - int socket_id = accept_socket(rti_remote->socket_descriptor_TCP, -1); - if (socket_id < 0) { + // or shutdown_netchan(rti->rti_netchan) is called. + netchan_t fed_netchan = accept_netchan(rti_remote->rti_netchan, NULL); + if (fed_netchan == NULL) { return NULL; } if (rti_remote->all_federates_exited) { @@ -1482,11 +1489,11 @@ void* respond_to_erroneous_connections(void* nothing) { response[0] = MSG_TYPE_REJECT; response[1] = FEDERATION_ID_DOES_NOT_MATCH; // Ignore errors on this response. - if (write_to_socket(socket_id, 2, response)) { + if (write_to_netchan(fed_netchan, 2, response)) { lf_print_warning("RTI failed to write FEDERATION_ID_DOES_NOT_MATCH to erroneous incoming connection."); } - // Close the socket without reading until EOF. - shutdown_socket(&socket_id, false); + // Close the network channel without reading until EOF. + shutdown_netchan(fed_netchan, false); } return NULL; } @@ -1494,40 +1501,41 @@ void* respond_to_erroneous_connections(void* nothing) { void initialize_federate(federate_info_t* fed, uint16_t id) { initialize_scheduling_node(&(fed->enclave), id); fed->requested_stop = false; - fed->socket = -1; // No socket. fed->clock_synchronization_enabled = true; fed->in_transit_message_tags = pqueue_tag_init(10); - strncpy(fed->server_hostname, "localhost", INET_ADDRSTRLEN); - fed->server_ip_addr.s_addr = 0; - fed->server_port = -1; } -int32_t start_rti_server(uint16_t port) { +int start_rti_server() { _lf_initialize_clock(); - // Create the TCP socket server - if (create_server(port, &rti_remote->socket_descriptor_TCP, &rti_remote->final_port_TCP, TCP, true)) { + // Initialize RTI's network channel. + rti_remote->rti_netchan = initialize_netchan(); + // Set the user specified port to the network channel. + set_my_port(rti_remote->rti_netchan, rti_remote->user_specified_port); + // Create the server + if (create_server(rti_remote->rti_netchan, true)) { lf_print_error_system_failure("RTI failed to create TCP server: %s.", strerror(errno)); + return -1; }; lf_print("RTI: Listening for federates."); // Create the UDP socket server - // Try to get the rti_remote->final_port_TCP + 1 port if (rti_remote->clock_sync_global_status >= clock_sync_on) { - if (create_server(rti_remote->final_port_TCP + 1, &rti_remote->socket_descriptor_UDP, &rti_remote->final_port_UDP, - UDP, true)) { + if (create_socket_server(DEFAULT_UDP_PORT, &rti_remote->socket_descriptor_UDP, &rti_remote->final_port_UDP, UDP, + false)) { lf_print_error_system_failure("RTI failed to create UDP server: %s.", strerror(errno)); + return -1; } } - return rti_remote->socket_descriptor_TCP; + return 0; } -void wait_for_federates(int socket_descriptor) { +void wait_for_federates() { // Wait for connections from federates and create a thread for each. - lf_connect_to_federates(socket_descriptor); + lf_connect_to_federates(rti_remote->rti_netchan); // All federates have connected. lf_print("RTI: All expected federates have connected. Starting execution."); - // The socket server will not continue to accept connections after all the federates + // The network channel server will not continue to accept connections after all the federates // have joined. // In case some other federation's federates are trying to join the wrong // federation, need to respond. Start a separate thread to do that. @@ -1546,12 +1554,13 @@ void wait_for_federates(int socket_descriptor) { rti_remote->all_federates_exited = true; - // Shutdown and close the socket that is listening for incoming connections + // Shutdown and close the network channel that is listening for incoming connections // so that the accept() call in respond_to_erroneous_connections returns. // That thread should then check rti->all_federates_exited and it should exit. - shutdown_socket(&socket_descriptor, false); + shutdown_netchan(rti_remote->rti_netchan, false); if (rti_remote->socket_descriptor_UDP > 0) { + // UDP only uses sockets. shutdown_socket(&rti_remote->socket_descriptor_UDP, false); } } @@ -1574,8 +1583,6 @@ void initialize_RTI(rti_remote_t* rti) { rti_remote->all_federates_exited = false; rti_remote->federation_id = "Unidentified Federation"; rti_remote->user_specified_port = 0; - rti_remote->final_port_TCP = 0; - rti_remote->socket_descriptor_TCP = -1; rti_remote->final_port_UDP = UINT16_MAX; rti_remote->socket_descriptor_UDP = -1; rti_remote->clock_sync_global_status = clock_sync_init; diff --git a/core/federated/RTI/rti_remote.h b/core/federated/RTI/rti_remote.h index 99e439588..81ab67984 100644 --- a/core/federated/RTI/rti_remote.h +++ b/core/federated/RTI/rti_remote.h @@ -15,13 +15,6 @@ #ifndef RTI_REMOTE_H #define RTI_REMOTE_H -#include -#include // Provides select() function to read from multiple sockets. -#include // Defines struct sockaddr_in -#include // inet_ntop & inet_pton -#include // Defines read(), write(), and close() -#include // Defines bzero(). - #include "rti_common.h" #ifdef __RTI_AUTH__ @@ -31,7 +24,7 @@ #include "lf_types.h" #include "pqueue_tag.h" -#include "socket_common.h" +#include "net_driver.h" /** Time allowed for federates to reply to stop request. */ #define MAX_TIME_FOR_REPLY_TO_STOP_REQUEST SEC(30) @@ -53,20 +46,13 @@ typedef struct federate_info_t { // to a request for stop from the RTI. Used to prevent double-counting // a federate when handling lf_request_stop(). lf_thread_t thread_id; // The ID of the thread handling communication with this federate. - int socket; // The TCP socket descriptor for communicating with this federate. + netchan_t fed_netchan; // The netchannel that the RTI handling each federate. struct sockaddr_in UDP_addr; // The UDP address for the federate. bool clock_synchronization_enabled; // Indicates the status of clock synchronization // for this federate. Enabled by default. pqueue_tag_t* in_transit_message_tags; // Record of in-transit messages to this federate that are not // yet processed. This record is ordered based on the time // value of each message for a more efficient access. - char server_hostname[INET_ADDRSTRLEN]; // Human-readable IP address and - int32_t server_port; // port number of the socket server of the federate - // if it has any incoming direct connections from other federates. - // The port number will be -1 if there is no server or if the - // RTI has not been informed of the port number. - struct in_addr server_ip_addr; // Information about the IP address of the socket - // server of the federate. } federate_info_t; /** @@ -113,15 +99,11 @@ typedef struct rti_remote_t { const char* federation_id; /************* TCP server information *************/ - /** The desired port specified by the user on the command line. */ + /** The desired port specified by the user on the command line. + * This should be not moved to the net_driver, because the user can configure this as -p or --port. + */ uint16_t user_specified_port; - /** The final port number that the TCP socket server ends up using. */ - uint16_t final_port_TCP; - - /** The TCP socket descriptor for the socket server. */ - int socket_descriptor_TCP; - /************* UDP server information *************/ /** The final port number that the UDP socket server ends up using. */ uint16_t final_port_UDP; @@ -129,6 +111,11 @@ typedef struct rti_remote_t { /** The UDP socket descriptor for the socket server. */ int socket_descriptor_UDP; + /** + * The rti's network channel. + */ + netchan_t rti_netchan; + /************* Clock synchronization information *************/ /* Thread performing PTP clock sync sessions periodically. */ lf_thread_t clock_thread; @@ -295,15 +282,15 @@ void handle_timestamp(federate_info_t* my_fed); /** * Take a snapshot of the physical clock time and send - * it to federate fed_id. + * it to federate fed_id using the network channel. * * This version assumes the caller holds the mutex lock. * * @param message_type The type of the clock sync message (see net_common.h). * @param fed The federate to send the physical time to. - * @param socket_type The socket type (TCP or UDP). + * @param use_UDP Boolean to use UDP or the network channel. */ -void send_physical_clock(unsigned char message_type, federate_info_t* fed, socket_type_t socket_type); +void send_physical_clock(unsigned char message_type, federate_info_t* fed, bool use_UDP); /** * Handle clock synchronization T3 messages from federates. @@ -316,9 +303,9 @@ void send_physical_clock(unsigned char message_type, federate_info_t* fed, socke * clock synchronization round. * * @param my_fed The sending federate. - * @param socket_type The RTI's socket type used for the communication (TCP or UDP) + * @param use_UDP Boolean to send a coded probe message (for UDP only). */ -void handle_physical_clock_sync_message(federate_info_t* my_fed, socket_type_t socket_type); +void handle_physical_clock_sync_message(federate_info_t* my_fed, bool use_UDP); /** * A (quasi-)periodic thread that performs clock synchronization with each @@ -342,18 +329,18 @@ void* federate_info_thread_TCP(void* fed); /** * Send a MSG_TYPE_REJECT message to the specified socket and close the socket. - * @param socket_id Pointer to the socket ID. + * @param chan Pointer to the network channel. * @param error_code An error code. */ -void send_reject(int* socket_id, unsigned char error_code); +void send_reject(netchan_t chan, unsigned char error_code); /** * Wait for one incoming connection request from each federate, * and upon receiving it, create a thread to communicate with * that federate. Return when all federates have connected. - * @param socket_descriptor The socket on which to accept connections. + * @param rti_netchan The rti's network channel on which to accept connections. */ -void lf_connect_to_federates(int socket_descriptor); +void lf_connect_to_federates(netchan_t rti_netchan); /** * Thread to respond to new connections, which could be federates of other @@ -369,20 +356,16 @@ void* respond_to_erroneous_connections(void* nothing); void initialize_federate(federate_info_t* fed, uint16_t id); /** - * Start the socket server for the runtime infrastructure (RTI) and - * return the socket descriptor. - * @param num_feds Number of federates. - * @param port The port on which to listen for socket connections, or - * 0 to use the default port range. + * Start the socket server for the runtime infrastructure (RTI). + * @return 0 for success, -1 for failure. */ -int32_t start_rti_server(uint16_t port); +int start_rti_server(); /** * Start the runtime infrastructure (RTI) interaction with the federates * and wait for the federates to exit. - * @param socket_descriptor The socket descriptor returned by start_rti_server(). */ -void wait_for_federates(int socket_descriptor); +void wait_for_federates(); /** * Print a usage message. diff --git a/core/federated/clock-sync.c b/core/federated/clock-sync.c index 60a7bd16f..f26c43718 100644 --- a/core/federated/clock-sync.c +++ b/core/federated/clock-sync.c @@ -208,7 +208,7 @@ uint16_t setup_clock_synchronization_with_rti() { return port_to_return; } -void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP) { +void synchronize_initial_physical_clock_with_rti(netchan_t rti_netchan) { LF_PRINT_DEBUG("Waiting for initial clock synchronization messages from the RTI."); size_t message_size = 1 + sizeof(instant_t); @@ -216,7 +216,7 @@ void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP) { for (int i = 0; i < _LF_CLOCK_SYNC_EXCHANGES_PER_INTERVAL; i++) { // The first message expected from the RTI is MSG_TYPE_CLOCK_SYNC_T1 - read_from_socket_fail_on_error(rti_socket_TCP, message_size, buffer, NULL, + read_from_netchan_fail_on_error(rti_netchan, message_size, buffer, NULL, "Federate %d did not get the initial clock synchronization message T1 from the RTI.", _lf_my_fed_id); @@ -230,12 +230,12 @@ void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP) { // Handle the message and send a reply T3 message. // NOTE: No need to acquire the mutex lock during initialization because only // one thread is running. - if (handle_T1_clock_sync_message(buffer, *rti_socket_TCP, receive_time) != 0) { + if (handle_T1_clock_sync_message(buffer, (void*)rti_netchan, receive_time, false) != 0) { lf_print_error_and_exit("Initial clock sync: Failed to send T3 reply to RTI."); } // Next message from the RTI is required to be MSG_TYPE_CLOCK_SYNC_T4 - read_from_socket_fail_on_error(rti_socket_TCP, message_size, buffer, NULL, + read_from_netchan_fail_on_error(rti_netchan, message_size, buffer, NULL, "Federate %d did not get the clock synchronization message T4 from the RTI.", _lf_my_fed_id); @@ -245,7 +245,7 @@ void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP) { } // Handle the message. - handle_T4_clock_sync_message(buffer, *rti_socket_TCP, receive_time); + handle_T4_clock_sync_message(buffer, (void*)rti_netchan, receive_time, false); } LF_PRINT_LOG("Finished initial clock synchronization with the RTI."); @@ -258,11 +258,12 @@ void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP) { * It also measures the time it takes between when the method is * called and the reply has been sent. * @param buffer The buffer containing the message, including the message type. - * @param socket The socket (either _lf_rti_socket_TCP or _lf_rti_socket_UDP). + * @param socket_or_netchan The pointer of either UDP socket or the network channel. * @param t2 The physical time at which the T1 message was received. + * @param use_UDP Boolean to use UDP or the network channel. * @return 0 if T3 reply is successfully sent, -1 otherwise. */ -int handle_T1_clock_sync_message(unsigned char* buffer, int socket, instant_t t2) { +int handle_T1_clock_sync_message(unsigned char* buffer, void* socket_or_netchan, instant_t t2, bool use_udp) { // Extract the payload instant_t t1 = extract_int64(&(buffer[1])); @@ -282,7 +283,10 @@ int handle_T1_clock_sync_message(unsigned char* buffer, int socket, instant_t t2 // Write the reply to the socket. LF_PRINT_DEBUG("Sending T3 message to RTI."); - if (write_to_socket(socket, 1 + sizeof(uint16_t), reply_buffer)) { + int result = use_udp ? write_to_socket(*(int*)socket_or_netchan, 1 + sizeof(uint16_t), reply_buffer) + : write_to_netchan((netchan_t)socket_or_netchan, 1 + sizeof(uint16_t), reply_buffer); + + if (result) { lf_print_error("Clock sync: Failed to send T3 message to RTI."); return -1; } @@ -296,21 +300,22 @@ int handle_T1_clock_sync_message(unsigned char* buffer, int socket, instant_t t2 /** * Handle a clock synchronization message T4 coming from the RTI. - * If the socket is _lf_rti_socket_TCP, then assume we are in the + * If using the network channel, then assume we are in the * initial clock synchronization phase and set the clock offset * based on the estimated clock synchronization error. - * Otherwise, if the socket is _lf_rti_socket_UDP, then this looks also for a + * Otherwise, if using the UDP socket, then this looks also for a * subsequent "coded probe" message on the socket. If the delay between * the T4 and the coded probe message is not as expected, then reject * this clock synchronization round. If it is not rejected, then make * an adjustment to the clock offset based on the estimated error. - * This function does not acquire the socket_mutex lock. + * This function does not acquire the netchan_mutex lock. * The caller should acquire it unless it is sure there is only one thread running. * @param buffer The buffer containing the message, including the message type. - * @param socket The socket (either _lf_rti_socket_TCP or _lf_rti_socket_UDP). + * @param socket_or_netchan The pointer of either UDP socket or the network channel. * @param r4 The physical time at which this T4 message was received. + * @param use_UDP Boolean to use UDP or the network channel. */ -void handle_T4_clock_sync_message(unsigned char* buffer, int socket, instant_t r4) { +void handle_T4_clock_sync_message(unsigned char* buffer, void* socket_or_netchan, instant_t r4, bool use_udp) { // Increment the number of received T4 messages _lf_rti_socket_stat.received_T4_messages_in_current_sync_window++; @@ -342,10 +347,10 @@ void handle_T4_clock_sync_message(unsigned char* buffer, int socket, instant_t r // If the socket is _lf_rti_socket_UDP, then // after sending T4, the RTI sends a "coded probe" message, // which can be used to filter out noise. - if (socket == _lf_rti_socket_UDP) { + if (use_udp) { // Read the coded probe message. // We can reuse the same buffer. - int read_failed = read_from_socket(socket, 1 + sizeof(instant_t), buffer); + int read_failed = read_from_socket(*(int*)socket_or_netchan, 1 + sizeof(instant_t), buffer); instant_t r5 = lf_time_physical(); @@ -376,17 +381,15 @@ void handle_T4_clock_sync_message(unsigned char* buffer, int socket, instant_t r _lf_rti_socket_stat.received_T4_messages_in_current_sync_window--; return; } - // Apply a jitter attenuator to the estimated clock error to prevent - // large jumps in the underlying clock. - // Note that estimated_clock_error is calculated using lf_time_physical() which includes - // the clock sync adjustment. - adjustment = estimated_clock_error / _LF_CLOCK_SYNC_ATTENUATION; - } else { - // Use of TCP socket means we are in the startup phase, so - // rather than adjust the clock offset, we simply set it to the - // estimated error. - adjustment = estimated_clock_error; } + // If use UDP, apply a jitter attenuator to the estimated clock error to prevent + // large jumps in the underlying clock. + // Note that estimated_clock_error is calculated using lf_time_physical() which includes + // the clock sync adjustment. + // Use of TCP socket means we are in the startup phase, so + // rather than adjust the clock offset, we simply set it to the + // estimated error. + adjustment = use_udp ? estimated_clock_error / _LF_CLOCK_SYNC_ATTENUATION : estimated_clock_error; #ifdef _LF_CLOCK_SYNC_COLLECT_STATS // Enabled by default // Update RTI's socket stats @@ -501,7 +504,7 @@ void* listen_to_rti_UDP_thread(void* args) { break; } connected = true; - if (handle_T1_clock_sync_message(buffer, _lf_rti_socket_UDP, receive_time) != 0) { + if (handle_T1_clock_sync_message(buffer, (void*)&_lf_rti_socket_UDP, receive_time, true) != 0) { // Failed to send T3 reply. Wait for the next T1. waiting_for_T1 = true; continue; @@ -514,7 +517,7 @@ void* listen_to_rti_UDP_thread(void* args) { continue; } } else if (buffer[0] == MSG_TYPE_CLOCK_SYNC_T4) { - handle_T4_clock_sync_message(buffer, _lf_rti_socket_UDP, receive_time); + handle_T4_clock_sync_message(buffer, (void*)&_lf_rti_socket_UDP, receive_time, true); waiting_for_T1 = true; } else { lf_print_warning("Clock sync: Received from RTI an unexpected UDP message type: %u. " diff --git a/core/federated/federate.c b/core/federated/federate.c index e5899d462..7c7d5c8e1 100644 --- a/core/federated/federate.c +++ b/core/federated/federate.c @@ -14,14 +14,9 @@ #error No support for federated execution on this platform. #endif -#include // inet_ntop & inet_pton -#include // Defines getaddrinfo(), freeaddrinfo() and struct addrinfo. -#include // Defines struct sockaddr_in -#include -#include // Defines read(), write(), and close() -#include // Defines memset(), strnlen(), strncmp(), strncpy() -#include // Defines strerror() - +#include // inet_ntop +#include // Defines memset(), strnlen(), strncmp(), strncpy() +#include // Defines strerror() #include #include // Defined perror(), errno #include // Defines bzero(). @@ -30,6 +25,7 @@ #include "federate.h" #include "net_common.h" #include "net_util.h" +#include "net_driver.h" #include "reactor.h" #include "reactor_common.h" #include "reactor_threaded.h" @@ -49,7 +45,7 @@ extern instant_t start_time; extern bool _lf_termination_executed; // Global variables references in federate.h -lf_mutex_t lf_outbound_socket_mutex; +lf_mutex_t lf_outbound_netchan_mutex; lf_cond_t lf_port_status_changed; @@ -76,13 +72,10 @@ int max_level_allowed_to_advance; * The state of this federate instance. Each executable has exactly one federate instance, * and the _fed global variable refers to that instance. */ -federate_instance_t _fed = {.socket_TCP_RTI = -1, - .number_of_inbound_p2p_connections = 0, - .inbound_socket_listeners = NULL, +federate_instance_t _fed = {.number_of_inbound_p2p_connections = 0, + .inbound_netchan_listeners = NULL, .number_of_outbound_p2p_connections = 0, .inbound_p2p_handling_thread_id = 0, - .server_socket = -1, - .server_port = -1, .last_TAG = {.time = NEVER, .microstep = 0u}, .is_last_TAG_provisional = false, .has_upstream = false, @@ -103,7 +96,7 @@ federation_metadata_t federation_metadata = { // Static functions (used only internally) /** - * Send a time to the RTI. This acquires the lf_outbound_socket_mutex. + * Send a time to the RTI. This acquires the lf_outbound_netchan_mutex. * @param type The message type (MSG_TYPE_TIMESTAMP). * @param time The time. */ @@ -118,15 +111,15 @@ static void send_time(unsigned char type, instant_t time) { tag_t tag = {.time = time, .microstep = 0}; tracepoint_federate_to_rti(send_TIMESTAMP, _lf_my_fed_id, &tag); - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_write, buffer, &lf_outbound_socket_mutex, + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_write, buffer, &lf_outbound_netchan_mutex, "Failed to send time " PRINTF_TIME " to the RTI.", time - start_time); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); } /** * Send a tag to the RTI. - * This function acquires the lf_outbound_socket_mutex. + * This function acquires the lf_outbound_netchan_mutex. * @param type The message type (MSG_TYPE_NEXT_EVENT_TAG or MSG_TYPE_LATEST_TAG_CONFIRMED). * @param tag The tag. */ @@ -137,32 +130,25 @@ static void send_tag(unsigned char type, tag_t tag) { buffer[0] = type; encode_tag(&(buffer[1]), tag); - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - if (_fed.socket_TCP_RTI < 0) { - lf_print_warning("Socket is no longer connected. Dropping message."); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + if (_fed.netchan_to_RTI == NULL) { + lf_print_warning("RTI is no longer connected. Dropping message."); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return; } trace_event_t event_type = (type == MSG_TYPE_NEXT_EVENT_TAG) ? send_NET : send_LTC; // Trace the event when tracing is enabled tracepoint_federate_to_rti(event_type, _lf_my_fed_id, &tag); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_write, buffer, &lf_outbound_socket_mutex, + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_write, buffer, &lf_outbound_netchan_mutex, "Failed to send tag " PRINTF_TAG " to the RTI.", tag.time - start_time, tag.microstep); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); } /** - * Return true if either the socket to the RTI is broken or the socket is - * alive and the first unread byte on the socket's queue is MSG_TYPE_FAILED. + * Return true if either the network channel to the RTI is broken or the network channel is + * alive and the first unread byte on the network channel's queue is MSG_TYPE_FAILED. */ -static bool rti_failed() { - unsigned char first_byte; - ssize_t bytes = peek_from_socket(_fed.socket_TCP_RTI, &first_byte); - if (bytes < 0 || (bytes == 1 && first_byte == MSG_TYPE_FAILED)) - return true; - else - return false; -} +static bool rti_failed() { return check_netchan_closed(_fed.netchan_to_RTI); } //////////////////////////////// Port Status Handling /////////////////////////////////////// @@ -406,17 +392,17 @@ static trigger_handle_t schedule_message_received_from_network_locked(environmen } /** - * Close the socket that receives incoming messages from the + * Close the network channel that receives incoming messages from the * specified federate ID. This function should be called when a read - * of incoming socket fails or when an EOF is received. + * of incoming network channel fails or when an EOF is received. * It can also be called when the receiving end wants to stop communication. * * @param fed_id The ID of the peer federate sending messages to this * federate. */ -static void close_inbound_socket(int fed_id) { - if (_fed.sockets_for_inbound_p2p_connections[fed_id] >= 0) { - shutdown_socket(&_fed.sockets_for_inbound_p2p_connections[fed_id], false); +static void close_inbound_netchan(int fed_id) { + if (_fed.netchans_for_inbound_p2p_connections[fed_id] >= 0) { + shutdown_netchan(&_fed.netchans_for_inbound_p2p_connections[fed_id], false); } } @@ -467,17 +453,17 @@ static bool handle_message_now(environment_t* env, trigger_t* trigger, tag_t int * Handle a message being received from a remote federate. * * This function assumes the caller does not hold the mutex lock. - * @param socket Pointer to the socket to read the message from. + * @param netchan Pointer to the network channel to read the message from. * @param fed_id The sending federate ID or -1 if the centralized coordination. * @return 0 for success, -1 for failure. */ -static int handle_message(int* socket, int fed_id) { +static int handle_message(netchan_t netchan, int fed_id) { (void)fed_id; // Read the header. size_t bytes_to_read = sizeof(uint16_t) + sizeof(uint16_t) + sizeof(uint32_t); unsigned char buffer[bytes_to_read]; - if (read_from_socket_close_on_error(socket, bytes_to_read, buffer)) { - // Read failed, which means the socket has been closed between reading the + if (read_from_netchan_close_on_error(netchan, bytes_to_read, buffer)) { + // Read failed, which means the network channel has been closed between reading the // message ID byte and here. return -1; } @@ -497,7 +483,7 @@ static int handle_message(int* socket, int fed_id) { // Read the payload. // Allocate memory for the message contents. unsigned char* message_contents = (unsigned char*)malloc(length); - if (read_from_socket_close_on_error(socket, length, message_contents)) { + if (read_from_netchan_close_on_error(netchan, length, message_contents)) { return -1; } // Trace the event when tracing is enabled @@ -521,11 +507,11 @@ static int handle_message(int* socket, int fed_id) { * will not advance to the tag of the message if it is in the future, or * the tag will not advance at all if the tag of the message is * now or in the past. - * @param socket Pointer to the socket to read the message from. + * @param netchan Pointer to the network channel to read the message from. * @param fed_id The sending federate ID or -1 if the centralized coordination. - * @return 0 on successfully reading the message, -1 on failure (e.g. due to socket closed). + * @return 0 on successfully reading the message, -1 on failure (e.g. due to network channel closed). */ -static int handle_tagged_message(int* socket, int fed_id) { +static int handle_tagged_message(netchan_t netchan, int fed_id) { // Environment is always the one corresponding to the top-level scheduling enclave. environment_t* env; _lf_get_environments(&env); @@ -534,7 +520,7 @@ static int handle_tagged_message(int* socket, int fed_id) { size_t bytes_to_read = sizeof(uint16_t) + sizeof(uint16_t) + sizeof(uint32_t) + sizeof(instant_t) + sizeof(microstep_t); unsigned char buffer[bytes_to_read]; - if (read_from_socket_close_on_error(socket, bytes_to_read, buffer)) { + if (read_from_netchan_close_on_error(netchan, bytes_to_read, buffer)) { return -1; // Read failed. } @@ -583,7 +569,7 @@ static int handle_tagged_message(int* socket, int fed_id) { // Read the payload. // Allocate memory for the message contents. unsigned char* message_contents = (unsigned char*)malloc(length); - if (read_from_socket_close_on_error(socket, length, message_contents)) { + if (read_from_netchan_close_on_error(netchan, length, message_contents)) { #ifdef FEDERATED_DECENTRALIZED _lf_decrement_tag_barrier_locked(env); #endif @@ -652,11 +638,11 @@ static int handle_tagged_message(int* socket, int fed_id) { if (lf_tag_compare(env->current_tag, env->stop_tag) >= 0 && env->execution_started) { lf_print_error("Received message too late. Already at stop tag.\n" " Current tag is " PRINTF_TAG " and intended tag is " PRINTF_TAG ".\n" - " Discarding message and closing the socket.", + " Discarding message and closing the network channel.", env->current_tag.time - start_time, env->current_tag.microstep, intended_tag.time - start_time, intended_tag.microstep); - // Close socket, reading any incoming data and discarding it. - close_inbound_socket(fed_id); + // Close network channel, reading any incoming data and discarding it. + close_inbound_netchan(fed_id); LF_MUTEX_UNLOCK(&env->mutex); return -1; } else { @@ -687,14 +673,14 @@ static int handle_tagged_message(int* socket, int fed_id) { * This just sets the last known status tag of the port specified * in the message. * - * @param socket Pointer to the socket to read the message from + * @param netchan Pointer to the network channel to read the message from * @param fed_id The sending federate ID or -1 if the centralized coordination. * @return 0 for success, -1 for failure to complete the read. */ -static int handle_port_absent_message(int* socket, int fed_id) { +static int handle_port_absent_message(netchan_t netchan, int fed_id) { size_t bytes_to_read = sizeof(uint16_t) + sizeof(uint16_t) + sizeof(instant_t) + sizeof(microstep_t); unsigned char buffer[bytes_to_read]; - if (read_from_socket_close_on_error(socket, bytes_to_read, buffer)) { + if (read_from_netchan_close_on_error(netchan, bytes_to_read, buffer)) { return -1; } @@ -731,7 +717,7 @@ static int handle_port_absent_message(int* socket, int fed_id) { * peer federate and calls the appropriate handling function for * each message type. If an error occurs or an EOF is received * from the peer, then this procedure sets the corresponding - * socket in _fed.sockets_for_inbound_p2p_connections + * network channel in _fed.netchans_for_inbound_p2p_connections * to -1 and returns, terminating the thread. * @param _args The remote federate ID (cast to void*). * @param fed_id_ptr A pointer to a uint16_t containing federate ID being listened to. @@ -743,7 +729,7 @@ static void* listen_to_federates(void* _args) { LF_PRINT_LOG("Listening to federate %d.", fed_id); - int* socket_id = &_fed.sockets_for_inbound_p2p_connections[fed_id]; + netchan_t netchan = _fed.netchans_for_inbound_p2p_connections[fed_id]; // Buffer for incoming messages. // This does not constrain the message size @@ -752,44 +738,44 @@ static void* listen_to_federates(void* _args) { // Listen for messages from the federate. while (1) { - bool socket_closed = false; + bool netchan_closed = false; // Read one byte to get the message type. - LF_PRINT_DEBUG("Waiting for a P2P message on socket %d.", *socket_id); + LF_PRINT_DEBUG("Waiting for a P2P message."); bool bad_message = false; - if (read_from_socket_close_on_error(socket_id, 1, buffer)) { - // Socket has been closed. - lf_print("Socket from federate %d is closed.", fed_id); + if (read_from_netchan_close_on_error(netchan, 1, buffer)) { + // network channel has been closed. + lf_print("network channel from federate %d is closed.", fed_id); // Stop listening to this federate. - socket_closed = true; + netchan_closed = true; } else { - LF_PRINT_DEBUG("Received a P2P message on socket %d of type %d.", *socket_id, buffer[0]); + LF_PRINT_DEBUG("Received a P2P message of type %d.", buffer[0]); switch (buffer[0]) { case MSG_TYPE_P2P_MESSAGE: LF_PRINT_LOG("Received untimed message from federate %d.", fed_id); - if (handle_message(socket_id, fed_id)) { + if (handle_message(netchan, fed_id)) { // Failed to complete the reading of a message on a physical connection. lf_print_warning("Failed to complete reading of message on physical connection."); - socket_closed = true; + netchan_closed = true; } break; case MSG_TYPE_P2P_TAGGED_MESSAGE: LF_PRINT_LOG("Received tagged message from federate %d.", fed_id); - if (handle_tagged_message(socket_id, fed_id)) { + if (handle_tagged_message(netchan, fed_id)) { // P2P tagged messages are only used in decentralized coordination, and - // it is not a fatal error if the socket is closed before the whole message is read. + // it is not a fatal error if the network channel is closed before the whole message is read. // But this thread should exit. lf_print_warning("Failed to complete reading of tagged message."); - socket_closed = true; + netchan_closed = true; } break; case MSG_TYPE_PORT_ABSENT: LF_PRINT_LOG("Received port absent message from federate %d.", fed_id); - if (handle_port_absent_message(socket_id, fed_id)) { + if (handle_port_absent_message(netchan, fed_id)) { // P2P tagged messages are only used in decentralized coordination, and - // it is not a fatal error if the socket is closed before the whole message is read. + // it is not a fatal error if the network channel is closed before the whole message is read. // But this thread should exit. lf_print_warning("Failed to complete reading of tagged message."); - socket_closed = true; + netchan_closed = true; } break; default: @@ -797,13 +783,13 @@ static void* listen_to_federates(void* _args) { } } if (bad_message) { - lf_print_error("Received erroneous message type: %d. Closing the socket.", buffer[0]); + lf_print_error("Received erroneous message type: %d. Closing the network channel.", buffer[0]); // Trace the event when tracing is enabled tracepoint_federate_from_federate(receive_UNIDENTIFIED, _lf_my_fed_id, fed_id, NULL); break; // while loop } - if (socket_closed) { - // For decentralized execution, once this socket is closed, we + if (netchan_closed) { + // For decentralized execution, once this network channel is closed, we // update last known tags of all ports connected to the specified federate to FOREVER_TAG, // which would eliminate the need to wait for STAA to assume an input is absent. mark_inputs_known_absent(fed_id); @@ -815,25 +801,27 @@ static void* listen_to_federates(void* _args) { } /** - * Close the socket that sends outgoing messages to the - * specified federate ID. This function acquires the lf_outbound_socket_mutex mutex lock + * Close the network channel that sends outgoing messages to the + * specified federate ID. This function acquires the lf_outbound_netchan_mutex mutex lock * if _lf_normal_termination is true and otherwise proceeds without the lock. * @param fed_id The ID of the peer federate receiving messages from this * federate, or -1 if the RTI (centralized coordination). */ -static void close_outbound_socket(int fed_id) { +static void close_outbound_netchan(int fed_id) { assert(fed_id >= 0 && fed_id < NUMBER_OF_FEDERATES); // Close outbound connections, in case they have not closed themselves. // This will result in EOF being sent to the remote federate, except for - // abnormal termination, in which case it will just close the socket. + // abnormal termination, in which case it will just close the network channel. if (_lf_normal_termination) { - if (_fed.sockets_for_outbound_p2p_connections[fed_id] >= 0) { - // Close the socket by sending a FIN packet indicating that no further writes + if (_fed.netchans_for_outbound_p2p_connections[fed_id] != NULL) { + // Close the network channel by sending a FIN packet indicating that no further writes // are expected. Then read until we get an EOF indication. - shutdown_socket(&_fed.sockets_for_outbound_p2p_connections[fed_id], true); + shutdown_netchan(_fed.netchans_for_outbound_p2p_connections[fed_id], true); + _fed.netchans_for_outbound_p2p_connections[fed_id] = NULL; } } else { - shutdown_socket(&_fed.sockets_for_outbound_p2p_connections[fed_id], false); + shutdown_netchan(_fed.netchans_for_outbound_p2p_connections[fed_id], false); + _fed.netchans_for_outbound_p2p_connections[fed_id] = NULL; } } @@ -855,14 +843,14 @@ static int perform_hmac_authentication() { RAND_bytes(fed_nonce, NONCE_LENGTH); memcpy(&fed_hello_buf[1 + fed_id_length], fed_nonce, NONCE_LENGTH); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, message_length, fed_hello_buf, NULL, "Failed to write nonce."); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, message_length, fed_hello_buf, NULL, "Failed to write nonce."); // Check HMAC of received FED_RESPONSE message. unsigned int hmac_length = SHA256_HMAC_LENGTH; size_t federation_id_length = strnlen(federation_metadata.federation_id, 255); unsigned char received[1 + NONCE_LENGTH + hmac_length]; - if (read_from_socket_close_on_error(&_fed.socket_TCP_RTI, 1 + NONCE_LENGTH + hmac_length, received)) { + if (read_from_netchan_close_on_error(_fed.netchan_to_RTI, 1 + NONCE_LENGTH + hmac_length, received)) { lf_print_warning("Failed to read RTI response."); return -1; } @@ -896,7 +884,7 @@ static int perform_hmac_authentication() { response[1] = HMAC_DOES_NOT_MATCH; // Ignore errors on writing back. - write_to_socket(_fed.socket_TCP_RTI, 2, response); + write_to_netchan(_fed.netchan_to_RTI, 2, response); return -1; } else { LF_PRINT_LOG("HMAC verified."); @@ -910,7 +898,7 @@ static int perform_hmac_authentication() { HMAC(EVP_sha256(), federation_metadata.federation_id, federation_id_length, mac_buf, 1 + NONCE_LENGTH, &sender[1], &hmac_length); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, 1 + hmac_length, sender, NULL, "Failed to write fed response."); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, 1 + hmac_length, sender, NULL, "Failed to write fed response."); } return 0; } @@ -929,12 +917,12 @@ static instant_t get_start_time_from_rti(instant_t my_physical_time) { // Send the timestamp marker first. send_time(MSG_TYPE_TIMESTAMP, my_physical_time); - // Read bytes from the socket. We need 9 bytes. + // Read bytes from the network channel. We need 9 bytes. // Buffer for message ID plus timestamp. size_t buffer_length = 1 + sizeof(instant_t); unsigned char buffer[buffer_length]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, buffer_length, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, buffer_length, buffer, NULL, "Failed to read MSG_TYPE_TIMESTAMP message from RTI."); LF_PRINT_DEBUG("Read 9 bytes."); @@ -978,7 +966,7 @@ static void handle_tag_advance_grant(void) { size_t bytes_to_read = sizeof(instant_t) + sizeof(microstep_t); unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_read, buffer, NULL, "Failed to read tag advance grant from RTI."); tag_t TAG = extract_tag(buffer); @@ -1219,7 +1207,7 @@ static void handle_provisional_tag_advance_grant() { size_t bytes_to_read = sizeof(instant_t) + sizeof(microstep_t); unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_read, buffer, NULL, "Failed to read provisional tag advance grant from RTI."); tag_t PTAG = extract_tag(buffer); @@ -1309,7 +1297,7 @@ static void handle_stop_granted_message() { size_t bytes_to_read = MSG_TYPE_STOP_GRANTED_LENGTH - 1; unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_read, buffer, NULL, "Failed to read stop granted from RTI."); tag_t received_stop_tag = extract_tag(buffer); @@ -1353,7 +1341,7 @@ static void handle_stop_granted_message() { static void handle_stop_request_message() { size_t bytes_to_read = MSG_TYPE_STOP_REQUEST_LENGTH - 1; unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_read, buffer, NULL, "Failed to read stop request from RTI."); tag_t tag_to_stop = extract_tag(buffer); @@ -1379,10 +1367,10 @@ static void handle_stop_request_message() { // or we have previously sent a stop request to the RTI, // then we have already blocked tag advance in enclaves. // Do not do this twice. The record of whether the first has occurred - // is guarded by the outbound socket mutex. + // is guarded by the outbound network channel mutex. // The second is guarded by the global mutex. // Note that the RTI should not send stop requests more than once to federates. - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); if (_fed.received_stop_request_from_rti) { LF_PRINT_LOG("Redundant MSG_TYPE_STOP_REQUEST from RTI. Ignoring it."); already_blocked = true; @@ -1391,7 +1379,7 @@ static void handle_stop_request_message() { // prevent lf_request_stop from sending. _fed.received_stop_request_from_rti = true; } - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); if (already_blocked) { // Either we have sent a stop request to the RTI ourselves, @@ -1425,11 +1413,11 @@ static void handle_stop_request_message() { tracepoint_federate_to_rti(send_STOP_REQ_REP, _lf_my_fed_id, &tag_to_stop); // Send the current logical time to the RTI. - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, MSG_TYPE_STOP_REQUEST_REPLY_LENGTH, outgoing_buffer, - &lf_outbound_socket_mutex, + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, MSG_TYPE_STOP_REQUEST_REPLY_LENGTH, outgoing_buffer, + &lf_outbound_netchan_mutex, "Failed to send the answer to MSG_TYPE_STOP_REQUEST to RTI."); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); LF_PRINT_DEBUG("Sent MSG_TYPE_STOP_REQUEST_REPLY to RTI with tag " PRINTF_TAG, tag_to_stop.time, tag_to_stop.microstep); @@ -1441,7 +1429,7 @@ static void handle_stop_request_message() { static void handle_downstream_next_event_tag() { size_t bytes_to_read = sizeof(instant_t) + sizeof(microstep_t); unsigned char buffer[bytes_to_read]; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_read, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_read, buffer, NULL, "Failed to read downstream next event tag from RTI."); tag_t DNET = extract_tag(buffer); @@ -1472,10 +1460,10 @@ static void send_resign_signal() { size_t bytes_to_write = 1; unsigned char buffer[bytes_to_write]; buffer[0] = MSG_TYPE_RESIGN; - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_write, &(buffer[0]), &lf_outbound_socket_mutex, + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_write, &(buffer[0]), &lf_outbound_netchan_mutex, "Failed to send MSG_TYPE_RESIGN."); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); LF_PRINT_LOG("Resigned."); } @@ -1486,7 +1474,7 @@ static void send_failed_signal() { size_t bytes_to_write = 1; unsigned char buffer[bytes_to_write]; buffer[0] = MSG_TYPE_FAILED; - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, bytes_to_write, &(buffer[0]), NULL, + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, bytes_to_write, &(buffer[0]), NULL, "Failed to send MSG_TYPE_FAILED."); LF_PRINT_LOG("Failed."); } @@ -1500,11 +1488,11 @@ static void send_failed_signal() { static void handle_rti_failed_message(void) { exit(1); } /** - * Thread that listens for TCP inputs from the RTI. + * Thread that listens for network channel inputs from the RTI. * When messages arrive, this calls the appropriate handler. * @param args Ignored */ -static void* listen_to_rti_TCP(void* args) { +static void* listen_to_rti_netchan(void* args) { (void)args; initialize_lf_thread_id(); // Buffer for incoming messages. @@ -1514,39 +1502,27 @@ static void* listen_to_rti_TCP(void* args) { // Listen for messages from the federate. while (1) { - // Check whether the RTI socket is still valid - if (_fed.socket_TCP_RTI < 0) { - lf_print_warning("Socket to the RTI unexpectedly closed."); + // Check whether the RTI network channel is still valid + if (_fed.netchan_to_RTI == NULL) { + lf_print_warning("network channel to the RTI unexpectedly closed."); return NULL; } // Read one byte to get the message type. // This will exit if the read fails. - int read_failed = read_from_socket(_fed.socket_TCP_RTI, 1, buffer); + int read_failed = read_from_netchan(_fed.netchan_to_RTI, 1, buffer); if (read_failed < 0) { - if (errno == ECONNRESET) { - lf_print_error("Socket connection to the RTI was closed by the RTI without" - " properly sending an EOF first. Considering this a soft error."); - // FIXME: If this happens, possibly a new RTI must be elected. - shutdown_socket(&_fed.socket_TCP_RTI, false); - return NULL; - } else { - lf_print_error("Socket connection to the RTI has been broken with error %d: %s." - " The RTI should close connections with an EOF first." - " Considering this a soft error.", - errno, strerror(errno)); - // FIXME: If this happens, possibly a new RTI must be elected. - shutdown_socket(&_fed.socket_TCP_RTI, false); - return NULL; - } + lf_print_error("Connection to the RTI was closed by the RTI with an error. Considering this a soft error."); + shutdown_netchan(_fed.netchan_to_RTI, false); + return NULL; } else if (read_failed > 0) { // EOF received. lf_print("Connection to the RTI closed with an EOF."); - shutdown_socket(&_fed.socket_TCP_RTI, false); + shutdown_netchan(_fed.netchan_to_RTI, false); return NULL; } switch (buffer[0]) { case MSG_TYPE_TAGGED_MESSAGE: - if (handle_tagged_message(&_fed.socket_TCP_RTI, -1)) { + if (handle_tagged_message(_fed.netchan_to_RTI, -1)) { // Failures to complete the read of messages from the RTI are fatal. lf_print_error_and_exit("Failed to complete the reading of a message from the RTI."); } @@ -1564,7 +1540,7 @@ static void* listen_to_rti_TCP(void* args) { handle_stop_granted_message(); break; case MSG_TYPE_PORT_ABSENT: - if (handle_port_absent_message(&_fed.socket_TCP_RTI, -1)) { + if (handle_port_absent_message(_fed.netchan_to_RTI, -1)) { // Failures to complete the read of absent messages from the RTI are fatal. lf_print_error_and_exit("Failed to complete the reading of an absent message from the RTI."); } @@ -1577,10 +1553,10 @@ static void* listen_to_rti_TCP(void* args) { break; case MSG_TYPE_CLOCK_SYNC_T1: case MSG_TYPE_CLOCK_SYNC_T4: - lf_print_error("Federate %d received unexpected clock sync message from RTI on TCP socket.", _lf_my_fed_id); + lf_print_error("Federate %d received unexpected clock sync message from RTI.", _lf_my_fed_id); break; default: - lf_print_error_and_exit("Received from RTI an unrecognized TCP message type: %hhx.", buffer[0]); + lf_print_error_and_exit("Received from RTI an unrecognized message type: %hhx.", buffer[0]); // Trace the event when tracing is enabled tracepoint_federate_from_rti(receive_UNIDENTIFIED, _lf_my_fed_id, NULL); } @@ -1642,7 +1618,7 @@ static bool bounded_NET(tag_t* tag) { // An empty version of this function is code generated for unfederated execution. /** - * Close sockets used to communicate with other federates, if they are open, + * Close network channels used to communicate with other federates, if they are open, * and send a MSG_TYPE_RESIGN message to the RTI. This implements the function * defined in reactor.h. For unfederated execution, the code generator * generates an empty implementation. @@ -1653,7 +1629,7 @@ void lf_terminate_execution(environment_t* env) { // For an abnormal termination (e.g. a SIGINT), we need to send a // MSG_TYPE_FAILED message to the RTI, but we should not acquire a mutex. - if (_fed.socket_TCP_RTI >= 0) { + if (_fed.netchan_to_RTI != NULL) { if (_lf_normal_termination) { tracepoint_federate_to_rti(send_RESIGN, _lf_my_fed_id, &env->current_tag); send_resign_signal(); @@ -1663,45 +1639,45 @@ void lf_terminate_execution(environment_t* env) { } } - LF_PRINT_DEBUG("Closing incoming P2P sockets."); - // Close any incoming P2P sockets that are still open. + LF_PRINT_DEBUG("Closing incoming P2P network channels."); + // Close any incoming P2P network channels that are still open. for (int i = 0; i < NUMBER_OF_FEDERATES; i++) { - close_inbound_socket(i); - // Ignore errors. Mark the socket closed. - _fed.sockets_for_inbound_p2p_connections[i] = -1; + close_inbound_netchan(i); + // Ignore errors. Mark the network channel closed. + _fed.netchans_for_inbound_p2p_connections[i] = NULL; } // Check for all outgoing physical connections in - // _fed.sockets_for_outbound_p2p_connections and - // if the socket ID is not -1, the connection is still open. - // Send an EOF by closing the socket here. + // _fed.netchans_for_outbound_p2p_connections and + // if the network channel ID is not NULL, the connection is still open. + // Send an EOF by closing the network channel here. for (int i = 0; i < NUMBER_OF_FEDERATES; i++) { // Close outbound connections, in case they have not closed themselves. // This will result in EOF being sent to the remote federate, except for - // abnormal termination, in which case it will just close the socket. - close_outbound_socket(i); + // abnormal termination, in which case it will just close the network channel. + close_outbound_netchan(i); } - LF_PRINT_DEBUG("Waiting for inbound p2p socket listener threads."); - // Wait for each inbound socket listener thread to close. - if (_fed.number_of_inbound_p2p_connections > 0 && _fed.inbound_socket_listeners != NULL) { + LF_PRINT_DEBUG("Waiting for inbound p2p network channel listener threads."); + // Wait for each inbound network channel listener thread to close. + if (_fed.number_of_inbound_p2p_connections > 0 && _fed.inbound_netchan_listeners != NULL) { LF_PRINT_LOG("Waiting for %zu threads listening for incoming messages to exit.", _fed.number_of_inbound_p2p_connections); for (size_t i = 0; i < _fed.number_of_inbound_p2p_connections; i++) { // Ignoring errors here. - lf_thread_join(_fed.inbound_socket_listeners[i], NULL); + lf_thread_join(_fed.inbound_netchan_listeners[i], NULL); } } - LF_PRINT_DEBUG("Waiting for RTI's socket listener threads."); + LF_PRINT_DEBUG("Waiting for RTI's network channel listener threads."); // Wait for the thread listening for messages from the RTI to close. - lf_thread_join(_fed.RTI_socket_listener, NULL); + lf_thread_join(_fed.RTI_netchan_listener, NULL); // For abnormal termination, there is no need to free memory. if (_lf_normal_termination) { LF_PRINT_DEBUG("Freeing memory occupied by the federate."); - free(_fed.inbound_socket_listeners); + free(_fed.inbound_netchan_listeners); free(federation_metadata.rti_host); free(federation_metadata.rti_user); } @@ -1730,13 +1706,13 @@ void lf_connect_to_federate(uint16_t remote_federate_id) { // Trace the event when tracing is enabled tracepoint_federate_to_rti(send_ADR_QR, _lf_my_fed_id, NULL); - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, sizeof(uint16_t) + 1, buffer, &lf_outbound_socket_mutex, + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, sizeof(uint16_t) + 1, buffer, &lf_outbound_netchan_mutex, "Failed to send address query for federate %d to RTI.", remote_federate_id); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); // Read RTI's response. - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, sizeof(int32_t) + 1, buffer, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, sizeof(int32_t) + 1, buffer, NULL, "Failed to read the requested port number for federate %d from RTI.", remote_federate_id); @@ -1750,7 +1726,7 @@ void lf_connect_to_federate(uint16_t remote_federate_id) { } port = extract_int32(&buffer[1]); - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, sizeof(host_ip_addr), (unsigned char*)&host_ip_addr, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, sizeof(host_ip_addr), (unsigned char*)&host_ip_addr, NULL, "Failed to read the IP address for federate %d from RTI.", remote_federate_id); // A reply of -1 for the port means that the RTI does not know @@ -1771,17 +1747,25 @@ void lf_connect_to_federate(uint16_t remote_federate_id) { char hostname[INET_ADDRSTRLEN]; inet_ntop(AF_INET, &host_ip_addr, hostname, INET_ADDRSTRLEN); - int socket_id = create_real_time_tcp_socket_errexit(); - if (connect_to_socket(socket_id, (const char*)hostname, uport) < 0) { - lf_print_error_and_exit("Failed to connect() to RTI."); + + // Create a network channel. + netchan_t netchan = initialize_netchan(); + // Set the received host name and port to the network channel. + set_server_port(netchan, uport); + set_server_hostname(netchan, hostname); + // Create the client network channel. + create_client(netchan); + if (connect_to_netchan(netchan) < 0) { + lf_print_error_and_exit("Failed to connect to federate."); } + // Iterate until we either successfully connect or we exceed the CONNECT_TIMEOUT start_connect = lf_time_physical(); while (result < 0 && !_lf_termination_executed) { // Try again after some time if the connection failed. // Note that this should not really happen since the remote federate should be - // accepting socket connections. But possibly it will be busy (in process of accepting - // another socket connection?). Hence, we retry. + // accepting connections. But possibly it will be busy (in process of accepting + // another connection?). Hence, we retry. if (CHECK_TIMEOUT(start_connect, CONNECT_TIMEOUT)) { // If the remote federate is not accepting the connection after CONNECT_TIMEOUT // treat it as a soft error condition and return. @@ -1807,25 +1791,25 @@ void lf_connect_to_federate(uint16_t remote_federate_id) { // Trace the event when tracing is enabled tracepoint_federate_to_federate(send_FED_ID, _lf_my_fed_id, remote_federate_id, NULL); - // No need for a mutex because we have the only handle on the socket. - write_to_socket_fail_on_error(&socket_id, buffer_length, buffer, NULL, "Failed to send fed_id to federate %d.", + // No need for a mutex because we have the only handle on the network channel. + write_to_netchan_fail_on_error(netchan, buffer_length, buffer, NULL, "Failed to send fed_id to federate %d.", remote_federate_id); - write_to_socket_fail_on_error(&socket_id, federation_id_length, (unsigned char*)federation_metadata.federation_id, - NULL, "Failed to send federation id to federate %d.", remote_federate_id); + write_to_netchan_fail_on_error(netchan, federation_id_length, (unsigned char*)federation_metadata.federation_id, NULL, + "Failed to send federation id to federate %d.", remote_federate_id); - read_from_socket_fail_on_error(&socket_id, 1, (unsigned char*)buffer, NULL, + read_from_netchan_fail_on_error(netchan, 1, (unsigned char*)buffer, NULL, "Failed to read MSG_TYPE_ACK from federate %d in response to sending fed_id.", remote_federate_id); if (buffer[0] != MSG_TYPE_ACK) { // Get the error code. - read_from_socket_fail_on_error(&socket_id, 1, (unsigned char*)buffer, NULL, + read_from_netchan_fail_on_error(netchan, 1, (unsigned char*)buffer, NULL, "Failed to read error code from federate %d in response to sending fed_id.", remote_federate_id); lf_print_error("Received MSG_TYPE_REJECT message from remote federate (%d).", buffer[0]); result = -1; // Wait ADDRESS_QUERY_RETRY_INTERVAL nanoseconds. lf_sleep(ADDRESS_QUERY_RETRY_INTERVAL); - lf_print_warning("Could not connect to federate %d. Will try again every" PRINTF_TIME "nanoseconds.\n", + lf_print_warning("Could not connect to federate %d. Will try again every " PRINTF_TIME "nanoseconds.\n", remote_federate_id, ADDRESS_QUERY_RETRY_INTERVAL); continue; } else { @@ -1836,8 +1820,8 @@ void lf_connect_to_federate(uint16_t remote_federate_id) { } } // Once we set this variable, then all future calls to close() on this - // socket ID should reset it to -1 within a critical section. - _fed.sockets_for_outbound_p2p_connections[remote_federate_id] = socket_id; + // network channel should reset it to NULL within a critical section. + _fed.netchans_for_outbound_p2p_connections[remote_federate_id] = netchan; } void lf_connect_to_rti(const char* hostname, int port) { @@ -1847,10 +1831,16 @@ void lf_connect_to_rti(const char* hostname, int port) { hostname = federation_metadata.rti_host ? federation_metadata.rti_host : hostname; port = federation_metadata.rti_port >= 0 ? federation_metadata.rti_port : port; - // Create a socket - _fed.socket_TCP_RTI = create_real_time_tcp_socket_errexit(); - if (connect_to_socket(_fed.socket_TCP_RTI, hostname, port) < 0) { - lf_print_error_and_exit("Failed to connect() to RTI."); + // Create a network channel. + _fed.netchan_to_RTI = initialize_netchan(); + // Set the user specified host name and port to the network channel. + set_server_port(_fed.netchan_to_RTI, port); + set_server_hostname(_fed.netchan_to_RTI, hostname); + + // Create the client network channel. + create_client(_fed.netchan_to_RTI); + if (connect_to_netchan(_fed.netchan_to_RTI) < 0) { + lf_print_error_and_exit("Failed to connect to RTI."); } instant_t start_connect = lf_time_physical(); @@ -1890,13 +1880,13 @@ void lf_connect_to_rti(const char* hostname, int port) { // Trace the event when tracing is enabled tracepoint_federate_to_rti(send_FED_ID, _lf_my_fed_id, NULL); - // No need for a mutex here because no other threads are writing to this socket. - if (write_to_socket(_fed.socket_TCP_RTI, 2 + sizeof(uint16_t), buffer)) { + // No need for a mutex here because no other threads are writing to this network channel. + if (write_to_netchan(_fed.netchan_to_RTI, 2 + sizeof(uint16_t), buffer)) { continue; // Try again, possibly on a new port. } // Next send the federation ID itself. - if (write_to_socket(_fed.socket_TCP_RTI, federation_id_length, (unsigned char*)federation_metadata.federation_id)) { + if (write_to_netchan(_fed.netchan_to_RTI, federation_id_length, (unsigned char*)federation_metadata.federation_id)) { continue; // Try again. } @@ -1908,7 +1898,7 @@ void lf_connect_to_rti(const char* hostname, int port) { LF_PRINT_DEBUG("Waiting for response to federation ID from the RTI."); - if (read_from_socket(_fed.socket_TCP_RTI, 1, &response)) { + if (read_from_netchan(_fed.netchan_to_RTI, 1, &response)) { continue; // Try again. } if (response == MSG_TYPE_REJECT) { @@ -1916,7 +1906,7 @@ void lf_connect_to_rti(const char* hostname, int port) { tracepoint_federate_from_rti(receive_REJECT, _lf_my_fed_id, NULL); // Read one more byte to determine the cause of rejection. unsigned char cause; - read_from_socket_fail_on_error(&_fed.socket_TCP_RTI, 1, &cause, NULL, + read_from_netchan_fail_on_error(_fed.netchan_to_RTI, 1, &cause, NULL, "Failed to read the cause of rejection by the RTI."); if (cause == FEDERATION_ID_DOES_NOT_MATCH || cause == WRONG_SERVER) { lf_print_warning("Connected to the wrong RTI. Will try again"); @@ -1940,7 +1930,7 @@ void lf_connect_to_rti(const char* hostname, int port) { // about connections between this federate and other federates // where messages are routed through the RTI. // @see MSG_TYPE_NEIGHBOR_STRUCTURE in net_common.h - lf_send_neighbor_structure_to_RTI(_fed.socket_TCP_RTI); + lf_send_neighbor_structure_to_RTI(_fed.netchan_to_RTI); uint16_t udp_port = setup_clock_synchronization_with_rti(); @@ -1948,34 +1938,39 @@ void lf_connect_to_rti(const char* hostname, int port) { unsigned char UDP_port_number[1 + sizeof(uint16_t)]; UDP_port_number[0] = MSG_TYPE_UDP_PORT; encode_uint16(udp_port, &(UDP_port_number[1])); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, 1 + sizeof(uint16_t), UDP_port_number, NULL, + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, 1 + sizeof(uint16_t), UDP_port_number, NULL, "Failed to send the UDP port number to the RTI."); } void lf_create_server(int specified_port) { assert(specified_port <= UINT16_MAX && specified_port >= 0); - uint16_t final_port; - if (create_server(specified_port, &_fed.server_socket, &final_port, TCP, false)) { - lf_print_error_system_failure("RTI failed to create TCP server: %s.", strerror(errno)); + + netchan_t* server_netchan = initialize_netchan(); + set_my_port(server_netchan, specified_port); + + if (create_server(server_netchan, false)) { + lf_print_error_system_failure("RTI failed to create server: %s.", strerror(errno)); }; + _fed.server_netchan = server_netchan; + // Get the final server port to send to the RTI on an MSG_TYPE_ADDRESS_ADVERTISEMENT message. + int32_t server_port = get_my_port(server_netchan); - LF_PRINT_LOG("Server for communicating with other federates started using port %u.", final_port); - _fed.server_port = final_port; + LF_PRINT_LOG("Server for communicating with other federates started using port %d.", server_port); // Send the server port number to the RTI // on an MSG_TYPE_ADDRESS_ADVERTISEMENT message (@see net_common.h). unsigned char buffer[sizeof(int32_t) + 1]; buffer[0] = MSG_TYPE_ADDRESS_ADVERTISEMENT; - encode_int32(_fed.server_port, &(buffer[1])); + encode_int32(server_port, &(buffer[1])); // Trace the event when tracing is enabled tracepoint_federate_to_rti(send_ADR_AD, _lf_my_fed_id, NULL); - // No need for a mutex because we have the only handle on this socket. - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, sizeof(int32_t) + 1, (unsigned char*)buffer, NULL, + // No need for a mutex because we have the only handle on this network driver. + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, sizeof(int32_t) + 1, (unsigned char*)buffer, NULL, "Failed to send address advertisement."); - LF_PRINT_DEBUG("Sent port %d to the RTI.", _fed.server_port); + LF_PRINT_DEBUG("Sent port %d to the RTI.", server_port); } void lf_enqueue_port_absent_reactions(environment_t* env) { @@ -2006,21 +2001,21 @@ void* lf_handle_p2p_connections_from_federates(void* env_arg) { LF_ASSERT_NON_NULL(env_arg); size_t received_federates = 0; // Allocate memory to store thread IDs. - _fed.inbound_socket_listeners = (lf_thread_t*)calloc(_fed.number_of_inbound_p2p_connections, sizeof(lf_thread_t)); + _fed.inbound_netchan_listeners = (lf_thread_t*)calloc(_fed.number_of_inbound_p2p_connections, sizeof(lf_thread_t)); while (received_federates < _fed.number_of_inbound_p2p_connections && !_lf_termination_executed) { // Wait for an incoming connection request. - int socket_id = accept_socket(_fed.server_socket, _fed.socket_TCP_RTI); - if (socket_id < 0) { - lf_print_warning("Federate failed to accept the socket."); + netchan_t netchan = accept_netchan(_fed.server_netchan, _fed.netchan_to_RTI); + if (netchan == NULL) { + lf_print_warning("Federate failed to accept the network channel."); return NULL; } LF_PRINT_LOG("Accepted new connection from remote federate."); size_t header_length = 1 + sizeof(uint16_t) + 1; unsigned char buffer[header_length]; - int read_failed = read_from_socket(socket_id, header_length, (unsigned char*)&buffer); + int read_failed = read_from_netchan(netchan, header_length, (unsigned char*)&buffer); if (read_failed || buffer[0] != MSG_TYPE_P2P_SENDING_FED_ID) { - lf_print_warning("Federate received invalid first message on P2P socket. Closing socket."); + lf_print_warning("Federate received invalid first message on P2P network channel. Closing network channel."); if (read_failed == 0) { // Wrong message received. unsigned char response[2]; @@ -2029,19 +2024,19 @@ void* lf_handle_p2p_connections_from_federates(void* env_arg) { // Trace the event when tracing is enabled tracepoint_federate_to_federate(send_REJECT, _lf_my_fed_id, -3, NULL); // Ignore errors on this response. - write_to_socket(socket_id, 2, response); + write_to_netchan(netchan, 2, response); } - shutdown_socket(&socket_id, false); + shutdown_netchan(netchan, false); continue; } // Get the federation ID and check it. unsigned char federation_id_length = buffer[header_length - 1]; char remote_federation_id[federation_id_length]; - read_failed = read_from_socket(socket_id, federation_id_length, (unsigned char*)remote_federation_id); + read_failed = read_from_netchan(netchan, federation_id_length, (unsigned char*)remote_federation_id); if (read_failed || (strncmp(federation_metadata.federation_id, remote_federation_id, strnlen(federation_metadata.federation_id, 255)) != 0)) { - lf_print_warning("Received invalid federation ID. Closing socket."); + lf_print_warning("Received invalid federation ID. Closing network channel."); if (read_failed == 0) { unsigned char response[2]; response[0] = MSG_TYPE_REJECT; @@ -2049,9 +2044,9 @@ void* lf_handle_p2p_connections_from_federates(void* env_arg) { // Trace the event when tracing is enabled tracepoint_federate_to_federate(send_REJECT, _lf_my_fed_id, -3, NULL); // Ignore errors on this response. - write_to_socket(socket_id, 2, response); + write_to_netchan(netchan, 2, response); } - shutdown_socket(&socket_id, false); + shutdown_netchan(netchan, false); continue; } @@ -2062,12 +2057,12 @@ void* lf_handle_p2p_connections_from_federates(void* env_arg) { // Trace the event when tracing is enabled tracepoint_federate_to_federate(receive_FED_ID, _lf_my_fed_id, remote_fed_id, NULL); - // Once we record the socket_id here, all future calls to close() on - // the socket should be done while holding the socket_mutex, and this array - // element should be reset to -1 during that critical section. + // Once we record the network channel here, all future calls to close() on + // the network channel should be done while holding the netchan_mutex, and this array + // element should be reset to NULL during that critical section. // Otherwise, there can be race condition where, during termination, - // two threads attempt to simultaneously close the socket. - _fed.sockets_for_inbound_p2p_connections[remote_fed_id] = socket_id; + // two threads attempt to simultaneously close the network channel. + _fed.netchans_for_inbound_p2p_connections[remote_fed_id] = netchan; // Send an MSG_TYPE_ACK message. unsigned char response = MSG_TYPE_ACK; @@ -2075,21 +2070,21 @@ void* lf_handle_p2p_connections_from_federates(void* env_arg) { // Trace the event when tracing is enabled tracepoint_federate_to_federate(send_ACK, _lf_my_fed_id, remote_fed_id, NULL); - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - write_to_socket_fail_on_error(&_fed.sockets_for_inbound_p2p_connections[remote_fed_id], 1, - (unsigned char*)&response, &lf_outbound_socket_mutex, - "Failed to write MSG_TYPE_ACK in response to federate %d.", remote_fed_id); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + write_to_netchan_fail_on_error(_fed.netchans_for_inbound_p2p_connections[remote_fed_id], 1, (unsigned char*)&response, + &lf_outbound_netchan_mutex, "Failed to write MSG_TYPE_ACK in response to federate %d.", + remote_fed_id); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); // Start a thread to listen for incoming messages from other federates. // The fed_id is a uint16_t, which we assume can be safely cast to and from void*. void* fed_id_arg = (void*)(uintptr_t)remote_fed_id; - int result = lf_thread_create(&_fed.inbound_socket_listeners[received_federates], listen_to_federates, fed_id_arg); + int result = lf_thread_create(&_fed.inbound_netchan_listeners[received_federates], listen_to_federates, fed_id_arg); if (result != 0) { // Failed to create a listening thread. - if (_fed.sockets_for_inbound_p2p_connections[remote_fed_id] != -1) { - shutdown_socket(&socket_id, false); - _fed.sockets_for_inbound_p2p_connections[remote_fed_id] = -1; + if (_fed.netchans_for_inbound_p2p_connections[remote_fed_id] != NULL) { + shutdown_netchan(_fed.netchans_for_inbound_p2p_connections[remote_fed_id], false); + _fed.netchans_for_inbound_p2p_connections[remote_fed_id] = NULL; } lf_print_error_and_exit("Failed to create a thread to listen for incoming physical connection. Error code: %d.", result); @@ -2195,23 +2190,23 @@ int lf_send_message(int message_type, unsigned short port, unsigned short federa const int header_length = 1 + sizeof(uint16_t) + sizeof(uint16_t) + sizeof(uint32_t); // Use a mutex lock to prevent multiple threads from simultaneously sending. - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); - int* socket = &_fed.sockets_for_outbound_p2p_connections[federate]; + netchan_t netchan = _fed.netchans_for_outbound_p2p_connections[federate]; // Trace the event when tracing is enabled tracepoint_federate_to_federate(send_P2P_MSG, _lf_my_fed_id, federate, NULL); - int result = write_to_socket_close_on_error(socket, header_length, header_buffer); + int result = write_to_netchan_close_on_error(netchan, header_length, header_buffer); if (result == 0) { // Header sent successfully. Send the body. - result = write_to_socket_close_on_error(socket, length, message); + result = write_to_netchan_close_on_error(netchan, length, message); } if (result != 0) { // Message did not send. Since this is used for physical connections, this is not critical. lf_print_warning("Failed to send message to %s. Dropping the message.", next_destination_str); } - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return result; } @@ -2397,25 +2392,25 @@ void lf_send_port_absent_to_federate(environment_t* env, interval_t additional_d #ifdef FEDERATED_CENTRALIZED // Send the absent message through the RTI - int* socket = &_fed.socket_TCP_RTI; + netchan_t netchan = _fed.netchan_to_RTI; #else // Send the absent message directly to the federate - int* socket = &_fed.sockets_for_outbound_p2p_connections[fed_ID]; + netchan_t netchan = _fed.netchans_for_outbound_p2p_connections[fed_ID]; #endif - if (socket == &_fed.socket_TCP_RTI) { + if (netchan == _fed.netchan_to_RTI) { tracepoint_federate_to_rti(send_PORT_ABS, _lf_my_fed_id, ¤t_message_intended_tag); } else { tracepoint_federate_to_federate(send_PORT_ABS, _lf_my_fed_id, fed_ID, ¤t_message_intended_tag); } - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); - int result = write_to_socket_close_on_error(socket, message_length, buffer); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); + int result = write_to_netchan_close_on_error(netchan, message_length, buffer); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); if (result != 0) { // Write failed. Response depends on whether coordination is centralized. - if (socket == &_fed.socket_TCP_RTI) { + if (netchan == _fed.netchan_to_RTI) { // Centralized coordination. This is a critical error. lf_print_error_system_failure("Failed to send port absent message for port %hu to federate %hu.", port_ID, fed_ID); @@ -2434,29 +2429,29 @@ int lf_send_stop_request_to_rti(tag_t stop_tag) { stop_tag.microstep++; ENCODE_STOP_REQUEST(buffer, stop_tag.time, stop_tag.microstep); - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); // Do not send a stop request if a stop request has been previously received from the RTI. if (!_fed.received_stop_request_from_rti) { LF_PRINT_LOG("Sending to RTI a MSG_TYPE_STOP_REQUEST message with tag " PRINTF_TAG ".", stop_tag.time - start_time, stop_tag.microstep); - if (_fed.socket_TCP_RTI < 0) { - lf_print_warning("Socket is no longer connected. Dropping message."); - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + if (_fed.netchan_to_RTI == NULL) { + lf_print_warning("RTI is no longer connected. Dropping message."); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return -1; } // Trace the event when tracing is enabled tracepoint_federate_to_rti(send_STOP_REQ, _lf_my_fed_id, &stop_tag); - write_to_socket_fail_on_error(&_fed.socket_TCP_RTI, MSG_TYPE_STOP_REQUEST_LENGTH, buffer, &lf_outbound_socket_mutex, + write_to_netchan_fail_on_error(_fed.netchan_to_RTI, MSG_TYPE_STOP_REQUEST_LENGTH, buffer, &lf_outbound_netchan_mutex, "Failed to send stop time " PRINTF_TIME " to the RTI.", stop_tag.time - start_time); // Treat this sending as equivalent to having received a stop request from the RTI. _fed.received_stop_request_from_rti = true; - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return 0; } else { - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return 1; } } @@ -2509,14 +2504,14 @@ int lf_send_tagged_message(environment_t* env, interval_t additional_delay, int current_message_intended_tag.microstep, next_destination_str); // Use a mutex lock to prevent multiple threads from simultaneously sending. - LF_MUTEX_LOCK(&lf_outbound_socket_mutex); + LF_MUTEX_LOCK(&lf_outbound_netchan_mutex); - int* socket; + netchan_t netchan; if (message_type == MSG_TYPE_P2P_TAGGED_MESSAGE) { - socket = &_fed.sockets_for_outbound_p2p_connections[federate]; + netchan = _fed.netchans_for_outbound_p2p_connections[federate]; tracepoint_federate_to_federate(send_P2P_TAGGED_MSG, _lf_my_fed_id, federate, ¤t_message_intended_tag); } else { - socket = &_fed.socket_TCP_RTI; + netchan = _fed.netchan_to_RTI; tracepoint_federate_to_rti(send_TAGGED_MSG, _lf_my_fed_id, ¤t_message_intended_tag); } @@ -2524,10 +2519,10 @@ int lf_send_tagged_message(environment_t* env, interval_t additional_delay, int _fed.last_DNET = current_message_intended_tag; } - int result = write_to_socket_close_on_error(socket, header_length, header_buffer); + int result = write_to_netchan_close_on_error(netchan, header_length, header_buffer); if (result == 0) { // Header sent successfully. Send the body. - result = write_to_socket_close_on_error(socket, length, message); + result = write_to_netchan_close_on_error(netchan, length, message); } if (result != 0) { // Message did not send. Handling depends on message type. @@ -2538,7 +2533,7 @@ int lf_send_tagged_message(environment_t* env, interval_t additional_delay, int next_destination_str, errno, strerror(errno)); } } - LF_MUTEX_UNLOCK(&lf_outbound_socket_mutex); + LF_MUTEX_UNLOCK(&lf_outbound_netchan_mutex); return result; } @@ -2572,11 +2567,11 @@ void lf_synchronize_with_other_federates(void) { start_time = get_start_time_from_rti(lf_time_physical()); lf_tracing_set_start_time(start_time); - // Start a thread to listen for incoming TCP messages from the RTI. + // Start a thread to listen for incoming messages from the RTI. // @note Up until this point, the federate has been listening for messages // from the RTI in a sequential manner in the main thread. From now on, a // separate thread is created to allow for asynchronous communication. - lf_thread_create(&_fed.RTI_socket_listener, listen_to_rti_TCP, NULL); + lf_thread_create(&_fed.RTI_netchan_listener, listen_to_rti_netchan, NULL); lf_thread_t thread_id; if (create_clock_sync_thread(&thread_id)) { lf_print_warning("Failed to create thread to handle clock synchronization."); diff --git a/core/federated/network/CMakeLists.txt b/core/federated/network/CMakeLists.txt deleted file mode 100644 index f61d69897..000000000 --- a/core/federated/network/CMakeLists.txt +++ /dev/null @@ -1,4 +0,0 @@ -set(LF_NETWORK_FILES net_util.c socket_common.c) - -list(TRANSFORM LF_NETWORK_FILES PREPEND federated/network/) -list(APPEND REACTORC_SOURCES ${LF_NETWORK_FILES}) diff --git a/include/core/federated/clock-sync.h b/include/core/federated/clock-sync.h index b003a3150..0afddf0d9 100644 --- a/include/core/federated/clock-sync.h +++ b/include/core/federated/clock-sync.h @@ -34,6 +34,7 @@ THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #define CLOCK_SYNC_H #include "low_level_platform.h" +#include "net_driver.h" // Clock synchronization defaults to performing clock synchronization only at initialization. #define LF_CLOCK_SYNC_OFF 1 @@ -157,15 +158,15 @@ uint16_t setup_clock_synchronization_with_rti(void); * is required. * * This is a blocking function that expects - * to read a MSG_TYPE_CLOCK_SYNC_T1 from the RTI TCP socket. + * to read a MSG_TYPE_CLOCK_SYNC_T1 from the RTI network channel. * It will then follow the PTP protocol to synchronize the local * physical clock with the RTI. * Failing to complete this protocol is treated as a catastrophic * error that causes the federate to exit. * - * @param rti_socket_TCP Pointer to the RTI's socket + * @param rti_netchan Pointer to the RTI's network channel. */ -void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP); +void synchronize_initial_physical_clock_with_rti(netchan_t rti_netchan); /** * Handle a clock synchroninzation message T1 coming from the RTI. @@ -174,29 +175,31 @@ void synchronize_initial_physical_clock_with_rti(int* rti_socket_TCP); * It also measures the time it takes between when the method is * called and the reply has been sent. * @param buffer The buffer containing the message, including the message type. - * @param socket The socket (either _lf_rti_socket_TCP or _lf_rti_socket_UDP). + * @param netchan_t The pointer to the network channel. * @param t2 The physical time at which the T1 message was received. + * @param use_UDP Boolean to use UDP or the network channel. * @return 0 if T3 reply is successfully sent, -1 otherwise. */ -int handle_T1_clock_sync_message(unsigned char* buffer, int socket, instant_t t2); +int handle_T1_clock_sync_message(unsigned char* buffer, void* socket_or_netchan, instant_t t2, bool use_udp); /** * Handle a clock synchronization message T4 coming from the RTI. - * If the socket is _lf_rti_socket_TCP, then assume we are in the + * If the socket_or_netchan is a network channel, then assume we are in the * initial clock synchronization phase and set the clock offset * based on the estimated clock synchronization error. - * Otherwise, if the socket is _lf_rti_socket_UDP, then this looks also for a + * Otherwise, if the socket_or_netchan is UDP socket, then this looks also for a * subsequent "coded probe" message on the socket. If the delay between * the T4 and the coded probe message is not as expected, then reject * this clock synchronization round. If it is not rejected, then make * an adjustment to the clock offset based on the estimated error. - * This function does not acquire the socket_mutex lock. + * This function does not acquire the netchan_mutex lock. * The caller should acquire it unless it is sure there is only one thread running. * @param buffer The buffer containing the message, including the message type. - * @param socket The socket (either _lf_rti_socket_TCP or _lf_rti_socket_UDP). - * @param r4 The physical time at which this T4 message was received. + * @param netchan_t The pointer to the network channel. + * @param r4 The physical time at which this T4 message was received.\ + * @param use_UDP Boolean to use UDP or the network channel. */ -void handle_T4_clock_sync_message(unsigned char* buffer, int socket, instant_t r4); +void handle_T4_clock_sync_message(unsigned char* buffer, void* socket_or_netchan, instant_t r4, bool use_udp); /** * Thread that listens for UDP inputs from the RTI. diff --git a/include/core/federated/federate.h b/include/core/federated/federate.h index af46d7ec7..a4b67433e 100644 --- a/include/core/federated/federate.h +++ b/include/core/federated/federate.h @@ -18,6 +18,7 @@ #include "lf_types.h" #include "environment.h" #include "low_level_platform.h" +#include "net_driver.h" #ifndef ADVANCE_MESSAGE_INTERVAL #define ADVANCE_MESSAGE_INTERVAL MSEC(10) @@ -31,16 +32,16 @@ */ typedef struct federate_instance_t { /** - * The TCP socket descriptor for this federate to communicate with the RTI. + * The network channel for this federate to communicate with the RTI. * This is set by lf_connect_to_rti(), which must be called before other * functions that communicate with the rti are called. */ - int socket_TCP_RTI; + netchan_t netchan_to_RTI; /** - * Thread listening for incoming TCP messages from the RTI. + * Thread listening for incoming messages from the RTI. */ - lf_thread_t RTI_socket_listener; + lf_thread_t RTI_netchan_listener; /** * Number of inbound physical connections to the federate. @@ -54,7 +55,7 @@ typedef struct federate_instance_t { * This is NULL if there are none and otherwise has size given by * number_of_inbound_p2p_connections. */ - lf_thread_t* inbound_socket_listeners; + lf_thread_t* inbound_netchan_listeners; /** * Number of outbound peer-to-peer connections from the federate. @@ -64,57 +65,50 @@ typedef struct federate_instance_t { size_t number_of_outbound_p2p_connections; /** - * An array that holds the socket descriptors for inbound + * An array that holds the network channels for inbound * connections from each federate. The index will be the federate * ID of the remote sending federate. This is initialized at startup - * to -1 and is set to a socket ID by lf_handle_p2p_connections_from_federates() - * when the socket is opened. + * to NULL and is set to the pointer of the network channel by lf_connect_to_federate() + * when the network channels is opened. * - * @note There will not be an inbound socket unless a physical connection + * @note There will not be an inbound network channel unless a physical connection * or a p2p logical connection (by setting the coordination target property * to "distributed") is specified in the Lingua Franca program where this * federate is the destination. Multiple incoming p2p connections from the - * same remote federate will use the same socket. + * same remote federate will use the same network channel. */ - int sockets_for_inbound_p2p_connections[NUMBER_OF_FEDERATES]; + netchan_t netchans_for_inbound_p2p_connections[NUMBER_OF_FEDERATES]; /** - * An array that holds the socket descriptors for outbound direct + * An array that holds the network channels for outbound direct * connections to each remote federate. The index will be the federate * ID of the remote receiving federate. This is initialized at startup - * to -1 and is set to a socket ID by lf_connect_to_federate() - * when the socket is opened. + * to NULL and is set to the pointer of the network channel by lf_connect_to_federate() + * when the network channels is opened. * - * @note This federate will not open an outbound socket unless a physical + * @note This federate will not open an outbound network channels unless a physical * connection or a p2p logical connection (by setting the coordination target * property to "distributed") is specified in the Lingua Franca * program where this federate acts as the source. Multiple outgoing p2p - * connections to the same remote federate will use the same socket. + * connections to the same remote federate will use the same network channels. */ - int sockets_for_outbound_p2p_connections[NUMBER_OF_FEDERATES]; + netchan_t netchans_for_outbound_p2p_connections[NUMBER_OF_FEDERATES]; /** - * Thread ID for a thread that accepts sockets and then supervises - * listening to those sockets for incoming P2P (physical) connections. + * Thread ID for a thread that accepts network channels and then supervises + * listening to those network channels for incoming P2P (physical) connections. */ lf_thread_t inbound_p2p_handling_thread_id; /** - * A socket descriptor for the socket server of the federate. + * A network channel for the server of the federate. * This is assigned in lf_create_server(). - * This socket is used to listen to incoming physical connections from + * This network channel is used to listen to incoming physical connections from * remote federates. Once an incoming connection is accepted, the - * opened socket will be stored in - * federate_sockets_for_inbound_p2p_connections. + * opened network channel will be stored in + * federate_netchans_for_inbound_p2p_connections. */ - int server_socket; - - /** - * The port used for the server socket to listen for messages from other federates. - * The federate informs the RTI of this port once it has created its socket server by - * sending an ADDRESS_AD message (@see rti.h). - */ - int server_port; + netchan_t server_netchan; /** * Most recent tag advance grant (TAG) received from the RTI, or NEVER if none @@ -221,9 +215,9 @@ typedef enum parse_rti_code_t { SUCCESS, INVALID_PORT, INVALID_HOST, INVALID_USE // Global variables /** - * Mutex lock held while performing outbound socket write and close operations. + * Mutex lock held while performing outbound network channel write and close operations. */ -extern lf_mutex_t lf_outbound_socket_mutex; +extern lf_mutex_t lf_outbound_netchan_mutex; /** * Condition variable for blocking on unkonwn federate input ports. @@ -240,10 +234,10 @@ extern lf_cond_t lf_port_status_changed; * to send messages directly to the specified federate. * This function first sends an MSG_TYPE_ADDRESS_QUERY message to the RTI to obtain * the IP address and port number of the specified federate. It then attempts - * to establish a socket connection to the specified federate. + * to establish a network channel connection to the specified federate. * If this fails, the program exits. If it succeeds, it sets element [id] of - * the _fed.sockets_for_outbound_p2p_connections global array to - * refer to the socket for communicating directly with the federate. + * the _fed.netchans_for_outbound_p2p_connections global array to + * refer to the network channel for communicating directly with the federate. * @param remote_federate_id The ID of the remote federate. */ void lf_connect_to_federate(uint16_t); @@ -251,12 +245,12 @@ void lf_connect_to_federate(uint16_t); /** * @brief Connect to the RTI at the specified host and port. * - * This will return the socket descriptor for the connection. + * This will return the network channel for the connection. * If port_number is 0, then start at DEFAULT_PORT and increment * the port number on each attempt. If an attempt fails, wait CONNECT_RETRY_INTERVAL * and try again. If it fails after CONNECT_TIMEOUT, the program exits. - * If it succeeds, it sets the _fed.socket_TCP_RTI global variable to refer to - * the socket for communicating with the RTI. + * If it succeeds, it sets the _fed.netchan_to_RTI global variable to refer to + * the network channel for communicating with the RTI. * @param hostname A hostname, such as "localhost". * @param port_number A port number or 0 to start with the default. */ @@ -266,8 +260,8 @@ void lf_connect_to_rti(const char* hostname, int port_number); * @brief Create a server to listen to incoming P2P connections. * * Such connections are used for physical connections or any connection if using - * decentralized coordination. This function only handles the creation of the server socket. - * The bound port for the server socket is then sent to the RTI by sending an + * decentralized coordination. This function only handles the creation of the server network channel. + * The bound port for the server network channel is then sent to the RTI by sending an * MSG_TYPE_ADDRESS_ADVERTISEMENT message (@see net_common.h). * This function expects no response from the RTI. * @@ -294,8 +288,8 @@ void lf_enqueue_port_absent_reactions(environment_t* env); * * This thread accepts connections from federates that send messages directly * to this one (not through the RTI). This thread starts a thread for - * each accepted socket connection to read messages and, once it has opened all expected - * sockets, exits. + * each accepted network channel connection to read messages and, once it has opened all expected + * network channels, exits. * @param ignored No argument needed for this thread. */ void* lf_handle_p2p_connections_from_federates(void*); @@ -334,10 +328,10 @@ void lf_reset_status_fields_on_input_port_triggers(); * @brief Send a message to another federate. * * This function is used for physical connections - * between federates. If the socket connection to the remote federate or the RTI has been broken, + * between federates. If the connection to the remote federate or the RTI has been broken, * then this returns -1 without sending. Otherwise, it returns 0. * - * This method assumes that the caller does not hold the lf_outbound_socket_mutex lock, + * This method assumes that the caller does not hold the lf_outbound_netchan_mutex lock, * which it acquires to perform the send. * * @param message_type The type of the message being sent (currently only MSG_TYPE_P2P_MESSAGE). @@ -360,7 +354,7 @@ int lf_send_message(int message_type, unsigned short port, unsigned short federa * information is needed for the RTI to perform the centralized coordination. * @see MSG_TYPE_NEIGHBOR_STRUCTURE in net_common.h */ -void lf_send_neighbor_structure_to_RTI(int); +void lf_send_neighbor_structure_to_RTI(netchan_t); /** * @brief Send a next event tag (NET) signal. @@ -439,7 +433,7 @@ void lf_send_port_absent_to_federate(environment_t* env, interval_t additional_d * * The payload is the specified tag plus one microstep. If this federate has previously * received a stop request from the RTI, then do not send the message and - * return 1. Return -1 if the socket is disconnected. Otherwise, return 0. + * return 1. Return -1 if the network channel is disconnected. Otherwise, return 0. * @return 0 if the message is sent. */ int lf_send_stop_request_to_rti(tag_t stop_tag); @@ -451,7 +445,7 @@ int lf_send_stop_request_to_rti(tag_t stop_tag); * If the delayed tag falls after the timeout time, then the message is not sent and -1 is returned. * The caller can reuse or free the memory storing the message after this returns. * - * If the message fails to send (e.g. the socket connection is broken), then the + * If the message fails to send (e.g. the network channel connection is broken), then the * response depends on the message_type. For MSG_TYPE_TAGGED_MESSAGE, the message is * supposed to go via the RTI, and failure to communicate with the RTI is a critical failure. * In this case, the program will exit with an error message. If the message type is @@ -460,7 +454,7 @@ int lf_send_stop_request_to_rti(tag_t stop_tag); * to believe that there were no messages forthcoming. In this case, on failure to send * the message, this function returns -11. * - * This method assumes that the caller does not hold the lf_outbound_socket_mutex lock, + * This method assumes that the caller does not hold the lf_outbound_netchan_mutex lock, * which it acquires to perform the send. * * @param env The environment from which to get the current tag. @@ -516,7 +510,7 @@ void lf_stall_advance_level_federation_locked(size_t level); * @brief Synchronize the start with other federates via the RTI. * * This assumes that a connection to the RTI is already made - * and _lf_rti_socket_TCP is valid. It then sends the current logical + * and netchan_to_RTI is valid. It then sends the current logical * time to the RTI and waits for the RTI to respond with a specified * time. It starts a thread to listen for messages from the RTI. */ diff --git a/lingua-franca-ref.txt b/lingua-franca-ref.txt index 316fcb7f9..b756b406f 100644 --- a/lingua-franca-ref.txt +++ b/lingua-franca-ref.txt @@ -1 +1 @@ -shutdown \ No newline at end of file +networkdriver diff --git a/network/api/CMakeLists.txt b/network/api/CMakeLists.txt new file mode 100644 index 000000000..08aaf8105 --- /dev/null +++ b/network/api/CMakeLists.txt @@ -0,0 +1,11 @@ +add_library(lf-network-api INTERFACE) +target_include_directories(lf-network-api INTERFACE ${CMAKE_CURRENT_LIST_DIR}) +add_library(lf::network-api ALIAS lf-network-api) + +#Link necessary libraries. +target_link_libraries(lf-network-api INTERFACE lf::tag-api) +target_link_libraries(lf-network-api INTERFACE lf::low-level-platform-api) + +target_include_directories(lf-network-api INTERFACE ${CMAKE_CURRENT_LIST_DIR}/../../include/core/utils) + +target_compile_definitions(lf-network-api INTERFACE COMM_TYPE_${COMM_TYPE}) diff --git a/include/core/federated/network/net_common.h b/network/api/net_common.h similarity index 100% rename from include/core/federated/network/net_common.h rename to network/api/net_common.h diff --git a/network/api/net_driver.h b/network/api/net_driver.h new file mode 100644 index 000000000..dd6e86f7d --- /dev/null +++ b/network/api/net_driver.h @@ -0,0 +1,218 @@ +#ifndef NET_DRIVER_H +#define NET_DRIVER_H + +#include "socket_common.h" + +typedef void* netchan_t; + +/** + * Allocate memory for the network channel. + * @return netchan_t Initialized network channel. + */ +netchan_t initialize_netchan(); + +/** + * Create a netchannel server. This is such as a server socket which accepts connections. + * However this is only the creation of the server network channel. + * + * @param chan Server's network channel. + * @param serv_type Type of server, RTI or FED. + * @return int 0 for success, -1 for failure. + */ +int create_server(netchan_t chan, bool increment_port_on_retry); + +/** + * Wait for an incoming connection request on the specified server network channel. + * The implementation should include three steps. + * 1. Initialize the network channel of the connected federate. + * 2. Wait for the incoming connection request. This should block until the connection is successfully accepted. + * 3. Save the information in the connected network channel, such as the address of the connected peer, for future + * querying address. + * + * @param server_chan The server network channel that is listening for incoming connections. + * @param rti_chan The rti's network channel to check if it is still open. + * @return netchan_t The network channel for the newly accepted connection on success, or NULL on failure + */ +netchan_t accept_netchan(netchan_t server_chan, netchan_t rti_chan); + +/** + * Using the initialized network channel, create a client network channel ready to connect to a server. + * + * @param chan The initialized network channel. + */ +void create_client(netchan_t chan); + +/** + * Connect to the server network channel. The server's connection information, + * such as the port and address should be set before calling this function. + * + * @param chan network channel to connect. + * @return int 0 on success, -1 on failure, and `errno` is set to indicate the specific error. + */ +int connect_to_netchan(netchan_t chan); + +/** + * Read the specified number of bytes from the specified network channel into the specified buffer. + * If an error occurs during this reading, return -1 and set errno to indicate + * the cause of the error. If the read succeeds in reading the specified number of bytes, + * return 0. If an EOF occurs before reading the specified number of bytes, return 1. + * @param chan The network channel. + * @param num_bytes The number of bytes to read. + * @param buffer The buffer into which to put the bytes. + * @return 0 for success, 1 for EOF, and -1 for an error. + */ +int read_from_netchan(netchan_t chan, size_t num_bytes, unsigned char* buffer); + +/** + * Read the specified number of bytes to the specified network channel using read_from_netchan + * and close the network channel if an error occurs. + * @param chan The network channel. + * @param num_bytes The number of bytes to write. + * @param buffer The buffer from which to get the bytes. + * @return 0 for success, -1 for failure. + */ +int read_from_netchan_close_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer); + +/** + * Read the specified number of bytes from the specified network channel into the + * specified buffer. If a disconnect or an EOF occurs during this + * reading, then if format is non-null, report an error and exit. + * If the mutex argument is non-NULL, release the mutex before exiting. + * If format is null, then report the error, but do not exit. + * This function takes a formatted string and additional optional arguments + * similar to printf(format, ...) that is appended to the error messages. + * @param chan The network channel. + * @param num_bytes The number of bytes to read. + * @param buffer The buffer into which to put the bytes. + * @param format A printf-style format string, followed by arguments to + * fill the string, or NULL to not exit with an error message. + * @return The number of bytes read, or 0 if an EOF is received, or + * a negative number for an error. + */ +void read_from_netchan_fail_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, + char* format, ...); + +/** + * Write the specified number of bytes to the specified network channel from the + * specified buffer. If an error occurs, return -1 and set errno to indicate + * the cause of the error. If the write succeeds, return 0. + * This function repeats the attempt until the specified number of bytes + * have been written or an error occurs. + * @param chan The network channel. + * @param num_bytes The number of bytes to write. + * @param buffer The buffer from which to get the bytes. + * @return 0 for success, -1 for failure. + */ +int write_to_netchan(netchan_t chan, size_t num_bytes, unsigned char* buffer); + +/** + * Write the specified number of bytes to the specified network channel using write_to_netchan + * and close the network channel if an error occurs. + * @param chan The network channel. + * @param num_bytes The number of bytes to write. + * @param buffer The buffer from which to get the bytes. + * @return 0 for success, -1 for failure. + */ +int write_to_netchan_close_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer); + +/** + * Write the specified number of bytes to the specified network channel using + * write_to_netchan_close_on_error and exit with an error code if an error occurs. + * If the mutex argument is non-NULL, release the mutex before exiting. If the + * format argument is non-null, then use it an any additional arguments to form + * the error message using printf conventions. Otherwise, print a generic error + * message. + * @param chan The network channel. + * @param num_bytes The number of bytes to write. + * @param buffer The buffer from which to get the bytes. + * @param mutex If non-NULL, the mutex to unlock before exiting. + * @param format A format string for error messages, followed by any number of + * fields that will be used to fill the format string as in printf, or NULL + * to print a generic error message. + */ +void write_to_netchan_fail_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, + char* format, ...); + +/** + * Checks if the network channel is still connected to the peer. + * + * @param chan The network channel. + * @return true if closed, false if still open. + */ +bool check_netchan_closed(netchan_t chan); + +/** + * @brief Gracefully shuts down and closes the network channel, optionally reading until EOF. + * Shutdown and close the network channel. If read_before_closing is false, it just immediately calls shutdown() with + * SHUT_RDWR and close(). If read_before_closing is true, it calls shutdown with SHUT_WR, only disallowing further + * writing. Then, it calls read() until EOF is received, and discards all received bytes. + * @param chan The network channel to shutdown and close. + * @param read_before_closing If true, read until EOF before closing the network channel. + * @return int Returns 0 on success, -1 on failure (errno will indicate the error). + */ +int shutdown_netchan(netchan_t chan, bool read_before_closing); + +/** + * Get the open port number from the network channel. + * This is used when the federate sends a MSG_TYPE_ADDRESS_ADVERTISEMENT to the RTI, informing its port number. The RTI + * will save this port number, and send it to the other federate in a MSG_TYPE_ADDRESS_QUERY_REPLY message. + * + * @param chan The network channel. + * @return The port number of a server network channel. + */ +int32_t get_my_port(netchan_t chan); + +/** + * Get the port number of the connected peer. + * This is used by the RTI, when there is a request from the federate to the RTI, for the MSG_TYPE_ADDRESS_QUERY + * message. + * + * @param chan The network channel. + * @return Port number of the connected peer. + */ +int32_t get_server_port(netchan_t chan); + +/** + * Get the IP address of the connected peer. + * + * @param chan The network channel. + * @return Pointer to the server IP address + */ +struct in_addr* get_ip_addr(netchan_t chan); + +/** + * Get the hostname of the connected peer. + * + * @param chan The network channel. + * @return Pointer to the server hostname + */ +char* get_server_hostname(netchan_t chan); + +/** + * Set the user specified port to the created network channel. + * + * @param chan The network channel. + * @param port The user specified port + */ +void set_my_port(netchan_t chan, int32_t port); + +/** + * Set server port number to the target network channel. + * The federate and RTI receives the port number from another + * federate MSG_TYPE_ADDRESS_ADVERTISEMENT message. + * This function is used to set the network channel's target server port number. + * + * @param chan The network channel. + * @param port The target server's port + */ +void set_server_port(netchan_t chan, int32_t port); + +/** + * Set the target server's hostname to the network channel. + * + * @param chan The network channel. + * @param hostname The target server's hostname + */ +void set_server_hostname(netchan_t chan, const char* hostname); + +#endif /* NET_DRIVER_H */ diff --git a/include/core/federated/network/net_util.h b/network/api/net_util.h similarity index 99% rename from include/core/federated/network/net_util.h rename to network/api/net_util.h index 1e9008816..b945659c7 100644 --- a/include/core/federated/network/net_util.h +++ b/network/api/net_util.h @@ -51,10 +51,6 @@ THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "low_level_platform.h" #include "tag.h" -#ifdef FEDERATED -#include "socket_common.h" -#endif - #define HOST_LITTLE_ENDIAN 1 #define HOST_BIG_ENDIAN 2 diff --git a/include/core/federated/network/socket_common.h b/network/api/socket_common.h similarity index 85% rename from include/core/federated/network/socket_common.h rename to network/api/socket_common.h index 6d04994e4..05afc0e65 100644 --- a/include/core/federated/network/socket_common.h +++ b/network/api/socket_common.h @@ -1,7 +1,10 @@ #ifndef SOCKET_COMMON_H #define SOCKET_COMMON_H -#include "low_level_platform.h" +#include "low_level_platform.h" // lf_mutex_t +#include +#include +#include /** * The amount of time to wait after a failed socket read or write before trying again. This defaults to 100 ms. @@ -61,6 +64,11 @@ */ #define DEFAULT_PORT 15045u +/** + * Default port number for the RTI's clock server. + */ +#define DEFAULT_UDP_PORT 15061u + /** * Byte identifying that the federate or the RTI has failed. */ @@ -68,6 +76,23 @@ typedef enum socket_type_t { TCP, UDP } socket_type_t; +typedef struct socket_priv_t { + int socket_descriptor; + uint16_t port; // The port number. // + uint16_t user_specified_port; // Default as 0 for both RTI and federate. + + // The connected other side's info. The + char server_hostname[INET_ADDRSTRLEN]; // Human-readable IP address and + int32_t server_port; // port number of the socket server of the federate + // if it has any incoming direct connections from other federates. + // The port number will be -1 if there is no server or if the + // RTI has not been informed of the port number. + struct in_addr server_ip_addr; // Information about the IP address of the socket + // server of the federate. + + struct sockaddr_in UDP_addr; // The UDP address for the federate. +} socket_priv_t; + /** * @brief Create an IPv4 TCP socket with Nagle's algorithm disabled * (TCP_NODELAY) and Delayed ACKs disabled (TCP_QUICKACK). Exits application @@ -75,7 +100,7 @@ typedef enum socket_type_t { TCP, UDP } socket_type_t; * * @return The socket ID (a file descriptor). */ -int create_real_time_tcp_socket_errexit(); +int create_real_time_tcp_socket_errexit(void); /** * @brief Create a TCP server that listens for socket connections. @@ -93,12 +118,11 @@ int create_real_time_tcp_socket_errexit(); * @param port The port number to use or 0 to let the OS pick or 1 to start trying at DEFAULT_PORT. * @param final_socket Pointer to the returned socket descriptor on which accepting connections will occur. * @param final_port Pointer to the final port the server will use. - * @param sock_type Type of the socket, TCP or UDP. * @param increment_port_on_retry Boolean to retry port increment. * @return 0 for success, -1 for failure. */ -int create_server(uint16_t port, int* final_socket, uint16_t* final_port, socket_type_t sock_type, - bool increment_port_on_retry); +int create_socket_server(uint16_t port, int* final_socket, uint16_t* final_port, socket_type_t sock_type, + bool increment_port_on_retry); /** * Wait for an incoming connection request on the specified server socket. @@ -116,7 +140,6 @@ int create_server(uint16_t port, int* final_socket, uint16_t* final_port, socket * @return The file descriptor for the newly accepted socket on success, or -1 on failure * (with an appropriate error message printed). */ - int accept_socket(int socket, int rti_socket); /** @@ -190,6 +213,22 @@ void read_from_socket_fail_on_error(int* socket, size_t num_bytes, unsigned char */ ssize_t peek_from_socket(int socket, unsigned char* result); +/** + * Return true if either the socket to the RTI is broken or the socket is + * alive and the first unread byte on the socket's queue is MSG_TYPE_FAILED. + * @param socket Socket to check. + * @return True if closed, false if still connected. + */ +bool check_socket_closed(int socket); +/** + * Get the connected peer name from the connected socket. + * Set it to the server_ip_addr. Also, set server_hostname if LOG_LEVEL is higher than LOG_LEVEL_DEBUG. + * + * @param priv The socket_priv struct. + * @return 0 for success, -1 for failure. + */ +int get_peer_address(socket_priv_t* priv); + /** * Write the specified number of bytes to the specified socket from the * specified buffer. If an error occurs, return -1 and set errno to indicate diff --git a/network/impl/CMakeLists.txt b/network/impl/CMakeLists.txt new file mode 100644 index 000000000..225edf3d5 --- /dev/null +++ b/network/impl/CMakeLists.txt @@ -0,0 +1,25 @@ +set(LF_ROOT ${CMAKE_CURRENT_LIST_DIR}/../..) +include(${LF_ROOT}/core/lf_utils.cmake) + +add_library(lf-network-impl STATIC ${LF_NETWORK_FILES}) +add_library(lf::network-impl ALIAS lf-network-impl) +target_sources(lf-network-impl PUBLIC + ${CMAKE_CURRENT_LIST_DIR}/src/net_util.c + ${CMAKE_CURRENT_LIST_DIR}/src/socket_common.c +) + +if(COMM_TYPE MATCHES TCP) + target_sources(lf-network-impl PUBLIC ${CMAKE_CURRENT_LIST_DIR}/src/lf_socket_support.c) +else() + message(FATAL_ERROR "Your communication type is not supported! The C target supports TCP.") +endif() + +# Link necessary libraries +target_link_libraries(lf-network-impl PUBLIC lf-logging-api) +target_link_libraries(lf-network-impl PUBLIC lf-low-level-platform-api) +target_link_libraries(lf-network-impl PUBLIC lf::tag-api) +target_link_libraries(lf-network-impl PRIVATE lf-network-api) + +lf_enable_compiler_warnings(lf-network-impl) + +target_compile_definitions(lf-network-impl PUBLIC COMM_TYPE_${COMM_TYPE}) diff --git a/network/impl/src/lf_socket_support.c b/network/impl/src/lf_socket_support.c new file mode 100644 index 000000000..29f01da2e --- /dev/null +++ b/network/impl/src/lf_socket_support.c @@ -0,0 +1,212 @@ +#include // malloc() +#include // strerror() +#include // errno +#include // read() write() +#include // inet_ntop + +#include "net_driver.h" +#include "socket_common.h" +#include "util.h" + +static socket_priv_t* get_socket_priv_t(netchan_t chan) { + if (chan == NULL) { + lf_print_error("Network channel is already closed."); + return NULL; + } + return (socket_priv_t*)chan; +} + +netchan_t initialize_netchan() { + // Initialize priv. + socket_priv_t* priv = malloc(sizeof(socket_priv_t)); + if (priv == NULL) { + lf_print_error_and_exit("Falied to malloc socket_priv_t."); + } + + // Server initialization. + priv->port = 0; + priv->user_specified_port = 0; + priv->socket_descriptor = -1; + + // Federate initialization + strncpy(priv->server_hostname, "localhost", INET_ADDRSTRLEN); + priv->server_ip_addr.s_addr = 0; + priv->server_port = -1; + + return (netchan_t)priv; +} + +void free_netchan(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + free(priv); +} + +int create_server(netchan_t chan, bool increment_port_on_retry) { + socket_priv_t* priv = get_socket_priv_t(chan); + return create_socket_server(priv->user_specified_port, &priv->socket_descriptor, &priv->port, TCP, + increment_port_on_retry); +} + +netchan_t accept_netchan(netchan_t server_chan, netchan_t rti_chan) { + socket_priv_t* serv_priv = get_socket_priv_t(server_chan); + int rti_socket; + if (rti_chan == NULL) { + // Set to -1, to indicate that this accept_netchan() call is not trying to check if the rti_chan is available, + // inside the accept_socket() function. + rti_socket = -1; + } else { + socket_priv_t* rti_priv = get_socket_priv_t(rti_chan); + rti_socket = rti_priv->socket_descriptor; + } + netchan_t fed_netchan = initialize_netchan(); + socket_priv_t* fed_priv = get_socket_priv_t(fed_netchan); + + int sock = accept_socket(serv_priv->socket_descriptor, rti_socket); + if (sock == -1) { + free_netchan(fed_netchan); + return NULL; + } + fed_priv->socket_descriptor = sock; + // Get the peer address from the connected socket_id. Saving this for the address query. + if (get_peer_address(fed_priv) != 0) { + lf_print_error("RTI failed to get peer address."); + }; + return fed_netchan; +} + +void create_client(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + priv->socket_descriptor = create_real_time_tcp_socket_errexit(); +} + +int connect_to_netchan(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return connect_to_socket(priv->socket_descriptor, priv->server_hostname, priv->server_port); +} + +int read_from_netchan(netchan_t chan, size_t num_bytes, unsigned char* buffer) { + socket_priv_t* priv = get_socket_priv_t(chan); + return read_from_socket(priv->socket_descriptor, num_bytes, buffer); +} + +int read_from_netchan_close_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer) { + socket_priv_t* priv = get_socket_priv_t(chan); + int read_failed = read_from_netchan(chan, num_bytes, buffer); + if (read_failed) { + // Read failed. + // Socket has probably been closed from the other side. + // Shut down and close the socket from this side. + shutdown_socket(&priv->socket_descriptor, false); + return -1; + } + return 0; +} + +void read_from_netchan_fail_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, + char* format, ...) { + va_list args; + int read_failed = read_from_netchan_close_on_error(chan, num_bytes, buffer); + if (read_failed) { + // Read failed. + if (mutex != NULL) { + LF_MUTEX_UNLOCK(mutex); + } + if (format != NULL) { + va_start(args, format); + lf_print_error_system_failure(format, args); + va_end(args); + } else { + lf_print_error_system_failure("Failed to read from socket."); + } + } +} + +int write_to_netchan(netchan_t chan, size_t num_bytes, unsigned char* buffer) { + socket_priv_t* priv = get_socket_priv_t(chan); + return write_to_socket(priv->socket_descriptor, num_bytes, buffer); +} + +int write_to_netchan_close_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer) { + socket_priv_t* priv = get_socket_priv_t(chan); + int result = write_to_netchan(chan, num_bytes, buffer); + if (result) { + // Write failed. + // Socket has probably been closed from the other side. + // Shut down and close the socket from this side. + shutdown_socket(&priv->socket_descriptor, false); + } + return result; +} + +void write_to_netchan_fail_on_error(netchan_t chan, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, + char* format, ...) { + va_list args; + int result = write_to_netchan_close_on_error(chan, num_bytes, buffer); + if (result) { + // Write failed. + if (mutex != NULL) { + LF_MUTEX_UNLOCK(mutex); + } + if (format != NULL) { + va_start(args, format); + lf_print_error_system_failure(format, args); + va_end(args); + } else { + lf_print_error("Failed to write to socket. Closing it."); + } + } +} + +bool check_netchan_closed(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return check_socket_closed(priv->socket_descriptor); +} + +int shutdown_netchan(netchan_t chan, bool read_before_closing) { + if (chan == NULL) { + lf_print("Socket already closed."); + return 0; + } + socket_priv_t* priv = get_socket_priv_t(chan); + int ret = shutdown_socket(&priv->socket_descriptor, read_before_closing); + if (ret != 0) { + lf_print_error("Failed to shutdown socket."); + } + free_netchan(chan); + return ret; +} + +int32_t get_my_port(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return priv->port; +} + +int32_t get_server_port(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return priv->server_port; +} + +struct in_addr* get_ip_addr(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return &priv->server_ip_addr; +} + +char* get_server_hostname(netchan_t chan) { + socket_priv_t* priv = get_socket_priv_t(chan); + return priv->server_hostname; +} + +void set_my_port(netchan_t chan, int32_t port) { + socket_priv_t* priv = get_socket_priv_t(chan); + priv->port = port; +} + +void set_server_port(netchan_t chan, int32_t port) { + socket_priv_t* priv = get_socket_priv_t(chan); + priv->server_port = port; +} + +void set_server_hostname(netchan_t chan, const char* hostname) { + socket_priv_t* priv = get_socket_priv_t(chan); + memcpy(priv->server_hostname, hostname, INET_ADDRSTRLEN); +} diff --git a/core/federated/network/net_util.c b/network/impl/src/net_util.c similarity index 98% rename from core/federated/network/net_util.c rename to network/impl/src/net_util.c index bcea05495..3565fcb4e 100644 --- a/core/federated/network/net_util.c +++ b/network/impl/src/net_util.c @@ -37,10 +37,8 @@ THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include // Defines va_list #include #include -#include // Defines memcpy() -#include // Defines nanosleep() -#include // IPPROTO_TCP, IPPROTO_UDP -#include // TCP_NODELAY +#include // Defines memcpy() +#include // Defines nanosleep() #include "net_util.h" #include "util.h" @@ -82,7 +80,7 @@ void encode_uint16(uint16_t data, unsigned char* buffer) { buffer[1] = (unsigned char)((data & 0xff00) >> 8); } -int host_is_big_endian() { +int host_is_big_endian(void) { static int host = 0; union { uint32_t uint; diff --git a/core/federated/network/socket_common.c b/network/impl/src/socket_common.c similarity index 85% rename from core/federated/network/socket_common.c rename to network/impl/src/socket_common.c index 8df2bd5c4..e5b350042 100644 --- a/core/federated/network/socket_common.c +++ b/network/impl/src/socket_common.c @@ -1,6 +1,7 @@ #include // Defines read(), write(), and close() #include // IPPROTO_TCP, IPPROTO_UDP #include // TCP_NODELAY +#include // inet_ntop #include #include #include @@ -11,7 +12,7 @@ #include // strerror #include "util.h" -#include "socket_common.h" +#include "net_driver.h" #ifndef NUMBER_OF_FEDERATES #define NUMBER_OF_FEDERATES 1 @@ -20,10 +21,10 @@ /** Number of nanoseconds to sleep before retrying a socket read. */ #define SOCKET_READ_RETRY_INTERVAL 1000000 -// Mutex lock held while performing socket shutdown and close operations. +// Mutex lock held while performing network channel shutdown and close operations. lf_mutex_t shutdown_mutex; -int create_real_time_tcp_socket_errexit() { +int create_real_time_tcp_socket_errexit(void) { int sock = socket(AF_INET, SOCK_STREAM, IPPROTO_TCP); if (sock < 0) { lf_print_error_system_failure("Could not open TCP socket."); @@ -132,8 +133,8 @@ static int set_socket_bind_option(int socket_descriptor, uint16_t specified_port return used_port; } -int create_server(uint16_t port, int* final_socket, uint16_t* final_port, socket_type_t sock_type, - bool increment_port_on_retry) { +int create_socket_server(uint16_t port, int* final_socket, uint16_t* final_port, socket_type_t sock_type, + bool increment_port_on_retry) { int socket_descriptor; struct timeval timeout_time; if (sock_type == TCP) { @@ -169,11 +170,7 @@ int create_server(uint16_t port, int* final_socket, uint16_t* final_port, socket return 0; } -/** - * Return true if either the socket to the RTI is broken or the socket is - * alive and the first unread byte on the socket's queue is MSG_TYPE_FAILED. - */ -static bool check_socket_closed(int socket) { +bool check_socket_closed(int socket) { unsigned char first_byte; ssize_t bytes = peek_from_socket(socket, &first_byte); if (bytes < 0 || (bytes == 1 && first_byte == MSG_TYPE_FAILED)) { @@ -183,6 +180,28 @@ static bool check_socket_closed(int socket) { } } +int get_peer_address(socket_priv_t* priv) { + struct sockaddr_in peer_addr; + socklen_t addr_len = sizeof(peer_addr); + if (getpeername(priv->socket_descriptor, (struct sockaddr*)&peer_addr, &addr_len) != 0) { + lf_print_error("Failed to get peer address."); + return -1; + } + priv->server_ip_addr = peer_addr.sin_addr; + +#if LOG_LEVEL >= LOG_LEVEL_DEBUG + // Create the human readable format and copy that into + // the .server_hostname field of the federate. + char str[INET_ADDRSTRLEN + 1]; + inet_ntop(AF_INET, &priv->server_ip_addr, str, INET_ADDRSTRLEN); + strncpy(priv->server_hostname, str, INET_ADDRSTRLEN - 1); // Copy up to INET_ADDRSTRLEN - 1 characters + priv->server_hostname[INET_ADDRSTRLEN - 1] = '\0'; // Null-terminate explicitly + + LF_PRINT_DEBUG("Got address %s", priv->server_hostname); +#endif + return 0; +} + int accept_socket(int socket, int rti_socket) { struct sockaddr client_fd; // Wait for an incoming connection request. @@ -197,14 +216,15 @@ int accept_socket(int socket, int rti_socket) { break; } else if (socket_id < 0 && (errno != EAGAIN || errno != EWOULDBLOCK || errno != EINTR)) { lf_print_warning("Failed to accept the socket. %s.", strerror(errno)); - break; + return -1; } else if (errno == EPERM) { lf_print_error_system_failure("Firewall permissions prohibit connection."); + return -1; } else { // For the federates, it should check if the rti_socket is still open, before retrying accept(). if (rti_socket != -1) { if (check_socket_closed(rti_socket)) { - break; + return -1; } } // Try again @@ -259,8 +279,10 @@ int connect_to_socket(int sock, const char* hostname, int port) { } lf_print_warning("Could not connect. Will try again every " PRINTF_TIME " nanoseconds. Connecting to port %d.\n", CONNECT_RETRY_INTERVAL, used_port); + freeaddrinfo(result); continue; } else { + freeaddrinfo(result); break; } freeaddrinfo(result); @@ -297,39 +319,6 @@ int read_from_socket(int socket, size_t num_bytes, unsigned char* buffer) { return 0; } -int read_from_socket_close_on_error(int* socket, size_t num_bytes, unsigned char* buffer) { - assert(socket); - int read_failed = read_from_socket(*socket, num_bytes, buffer); - if (read_failed) { - // Read failed. - // Socket has probably been closed from the other side. - // Shut down and close the socket from this side. - shutdown_socket(socket, false); - return -1; - } - return 0; -} - -void read_from_socket_fail_on_error(int* socket, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, - char* format, ...) { - va_list args; - assert(socket); - int read_failed = read_from_socket_close_on_error(socket, num_bytes, buffer); - if (read_failed) { - // Read failed. - if (mutex != NULL) { - LF_MUTEX_UNLOCK(mutex); - } - if (format != NULL) { - va_start(args, format); - lf_print_error_system_failure(format, args); - va_end(args); - } else { - lf_print_error_system_failure("Failed to read from socket."); - } - } -} - ssize_t peek_from_socket(int socket, unsigned char* result) { ssize_t bytes_read = recv(socket, result, 1, MSG_DONTWAIT | MSG_PEEK); if (bytes_read < 0 && (errno == EAGAIN || errno == EWOULDBLOCK)) @@ -364,38 +353,6 @@ int write_to_socket(int socket, size_t num_bytes, unsigned char* buffer) { return 0; } -int write_to_socket_close_on_error(int* socket, size_t num_bytes, unsigned char* buffer) { - assert(socket); - int result = write_to_socket(*socket, num_bytes, buffer); - if (result) { - // Write failed. - // Socket has probably been closed from the other side. - // Shut down and close the socket from this side. - shutdown_socket(socket, false); - } - return result; -} - -void write_to_socket_fail_on_error(int* socket, size_t num_bytes, unsigned char* buffer, lf_mutex_t* mutex, - char* format, ...) { - va_list args; - assert(socket); - int result = write_to_socket_close_on_error(socket, num_bytes, buffer); - if (result) { - // Write failed. - if (mutex != NULL) { - LF_MUTEX_UNLOCK(mutex); - } - if (format != NULL) { - va_start(args, format); - lf_print_error_system_failure(format, args); - va_end(args); - } else { - lf_print_error("Failed to write to socket. Closing it."); - } - } -} - void init_shutdown_mutex(void) { LF_MUTEX_INIT(&shutdown_mutex); } int shutdown_socket(int* socket, bool read_before_closing) {