Retro68/gcc/libcody/cody.hh
2022-10-27 20:55:19 +02:00

805 lines
22 KiB
C++

// CODYlib -*- mode:c++ -*-
// Copyright (C) 2020 Nathan Sidwell, nathan@acm.org
// License: Apache v2.0
#ifndef CODY_HH
#define CODY_HH 1
// If the user specifies this as non-zero, it must be what we expect,
// generally only good for requesting no networking
#if !defined (CODY_NETWORKING)
// Have a known-good list of networking systems
#if defined (__unix__) || defined (__MACH__)
#define CODY_NETWORKING 1
#else
#define CODY_NETWORKING 0
#endif
#if 0 // For testing
#undef CODY_NETWORKING
#define CODY_NETWORKING 0
#endif
#endif
// C++
#include <memory>
#include <string>
#include <vector>
// C
#include <cstddef>
// OS
#include <errno.h>
#include <sys/types.h>
#if CODY_NETWORKING
#include <sys/socket.h>
#endif
namespace Cody {
// Set version to 1, as this is completely incompatible with 0.
// Fortunately both versions 0 and 1 will recognize each other's HELLO
// messages sufficiently to error out
constexpr unsigned Version = 1;
// FIXME: I guess we need a file-handle abstraction here
// Is windows DWORDPTR still?, or should it be FILE *? (ew).
namespace Detail {
// C++11 doesn't have utf8 character literals :(
template<unsigned I>
constexpr char S2C (char const (&s)[I])
{
static_assert (I == 2, "only single octet strings may be converted");
return s[0];
}
/// Internal buffering class. Used to concatenate outgoing messages
/// and Lex incoming ones.
class MessageBuffer
{
std::vector<char> buffer; ///< buffer holding the message
size_t lastBol = 0; ///< location of the most recent Beginning Of
///< Line, or position we've readed when writing
public:
MessageBuffer () = default;
~MessageBuffer () = default;
MessageBuffer (MessageBuffer &&) = default;
MessageBuffer &operator= (MessageBuffer &&) = default;
public:
///
/// Finalize a buffer to be written. No more lines can be added to
/// the buffer. Use before a sequence of Write calls.
void PrepareToWrite ()
{
buffer.push_back (u8"\n"[0]);
lastBol = 0;
}
///
/// Prepare a buffer for reading. Use before a sequence of Read calls.
void PrepareToRead ()
{
buffer.clear ();
lastBol = 0;
}
public:
/// Begin a message line. Use before a sequence of Append and
/// related calls.
void BeginLine ();
/// End a message line. Use after a sequence of Append and related calls.
void EndLine () {}
public:
/// Append a string to the current line. No whitespace is prepended
/// or appended.
///
/// @param str the string to be written
/// @param maybe_quote indicate if there's a possibility the string
/// contains characters that need quoting. Defaults to false.
/// It is always safe to set
/// this true, but that causes an additional scan of the string.
/// @param len The length of the string. If not specified, strlen
/// is used to find the length.
void Append (char const *str, bool maybe_quote = false,
size_t len = ~size_t (0));
///
/// Add whitespace word separator. Multiple adjacent whitespace is fine.
void Space ()
{
Append (Detail::S2C(u8" "));
}
public:
/// Add a word as with Append, but prefixing whitespace to make a
/// separate word
void AppendWord (char const *str, bool maybe_quote = false,
size_t len = ~size_t (0))
{
if (buffer.size () != lastBol)
Space ();
Append (str, maybe_quote, len);
}
/// Add a word as with AppendWord
/// @param str the string to append
/// @param maybe_quote string might need quoting, as for Append
void AppendWord (std::string const &str, bool maybe_quote = false)
{
AppendWord (str.data (), maybe_quote, str.size ());
}
///
/// Add an integral value, prepending a space.
void AppendInteger (unsigned u);
private:
/// Append a literal character.
/// @param c character to append
void Append (char c);
public:
/// Lex the next input line into a vector of words.
/// @param words filled with a vector of lexed strings
/// @result 0 if no errors, an errno value on lexxing error such as
/// there being no next line (ENOENT), or malformed quoting (EINVAL)
int Lex (std::vector<std::string> &words);
public:
/// Append the most-recently lexxed line to a string. May be useful
/// in error messages. The unparsed line is appended -- before any
/// unquoting.
/// If we had c++17 string_view, we'd simply return a view of the
/// line, and leave it to the caller to do any concatenation.
/// @param l string to-which the lexxed line is appended.
void LexedLine (std::string &l);
public:
/// Detect if we have reached the end of the input buffer.
/// I.e. there are no more lines to Lex
/// @result True if at end
bool IsAtEnd () const
{
return lastBol == buffer.size ();
}
public:
/// Read from end point into a read buffer, as with read(2). This will
/// not block , unless FD is blocking, and there is nothing
/// immediately available.
/// @param fd file descriptor to read from. This may be a regular
/// file, pipe or socket.
/// @result on error returns errno. If end of file occurs, returns
/// -1. At end of message returns 0. If there is more needed
/// returns EAGAIN (or possibly EINTR). If the message is
/// malformed, returns EINVAL.
int Read (int fd) noexcept;
public:
/// Write to an end point from a write buffer, as with write(2). As
/// with Read, this will not usually block.
/// @param fd file descriptor to write to. This may be a regular
/// file, pipe or socket.
/// @result on error returns errno.
/// At end of message returns 0. If there is more to write
/// returns EAGAIN (or possibly EINTR).
int Write (int fd) noexcept;
};
///
/// Request codes. Perhaps this should be exposed? These are likely
/// useful to servers that queue requests.
enum RequestCode
{
RC_CONNECT,
RC_MODULE_REPO,
RC_MODULE_EXPORT,
RC_MODULE_IMPORT,
RC_MODULE_COMPILED,
RC_INCLUDE_TRANSLATE,
RC_HWM
};
/// Internal file descriptor tuple. It's used as an anonymous union member.
struct FD
{
int from; ///< Read from this FD
int to; ///< Write to this FD
};
}
// Flags for various requests
enum class Flags : unsigned
{
None,
NameOnly = 1<<0, // Only querying for CMI names, not contents
};
inline Flags operator& (Flags a, Flags b)
{
return Flags (unsigned (a) & unsigned (b));
}
inline Flags operator| (Flags a, Flags b)
{
return Flags (unsigned (a) | unsigned (b));
}
///
/// Response data for a request. Returned by Client's request calls,
/// which return a single Packet. When the connection is Corked, the
/// Uncork call will return a vector of Packets.
class Packet
{
public:
///
/// Packet is a variant structure. These are the possible content types.
enum Category { INTEGER, STRING, VECTOR};
private:
// std:variant is a C++17 thing, so we're doing this ourselves.
union
{
size_t integer; ///< Integral value
std::string string; ///< String value
std::vector<std::string> vector; ///< Vector of string value
};
Category cat : 2; ///< Discriminator
private:
unsigned short code = 0; ///< Packet type
unsigned short request = 0;
public:
Packet (unsigned c, size_t i = 0)
: integer (i), cat (INTEGER), code (c)
{
}
Packet (unsigned c, std::string &&s)
: string (std::move (s)), cat (STRING), code (c)
{
}
Packet (unsigned c, std::string const &s)
: string (s), cat (STRING), code (c)
{
}
Packet (unsigned c, std::vector<std::string> &&v)
: vector (std::move (v)), cat (VECTOR), code (c)
{
}
// No non-move constructor from a vector. You should not be doing
// that.
// Only move constructor and move assignment
Packet (Packet &&t)
{
Create (std::move (t));
}
Packet &operator= (Packet &&t)
{
Destroy ();
Create (std::move (t));
return *this;
}
~Packet ()
{
Destroy ();
}
private:
///
/// Variant move creation from another packet
void Create (Packet &&t);
///
/// Variant destruction
void Destroy ();
public:
///
/// Return the packet type
unsigned GetCode () const
{
return code;
}
///
/// Return the packet type
unsigned GetRequest () const
{
return request;
}
void SetRequest (unsigned r)
{
request = r;
}
///
/// Return the category of the packet's payload
Category GetCategory () const
{
return cat;
}
public:
///
/// Return an integral payload. Undefined if the category is not INTEGER
size_t GetInteger () const
{
return integer;
}
///
/// Return (a reference to) a string payload. Undefined if the
/// category is not STRING
std::string const &GetString () const
{
return string;
}
std::string &GetString ()
{
return string;
}
///
/// Return (a reference to) a constant vector of strings payload.
/// Undefined if the category is not VECTOR
std::vector<std::string> const &GetVector () const
{
return vector;
}
///
/// Return (a reference to) a non-conatant vector of strings payload.
/// Undefined if the category is not VECTOR
std::vector<std::string> &GetVector ()
{
return vector;
}
};
class Server;
///
/// Client-side (compiler) object.
class Client
{
public:
/// Response packet codes
enum PacketCode
{
PC_CORKED, ///< Messages are corked
PC_CONNECT, ///< Packet is integer version
PC_ERROR, ///< Packet is error string
PC_OK,
PC_BOOL,
PC_PATHNAME
};
private:
Detail::MessageBuffer write; ///< Outgoing write buffer
Detail::MessageBuffer read; ///< Incoming read buffer
std::string corked; ///< Queued request tags
union
{
Detail::FD fd; ///< FDs connecting to server
Server *server; ///< Directly connected server
};
bool is_direct = false; ///< Discriminator
bool is_connected = false; /// Connection handshake succesful
private:
Client ();
public:
/// Direct connection constructor.
/// @param s Server to directly connect
Client (Server *s)
: Client ()
{
is_direct = true;
server = s;
}
/// Communication connection constructor
/// @param from file descriptor to read from
/// @param to file descriptor to write to, defaults to from
Client (int from, int to = -1)
: Client ()
{
fd.from = from;
fd.to = to < 0 ? from : to;
}
~Client ();
// We have to provide our own move variants, because of the variant member.
Client (Client &&);
Client &operator= (Client &&);
public:
///
/// Direct connection predicate
bool IsDirect () const
{
return is_direct;
}
///
/// Successful handshake predicate
bool IsConnected () const
{
return is_connected;
}
public:
///
/// Get the read FD
/// @result the FD to read from, -1 if a direct connection
int GetFDRead () const
{
return is_direct ? -1 : fd.from;
}
///
/// Get the write FD
/// @result the FD to write to, -1 if a direct connection
int GetFDWrite () const
{
return is_direct ? -1 : fd.to;
}
///
/// Get the directly-connected server
/// @result the server, or nullptr if a communication connection
Server *GetServer () const
{
return is_direct ? server : nullptr;
}
public:
///
/// Perform connection handshake. All othe requests will result in
/// errors, until handshake is succesful.
/// @param agent compiler identification
/// @param ident compilation identifiation (maybe nullptr)
/// @param alen length of agent string, if known
/// @param ilen length of ident string, if known
/// @result packet indicating success (or deferrment) of the
/// connection, payload is optional flags
Packet Connect (char const *agent, char const *ident,
size_t alen = ~size_t (0), size_t ilen = ~size_t (0));
/// std::string wrapper for connection
/// @param agent compiler identification
/// @param ident compilation identification
Packet Connect (std::string const &agent, std::string const &ident)
{
return Connect (agent.c_str (), ident.c_str (),
agent.size (), ident.size ());
}
public:
/// Request compiler module repository
/// @result packet indicating repo
Packet ModuleRepo ();
public:
/// Inform of compilation of a named module interface or partition,
/// or a header unit
/// @param str module or header-unit
/// @param len name length, if known
/// @result CMI name (or deferrment/error)
Packet ModuleExport (char const *str, Flags flags, size_t len = ~size_t (0));
Packet ModuleExport (char const *str)
{
return ModuleExport (str, Flags::None, ~size_t (0));
}
Packet ModuleExport (std::string const &s, Flags flags = Flags::None)
{
return ModuleExport (s.c_str (), flags, s.size ());
}
public:
/// Importation of a module, partition or header-unit
/// @param str module or header-unit
/// @param len name length, if known
/// @result CMI name (or deferrment/error)
Packet ModuleImport (char const *str, Flags flags, size_t len = ~size_t (0));
Packet ModuleImport (char const *str)
{
return ModuleImport (str, Flags::None, ~size_t (0));
}
Packet ModuleImport (std::string const &s, Flags flags = Flags::None)
{
return ModuleImport (s.c_str (), flags, s.size ());
}
public:
/// Successful compilation of a module interface, partition or
/// header-unit. Must have been preceeded by a ModuleExport
/// request.
/// @param str module or header-unit
/// @param len name length, if known
/// @result OK (or deferment/error)
Packet ModuleCompiled (char const *str, Flags flags, size_t len = ~size_t (0));
Packet ModuleCompiled (char const *str)
{
return ModuleCompiled (str, Flags::None, ~size_t (0));
}
Packet ModuleCompiled (std::string const &s, Flags flags = Flags::None)
{
return ModuleCompiled (s.c_str (), flags, s.size ());
}
/// Include translation query.
/// @param str header unit name
/// @param len name length, if known
/// @result Packet indicating include translation boolean, or CMI
/// name (or deferment/error)
Packet IncludeTranslate (char const *str, Flags flags,
size_t len = ~size_t (0));
Packet IncludeTranslate (char const *str)
{
return IncludeTranslate (str, Flags::None, ~size_t (0));
}
Packet IncludeTranslate (std::string const &s, Flags flags = Flags::None)
{
return IncludeTranslate (s.c_str (), flags, s.size ());
}
public:
/// Cork the connection. All requests are queued up. Each request
/// call will return a PC_CORKED packet.
void Cork ();
/// Uncork the connection. All queued requests are sent to the
/// server, and a block of responses waited for.
/// @result A vector of packets, containing the in-order responses to the
/// queued requests.
std::vector<Packet> Uncork ();
///
/// Indicate corkedness of connection
bool IsCorked () const
{
return !corked.empty ();
}
private:
Packet ProcessResponse (std::vector<std::string> &, unsigned code,
bool isLast);
Packet MaybeRequest (unsigned code);
int CommunicateWithServer ();
};
/// This server-side class is used to resolve requests from one or
/// more clients. You are expected to derive from it and override the
/// virtual functions it provides. The connection resolver may return
/// a different resolved object to service the remainder of the
/// connection -- for instance depending on the compiler that is
/// making the requests.
class Resolver
{
public:
Resolver () = default;
virtual ~Resolver ();
protected:
/// Mapping from a module or header-unit name to a CMI file name.
/// @param module module name
/// @result CMI name
virtual std::string GetCMIName (std::string const &module);
/// Return the CMI file suffix to use
/// @result CMI suffix, a statically allocated string
virtual char const *GetCMISuffix ();
public:
/// When the requests of a directly-connected server are processed,
/// we may want to wait for the requests to complete (for instance a
/// set of subjobs).
/// @param s directly connected server.
virtual void WaitUntilReady (Server *s);
public:
/// Provide an error response.
/// @param s the server to provide the response to.
/// @param msg the error message
virtual void ErrorResponse (Server *s, std::string &&msg);
public:
/// Connection handshake. Provide response to server and return new
/// (or current) resolver, or nullptr.
/// @param s server to provide response to
/// @param version the client's version number
/// @param agent the client agent (compiler identification)
/// @param ident the compilation identification (may be empty)
/// @result nullptr in the case of an error. An error response will
/// be sent. If handing off to another resolver, return that,
/// otherwise this
virtual Resolver *ConnectRequest (Server *s, unsigned version,
std::string &agent, std::string &ident);
public:
// return 0 on ok, ERRNO on failure, -1 on unspecific error
virtual int ModuleRepoRequest (Server *s);
virtual int ModuleExportRequest (Server *s, Flags flags,
std::string &module);
virtual int ModuleImportRequest (Server *s, Flags flags,
std::string &module);
virtual int ModuleCompiledRequest (Server *s, Flags flags,
std::string &module);
virtual int IncludeTranslateRequest (Server *s, Flags flags,
std::string &include);
};
/// This server-side (build system) class handles a single connection
/// to a client. It has 3 states, READING:accumulating a message
/// block froma client, WRITING:writing a message block to a client
/// and PROCESSING:resolving requests. If the server does not spawn
/// jobs to build needed artifacts, the PROCESSING state will be brief.
class Server
{
public:
enum Direction
{
READING, // Server is waiting for completion of a (set of)
// requests from client. The next state will be PROCESSING.
WRITING, // Server is writing a (set of) responses to client.
// The next state will be READING.
PROCESSING // Server is processing client request(s). The next
// state will be WRITING.
};
private:
Detail::MessageBuffer write;
Detail::MessageBuffer read;
Resolver *resolver;
Detail::FD fd;
bool is_connected = false;
Direction direction : 2;
public:
Server (Resolver *r);
Server (Resolver *r, int from, int to = -1)
: Server (r)
{
fd.from = from;
fd.to = to >= 0 ? to : from;
}
~Server ();
Server (Server &&);
Server &operator= (Server &&);
public:
bool IsConnected () const
{
return is_connected;
}
public:
void SetDirection (Direction d)
{
direction = d;
}
public:
Direction GetDirection () const
{
return direction;
}
int GetFDRead () const
{
return fd.from;
}
int GetFDWrite () const
{
return fd.to;
}
Resolver *GetResolver () const
{
return resolver;
}
public:
/// Process requests from a directly-connected client. This is a
/// small wrapper around ProcessRequests, with some buffer swapping
/// for communication. It is expected that such processessing is
/// immediate.
/// @param from message block from client
/// @param to message block to client
void DirectProcess (Detail::MessageBuffer &from, Detail::MessageBuffer &to);
public:
/// Process the messages queued in the read buffer. We enter the
/// PROCESSING state, and each message line causes various resolver
/// methods to be called. Once processed, the server may need to
/// wait for all the requests to be ready, or it may be able to
/// immediately write responses back.
void ProcessRequests ();
public:
/// Accumulate an error response.
/// @param error the error message to encode
/// @param elen length of error, if known
void ErrorResponse (char const *error, size_t elen = ~size_t (0));
void ErrorResponse (std::string const &error)
{
ErrorResponse (error.data (), error.size ());
}
/// Accumulate an OK response
void OKResponse ();
/// Accumulate a boolean response
void BoolResponse (bool);
/// Accumulate a pathname response
/// @param path (may be nullptr, or empty)
/// @param rlen length, if known
void PathnameResponse (char const *path, size_t plen = ~size_t (0));
void PathnameResponse (std::string const &path)
{
PathnameResponse (path.data (), path.size ());
}
public:
/// Accumulate a (successful) connection response
/// @param agent the server-side agent
/// @param alen agent length, if known
void ConnectResponse (char const *agent, size_t alen = ~size_t (0));
void ConnectResponse (std::string const &agent)
{
ConnectResponse (agent.data (), agent.size ());
}
public:
/// Write message block to client. Semantics as for
/// MessageBuffer::Write.
/// @result errno or completion (0).
int Write ()
{
return write.Write (fd.to);
}
/// Initialize for writing a message block. All responses to the
/// incomping message block must be complete Enters WRITING state.
void PrepareToWrite ()
{
write.PrepareToWrite ();
direction = WRITING;
}
public:
/// Read message block from client. Semantics as for
/// MessageBuffer::Read.
/// @result errno, eof (-1) or completion (0)
int Read ()
{
return read.Read (fd.from);
}
/// Initialize for reading a message block. Enters READING state.
void PrepareToRead ()
{
read.PrepareToRead ();
direction = READING;
}
};
// Helper network stuff
#if CODY_NETWORKING
// Socket with specific address
int OpenSocket (char const **, sockaddr const *sock, socklen_t len);
int ListenSocket (char const **, sockaddr const *sock, socklen_t len,
unsigned backlog);
// Local domain socket (eg AF_UNIX)
int OpenLocal (char const **, char const *name);
int ListenLocal (char const **, char const *name, unsigned backlog = 0);
// ipv6 socket
int OpenInet6 (char const **e, char const *name, int port);
int ListenInet6 (char const **, char const *name, int port,
unsigned backlog = 0);
#endif
// FIXME: Mapping file utilities?
}
#endif // CODY_HH