2019-08-04 19:52:54 +02:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
import argparse
|
|
|
|
import asyncio
|
|
|
|
import datetime
|
2019-08-05 03:42:27 +02:00
|
|
|
import mimetypes
|
|
|
|
import os
|
2019-08-04 19:52:54 +02:00
|
|
|
import ssl
|
|
|
|
import sys
|
2019-08-06 00:47:59 +02:00
|
|
|
import typing
|
2019-08-04 19:52:54 +02:00
|
|
|
|
2019-08-05 04:02:18 +02:00
|
|
|
__version__ = "0.0.1"
|
2019-08-04 19:52:54 +02:00
|
|
|
__title__ = "Jetforce Gemini Server"
|
|
|
|
__author__ = "Michael Lazar"
|
|
|
|
__license__ = "GNU General Public License v3.0"
|
|
|
|
__copyright__ = "(c) 2019 Michael Lazar"
|
|
|
|
|
|
|
|
|
|
|
|
ABOUT = fr"""
|
2019-08-05 03:42:27 +02:00
|
|
|
You are now riding on...
|
2019-08-04 19:52:54 +02:00
|
|
|
_________ _____________
|
|
|
|
______ /______ /___ __/_______________________
|
|
|
|
___ _ /_ _ \ __/_ /_ _ __ \_ ___/ ___/ _ \
|
|
|
|
/ /_/ / / __/ /_ _ __/ / /_/ / / / /__ / __/
|
|
|
|
\____/ \___/\__/ /_/ \____//_/ \___/ \___/
|
|
|
|
|
2019-08-05 03:42:27 +02:00
|
|
|
An Experimental Gemini Server, v{__version__}
|
2019-08-04 19:52:54 +02:00
|
|
|
https://github.com/michael-lazar/jetforce
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
# Gemini response status codes
|
|
|
|
STATUS_SUCCESS = 2
|
|
|
|
STATUS_NOT_FOUND = 4
|
|
|
|
STATUS_SERVER_ERROR = 5
|
|
|
|
|
|
|
|
# Gemini response status codes, provisional
|
|
|
|
STATUS_MOVED = 3
|
|
|
|
STATUS_TOO_MANY_REQUESTS = 9
|
|
|
|
|
|
|
|
|
|
|
|
class EchoApp:
|
|
|
|
"""
|
2019-08-05 03:42:27 +02:00
|
|
|
A simple application that echos back the requested path.
|
2019-08-04 19:52:54 +02:00
|
|
|
"""
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def __init__(self, environ: dict, send_status: typing.Callable) -> None:
|
2019-08-04 19:52:54 +02:00
|
|
|
self.environ = environ
|
|
|
|
self.send_status = send_status
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def __iter__(self) -> typing.Iterator[bytes]:
|
2019-08-04 19:52:54 +02:00
|
|
|
self.send_status(STATUS_SUCCESS, "text/plain")
|
|
|
|
path = self.environ["PATH"]
|
|
|
|
yield f"Received path: {path}".encode()
|
|
|
|
|
|
|
|
|
2019-08-05 03:42:27 +02:00
|
|
|
class StaticDirectoryApp:
|
|
|
|
"""
|
|
|
|
Serve a static directory over Gemini.
|
|
|
|
|
|
|
|
If a directory contains a hidden file with the name ".gemini", that file
|
|
|
|
will be returned when the directory path is requested. Otherwise, a
|
|
|
|
directory listing will be auto-generated.
|
|
|
|
"""
|
|
|
|
|
|
|
|
root: str = "/var/gemini"
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def __init__(self, environ: dict, send_status: typing.Callable) -> None:
|
2019-08-05 03:42:27 +02:00
|
|
|
self.environ = environ
|
|
|
|
self.send_status = send_status
|
|
|
|
|
|
|
|
self.mimetypes = mimetypes.MimeTypes()
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def __iter__(self) -> typing.Iterator[bytes]:
|
2019-08-05 03:42:27 +02:00
|
|
|
filename = self.environ["PATH"]
|
|
|
|
filename = filename.lstrip("/")
|
|
|
|
|
|
|
|
abs_filename = os.path.abspath(os.path.join(self.root, filename))
|
|
|
|
if not abs_filename.startswith(self.root):
|
|
|
|
# Guard against breaking out of the directory
|
|
|
|
self.send_status(STATUS_NOT_FOUND, "Not Found")
|
|
|
|
|
|
|
|
elif os.path.isfile(abs_filename):
|
|
|
|
mimetype = self.guess_mimetype(abs_filename)
|
|
|
|
yield from self.load_file(abs_filename, mimetype)
|
|
|
|
|
|
|
|
elif os.path.isdir(abs_filename):
|
|
|
|
gemini_map_file = os.path.join(abs_filename, ".gemini")
|
|
|
|
if os.path.exists(gemini_map_file):
|
|
|
|
yield from self.load_file(gemini_map_file, "text/gemini")
|
|
|
|
else:
|
|
|
|
yield from self.list_directory(abs_filename)
|
|
|
|
|
|
|
|
else:
|
|
|
|
self.send_status(STATUS_NOT_FOUND, "Not Found")
|
|
|
|
|
|
|
|
def load_file(self, abs_filename: str, mimetype: str):
|
|
|
|
self.send_status(STATUS_SUCCESS, mimetype)
|
|
|
|
with open(abs_filename, "rb") as fp:
|
|
|
|
data = fp.read(1024)
|
|
|
|
while data:
|
|
|
|
yield data
|
|
|
|
data = fp.read(1024)
|
|
|
|
|
|
|
|
def list_directory(self, abs_folder: str):
|
|
|
|
self.send_status(STATUS_SUCCESS, "text/gemini")
|
|
|
|
|
|
|
|
for filename in os.listdir(abs_folder):
|
|
|
|
if filename == ".gemini" or filename.startswith("~"):
|
|
|
|
continue
|
|
|
|
abs_filename = os.path.join(abs_folder, filename)
|
|
|
|
if os.path.isdir(abs_filename):
|
|
|
|
# The directory end slash is necessary for relative paths to work
|
|
|
|
filename += "/"
|
|
|
|
yield f"=>{filename}\r\n".encode()
|
|
|
|
|
|
|
|
def guess_mimetype(self, filename: str):
|
|
|
|
mime, encoding = self.mimetypes.guess_type(filename)
|
|
|
|
if encoding:
|
|
|
|
return f"{mime}; charset={encoding}"
|
|
|
|
elif mime:
|
|
|
|
return mime
|
|
|
|
else:
|
|
|
|
return "text/plain"
|
|
|
|
|
|
|
|
|
2019-08-04 19:52:54 +02:00
|
|
|
class GeminiRequestHandler:
|
|
|
|
"""
|
|
|
|
Handle a single Gemini Protocol TCP request.
|
|
|
|
|
|
|
|
This design borrows heavily from the standard library's HTTP request
|
|
|
|
handler (http.server.BaseHTTPRequestHandler). However, I did not make any
|
|
|
|
attempts to directly emulate the existing conventions, because Gemini is an
|
|
|
|
inherently simpler protocol than HTTP and much of the boilerplate could be
|
|
|
|
removed or slimmed-down.
|
|
|
|
"""
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def __init__(self, server: "GeminiServer", app: typing.Callable) -> None:
|
2019-08-04 19:52:54 +02:00
|
|
|
self.server = server
|
|
|
|
self.app = app
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
self.reader: typing.Optional[asyncio.StreamReader] = None
|
|
|
|
self.writer: typing.Optional[asyncio.StreamWriter] = None
|
2019-08-04 19:52:54 +02:00
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
self.received_timestamp: typing.Optional[datetime.datetime] = None
|
|
|
|
self.client_ip: typing.Optional[str] = None
|
|
|
|
self.client_port: typing.Optional[int] = None
|
|
|
|
self.path: typing.Optional[str] = None
|
|
|
|
self.status: typing.Optional[int] = None
|
|
|
|
self.mimetype: typing.Optional[str] = None
|
|
|
|
self.response_buffer: typing.Optional[str] = None
|
2019-08-04 19:52:54 +02:00
|
|
|
self.response_size: int = 0
|
|
|
|
|
|
|
|
async def handle(
|
|
|
|
self, reader: asyncio.StreamReader, writer: asyncio.StreamWriter
|
|
|
|
) -> None:
|
|
|
|
"""
|
|
|
|
Main method for the request handler, performs the following:
|
|
|
|
|
|
|
|
1. Read the request bytes from the reader stream
|
|
|
|
2. Parse the request and generate response data
|
|
|
|
3. Write the response bytes to the writer stream
|
|
|
|
"""
|
|
|
|
self.reader = reader
|
|
|
|
self.writer = writer
|
|
|
|
self.client_ip, self.client_port = writer.get_extra_info("peername")
|
|
|
|
self.received_timestamp = datetime.datetime.utcnow()
|
|
|
|
|
|
|
|
try:
|
|
|
|
await self.parse_request()
|
|
|
|
except Exception:
|
|
|
|
# Malformed request, throw it away and exit immediately
|
|
|
|
return
|
|
|
|
|
|
|
|
try:
|
|
|
|
environ = self.build_environ()
|
|
|
|
app = self.app(environ, self.write_status)
|
|
|
|
for data in app:
|
2019-08-05 03:42:27 +02:00
|
|
|
await self.write_body(data)
|
2019-08-04 19:52:54 +02:00
|
|
|
|
|
|
|
except Exception as e:
|
|
|
|
self.write_status(STATUS_SERVER_ERROR, str(e))
|
|
|
|
raise
|
|
|
|
|
|
|
|
finally:
|
2019-08-05 03:42:27 +02:00
|
|
|
await self.flush_status()
|
2019-08-04 19:52:54 +02:00
|
|
|
self.log_request()
|
|
|
|
await writer.drain()
|
|
|
|
|
2019-08-06 00:47:59 +02:00
|
|
|
def build_environ(self) -> typing.Dict[str, typing.Any]:
|
2019-08-04 19:52:54 +02:00
|
|
|
"""
|
|
|
|
Construct a dictionary that will be passed to the application handler.
|
|
|
|
"""
|
|
|
|
return {
|
|
|
|
"SERVER_HOST": self.server.host,
|
|
|
|
"SERVER_PORT": self.server.port,
|
2019-08-05 03:42:27 +02:00
|
|
|
"CLIENT_IP": self.client_ip,
|
|
|
|
"CLIENT_PORT": self.client_port,
|
2019-08-04 19:52:54 +02:00
|
|
|
"PATH": self.path,
|
|
|
|
}
|
|
|
|
|
|
|
|
async def parse_request(self) -> None:
|
|
|
|
"""
|
|
|
|
Parse the gemini request line.
|
|
|
|
|
|
|
|
The request is a single UTF-8 line formatted as: <path>\r\n
|
|
|
|
"""
|
|
|
|
data = await self.reader.readuntil(b"\r\n")
|
|
|
|
request = data.decode()
|
|
|
|
self.path = request[:-2] # strip the line ending
|
|
|
|
|
|
|
|
def write_status(self, status: int, mimetype: str) -> None:
|
|
|
|
"""
|
|
|
|
Write the gemini status line to an internal buffer.
|
|
|
|
|
|
|
|
The status line is a single UTF-8 line formatted as:
|
|
|
|
<code>\t<mimetype>\r\n
|
|
|
|
|
|
|
|
If the response status is 2, the mimetype field will contain the type
|
|
|
|
of the response data sent. If the status is something else, the mimetype
|
|
|
|
will contain a descriptive message.
|
|
|
|
|
|
|
|
The status is not written immediately, it's added to an internal buffer
|
|
|
|
that must be flushed. This is done so that the status can be updated as
|
|
|
|
long as no other data has been written to the stream yet.
|
|
|
|
"""
|
|
|
|
self.status = status
|
|
|
|
self.mimetype = mimetype
|
|
|
|
self.response_buffer = f"{status}\t{mimetype}\r\n"
|
|
|
|
|
2019-08-05 03:42:27 +02:00
|
|
|
async def write_body(self, data: bytes) -> None:
|
2019-08-04 19:52:54 +02:00
|
|
|
"""
|
|
|
|
Write bytes to the gemini response body.
|
|
|
|
"""
|
2019-08-05 03:42:27 +02:00
|
|
|
await self.flush_status()
|
2019-08-04 19:52:54 +02:00
|
|
|
self.response_size += len(data)
|
|
|
|
self.writer.write(data)
|
2019-08-05 03:42:27 +02:00
|
|
|
await self.writer.drain()
|
2019-08-04 19:52:54 +02:00
|
|
|
|
2019-08-05 03:42:27 +02:00
|
|
|
async def flush_status(self) -> None:
|
2019-08-04 19:52:54 +02:00
|
|
|
"""
|
|
|
|
Flush the status line from the internal buffer to the socket stream.
|
|
|
|
"""
|
|
|
|
if self.response_buffer and not self.response_size:
|
|
|
|
data = self.response_buffer.encode()
|
|
|
|
self.response_size += len(data)
|
|
|
|
self.writer.write(data)
|
2019-08-05 03:42:27 +02:00
|
|
|
await self.writer.drain()
|
2019-08-04 19:52:54 +02:00
|
|
|
self.response_buffer = None
|
|
|
|
|
|
|
|
def log_request(self) -> None:
|
|
|
|
"""
|
|
|
|
Log a gemini request using a format derived from the Common Log Format.
|
|
|
|
"""
|
|
|
|
self.server.log_message(
|
|
|
|
f"{self.client_ip} "
|
|
|
|
f"[{self.received_timestamp:%d/%b/%Y:%H:%M:%S +0000}] "
|
|
|
|
f'"{self.path}" '
|
|
|
|
f"{self.status} "
|
|
|
|
f'"{self.mimetype}" '
|
|
|
|
f"{self.response_size}"
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
class GeminiServer:
|
|
|
|
"""
|
|
|
|
An asynchronous TCP server that understands the Gemini Protocol.
|
|
|
|
"""
|
|
|
|
|
|
|
|
request_handler_class = GeminiRequestHandler
|
|
|
|
|
|
|
|
def __init__(
|
|
|
|
self,
|
|
|
|
host: str,
|
|
|
|
port: int,
|
2019-08-06 00:47:59 +02:00
|
|
|
ssl_context: typing.Union[tuple, ssl.SSLContext],
|
|
|
|
app: typing.Callable,
|
2019-08-04 19:52:54 +02:00
|
|
|
) -> None:
|
2019-08-05 03:42:27 +02:00
|
|
|
|
2019-08-04 19:52:54 +02:00
|
|
|
self.host = host
|
|
|
|
self.port = port
|
|
|
|
self.app = app
|
|
|
|
if isinstance(ssl_context, tuple):
|
|
|
|
self.ssl_context = ssl.SSLContext()
|
|
|
|
self.ssl_context.load_cert_chain(*ssl_context)
|
|
|
|
else:
|
|
|
|
self.ssl_context = ssl_context
|
|
|
|
|
|
|
|
async def run(self) -> None:
|
|
|
|
"""
|
|
|
|
The main asynchronous server loop.
|
|
|
|
"""
|
|
|
|
self.log_message(ABOUT)
|
|
|
|
server = await asyncio.start_server(
|
|
|
|
self.accept_connection, self.host, self.port, ssl=self.ssl_context
|
|
|
|
)
|
|
|
|
|
|
|
|
socket_info = server.sockets[0].getsockname()
|
2019-08-05 03:42:27 +02:00
|
|
|
self.log_message(f"Listening on {socket_info[0]}:{socket_info[1]}")
|
2019-08-04 19:52:54 +02:00
|
|
|
|
|
|
|
async with server:
|
|
|
|
await server.serve_forever()
|
|
|
|
|
|
|
|
async def accept_connection(
|
|
|
|
self, reader: asyncio.StreamReader, writer: asyncio.StreamWriter
|
|
|
|
):
|
|
|
|
"""
|
|
|
|
Hook called by the socket server when a new connection is accepted.
|
|
|
|
"""
|
|
|
|
request_handler = self.request_handler_class(self, self.app)
|
|
|
|
try:
|
|
|
|
await request_handler.handle(reader, writer)
|
|
|
|
finally:
|
|
|
|
writer.close()
|
|
|
|
|
|
|
|
def log_message(self, message: str):
|
|
|
|
"""
|
|
|
|
Log a diagnostic server message.
|
|
|
|
"""
|
|
|
|
print(message, file=sys.stderr)
|
|
|
|
|
|
|
|
|
2019-08-04 20:11:22 +02:00
|
|
|
def run_server():
|
|
|
|
parser = argparse.ArgumentParser(
|
|
|
|
prog="jetforce",
|
|
|
|
description="An Experimental Gemini Protocol Server",
|
|
|
|
formatter_class=argparse.ArgumentDefaultsHelpFormatter,
|
|
|
|
)
|
2019-08-05 04:01:10 +02:00
|
|
|
parser.add_argument("--host", help="server host", default="127.0.0.1")
|
|
|
|
parser.add_argument("--port", help="server port", type=int, default=1965)
|
2019-08-05 03:42:27 +02:00
|
|
|
parser.add_argument(
|
|
|
|
"--dir",
|
2019-08-05 04:01:10 +02:00
|
|
|
help="local directory to serve files from",
|
2019-08-05 03:42:27 +02:00
|
|
|
type=str,
|
|
|
|
default=StaticDirectoryApp.root,
|
|
|
|
)
|
2019-08-04 20:11:22 +02:00
|
|
|
parser.add_argument(
|
|
|
|
"--tls-certfile",
|
|
|
|
help="TLS certificate file",
|
|
|
|
metavar="FILE",
|
|
|
|
default="localhost.crt",
|
|
|
|
)
|
|
|
|
parser.add_argument(
|
|
|
|
"--tls-keyfile",
|
|
|
|
help="TLS private key file",
|
|
|
|
metavar="FILE",
|
|
|
|
default="localhost.key",
|
|
|
|
)
|
2019-08-04 19:52:54 +02:00
|
|
|
args = parser.parse_args()
|
|
|
|
|
2019-08-05 03:42:27 +02:00
|
|
|
StaticDirectoryApp.root = args.dir
|
|
|
|
|
2019-08-04 19:52:54 +02:00
|
|
|
server = GeminiServer(
|
|
|
|
host=args.host,
|
|
|
|
port=args.port,
|
2019-08-04 20:11:22 +02:00
|
|
|
ssl_context=(args.tls_certfile, args.tls_keyfile),
|
2019-08-05 03:42:27 +02:00
|
|
|
app=StaticDirectoryApp,
|
2019-08-04 19:52:54 +02:00
|
|
|
)
|
|
|
|
asyncio.run(server.run())
|
2019-08-04 20:11:22 +02:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
run_server()
|