basic markdown and reverse proxy implementation
This commit is contained in:
parent
2c122cabb5
commit
00349fabfe
|
@ -11,7 +11,8 @@ import sys
|
||||||
from .__version__ import __version__
|
from .__version__ import __version__
|
||||||
from .app.base import RateLimiter
|
from .app.base import RateLimiter
|
||||||
from .app.static import StaticDirectoryApplication
|
from .app.static import StaticDirectoryApplication
|
||||||
from .server import GeminiServer
|
from .app.static_md import StaticMarkdownDirectoryApplication
|
||||||
|
from .server import GeminiServer, ReverseProxyGeminiServer
|
||||||
|
|
||||||
if sys.version_info < (3, 7):
|
if sys.version_info < (3, 7):
|
||||||
sys.exit("Fatal Error: jetforce requires Python 3.7+")
|
sys.exit("Fatal Error: jetforce requires Python 3.7+")
|
||||||
|
@ -104,18 +105,44 @@ group.add_argument(
|
||||||
default=None,
|
default=None,
|
||||||
dest="rate_limit",
|
dest="rate_limit",
|
||||||
)
|
)
|
||||||
|
group.add_argument(
|
||||||
|
"--reverse-proxy",
|
||||||
|
help="Enable reverse proxy mode where TLS is handled by a reverse proxy such as Nginx",
|
||||||
|
action='store_true',
|
||||||
|
default=False,
|
||||||
|
dest="reverse_proxy",
|
||||||
|
)
|
||||||
|
group.add_argument(
|
||||||
|
"--markdown",
|
||||||
|
help="Enable markdown to gemini mode.",
|
||||||
|
action='store_true',
|
||||||
|
default=False,
|
||||||
|
dest="markdown",
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
def main() -> None:
|
def main() -> None:
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
rate_limiter = RateLimiter(args.rate_limit) if args.rate_limit else None
|
rate_limiter = RateLimiter(args.rate_limit) if args.rate_limit else None
|
||||||
app = StaticDirectoryApplication(
|
if args.markdown:
|
||||||
|
app_class = StaticMarkdownDirectoryApplication
|
||||||
|
else:
|
||||||
|
app_class = StaticDirectoryApplication
|
||||||
|
app = app_class(
|
||||||
root_directory=args.root_directory,
|
root_directory=args.root_directory,
|
||||||
index_file=args.index_file,
|
index_file=args.index_file,
|
||||||
cgi_directory=args.cgi_directory,
|
cgi_directory=args.cgi_directory,
|
||||||
default_lang=args.default_lang,
|
default_lang=args.default_lang,
|
||||||
rate_limiter=rate_limiter,
|
rate_limiter=rate_limiter,
|
||||||
)
|
)
|
||||||
|
if args.reverse_proxy:
|
||||||
|
server = ReverseProxyGeminiServer(
|
||||||
|
app=app,
|
||||||
|
host=args.host,
|
||||||
|
port=args.port,
|
||||||
|
hostname=args.hostname,
|
||||||
|
)
|
||||||
|
else:
|
||||||
server = GeminiServer(
|
server = GeminiServer(
|
||||||
app=app,
|
app=app,
|
||||||
host=args.host,
|
host=args.host,
|
||||||
|
|
|
@ -0,0 +1,154 @@
|
||||||
|
import typing
|
||||||
|
import os
|
||||||
|
import pathlib
|
||||||
|
import md2gemini
|
||||||
|
from .static import StaticDirectoryApplication
|
||||||
|
|
||||||
|
from .base import (
|
||||||
|
Request,
|
||||||
|
Response,
|
||||||
|
Status,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
class StaticMarkdownDirectoryApplication(StaticDirectoryApplication):
|
||||||
|
def __init__(self, *args, **kwargs):
|
||||||
|
super().__init__(*args, **kwargs)
|
||||||
|
|
||||||
|
def serve_static_file(self, request: Request) -> Response:
|
||||||
|
"""
|
||||||
|
Convert a URL into a filesystem path, and attempt to serve the file
|
||||||
|
or directory that is represented at that path.
|
||||||
|
"""
|
||||||
|
url_path = pathlib.Path(request.path.strip("/"))
|
||||||
|
|
||||||
|
filename = pathlib.Path(os.path.normpath(str(url_path)))
|
||||||
|
if filename.is_absolute() or str(filename).startswith(".."):
|
||||||
|
# Guard against breaking out of the directory
|
||||||
|
return Response(Status.NOT_FOUND, "Not Found")
|
||||||
|
|
||||||
|
if str(filename).startswith(self.cgi_directory):
|
||||||
|
# CGI needs special treatment to account for extra-path
|
||||||
|
# PATH_INFO component (RFC 3875 section 4.1.5)
|
||||||
|
|
||||||
|
# Identify the shortest path that is not a directory
|
||||||
|
for i in range(2, len(filename.parts) + 1):
|
||||||
|
# Split the path into SCRIPT_NAME and PATH_INFO
|
||||||
|
script_name = pathlib.Path(*filename.parts[:i])
|
||||||
|
path_info = pathlib.Path(*filename.parts[i:])
|
||||||
|
|
||||||
|
filesystem_path = self.root / script_name
|
||||||
|
try:
|
||||||
|
if not filesystem_path.is_file():
|
||||||
|
continue
|
||||||
|
elif not os.access(filesystem_path, os.R_OK):
|
||||||
|
continue
|
||||||
|
elif not os.access(filesystem_path, os.X_OK):
|
||||||
|
continue
|
||||||
|
else:
|
||||||
|
if str(script_name) == ".":
|
||||||
|
request.environ["SCRIPT_NAME"] = ""
|
||||||
|
else:
|
||||||
|
request.environ["SCRIPT_NAME"] = f"/{script_name}"
|
||||||
|
|
||||||
|
if str(path_info) == ".":
|
||||||
|
request.environ["PATH_INFO"] = ""
|
||||||
|
else:
|
||||||
|
request.environ["PATH_INFO"] = f"/{path_info}"
|
||||||
|
|
||||||
|
# Add back the trailing slash that was stripped off
|
||||||
|
if request.path.endswith("/"):
|
||||||
|
request.environ["PATH_INFO"] += "/"
|
||||||
|
|
||||||
|
return self.run_cgi_script(filesystem_path, request.environ)
|
||||||
|
|
||||||
|
except OSError:
|
||||||
|
# Filename too large, etc.
|
||||||
|
return Response(Status.NOT_FOUND, "Not Found")
|
||||||
|
|
||||||
|
filesystem_path = self.root / filename
|
||||||
|
|
||||||
|
try:
|
||||||
|
if not os.access(filesystem_path, os.R_OK):
|
||||||
|
# File not readable
|
||||||
|
return Response(Status.NOT_FOUND, "Not Found")
|
||||||
|
except OSError:
|
||||||
|
# Filename too large, etc.
|
||||||
|
return Response(Status.NOT_FOUND, "Not Found")
|
||||||
|
|
||||||
|
if filesystem_path.is_file():
|
||||||
|
return self.generate_response(filesystem_path)
|
||||||
|
|
||||||
|
elif filesystem_path.is_dir():
|
||||||
|
if request.path and not request.path.endswith("/"):
|
||||||
|
url_parts = urllib.parse.urlparse(request.url)
|
||||||
|
# noinspection PyProtectedMember
|
||||||
|
url_parts = url_parts._replace(path=request.path + "/")
|
||||||
|
return Response(Status.REDIRECT_PERMANENT, url_parts.geturl())
|
||||||
|
|
||||||
|
index_file = filesystem_path / self.index_file
|
||||||
|
if index_file.exists():
|
||||||
|
return self.generate_response(index_file)
|
||||||
|
|
||||||
|
mimetype = self.add_extra_parameters("text/gemini")
|
||||||
|
generator = self.list_directory(url_path, filesystem_path)
|
||||||
|
return Response(Status.SUCCESS, mimetype, generator)
|
||||||
|
|
||||||
|
else:
|
||||||
|
return Response(Status.NOT_FOUND, "Not Found")
|
||||||
|
|
||||||
|
def generate_response(self, filesystem_path: pathlib.Path) -> typing.Iterator:
|
||||||
|
mimetype = self.guess_mimetype(filesystem_path.name)
|
||||||
|
if mimetype == "text/markdown":
|
||||||
|
generator = self._load_md_file(filesystem_path)
|
||||||
|
mimetype = self.add_extra_parameters("text/gemini")
|
||||||
|
elif mimetype == "text/gemini":
|
||||||
|
generator = self.load_file(filesystem_path)
|
||||||
|
mimetype = self.add_extra_parameters("text/gemini")
|
||||||
|
else:
|
||||||
|
generator = self.load_file(filesystem_path)
|
||||||
|
mimetype = self.add_extra_parameters(mimetype)
|
||||||
|
return Response(Status.SUCCESS, mimetype, generator)
|
||||||
|
|
||||||
|
def _load_md_file(self, filesystem_path: pathlib.Path) -> typing.Iterator[bytes]:
|
||||||
|
with filesystem_path.open("r") as fp:
|
||||||
|
gemini = md2gemini.md2gemini(fp.read(), links="paragraph")
|
||||||
|
gemini = gemini.encode()
|
||||||
|
chunks = int(len(gemini) / self.CHUNK_SIZE) + 1
|
||||||
|
for i in range(chunks):
|
||||||
|
start = self.CHUNK_SIZE * (i)
|
||||||
|
end = self.CHUNK_SIZE * (i + 1)
|
||||||
|
yield gemini[start:end]
|
||||||
|
|
||||||
|
def list_directory(
|
||||||
|
self, url_path: pathlib.Path, filesystem_path: pathlib.Path
|
||||||
|
) -> typing.Iterator[bytes]:
|
||||||
|
"""
|
||||||
|
Auto-generate a text/gemini document based on the contents of the file system.
|
||||||
|
"""
|
||||||
|
buffer = f"Directory: /{url_path}\r\n".encode()
|
||||||
|
if url_path.parent != url_path:
|
||||||
|
buffer += f"=>/{url_path.parent}\t..\r\n".encode()
|
||||||
|
|
||||||
|
for file in sorted(filesystem_path.iterdir()):
|
||||||
|
if file.name.startswith("."):
|
||||||
|
# Skip hidden directories/files that may contain sensitive info
|
||||||
|
continue
|
||||||
|
|
||||||
|
encoded_path = urllib.parse.quote(str(url_path / file.name))
|
||||||
|
if file.is_dir():
|
||||||
|
buffer += f"=>/{encoded_path}/\t{file.name}/\r\n".encode()
|
||||||
|
else:
|
||||||
|
if file.stem.isdigit():
|
||||||
|
tz = pytz.timezone("Europe/Brussels")
|
||||||
|
label = datetime.datetime.fromtimestamp(int(file.stem), tz=tz)
|
||||||
|
else:
|
||||||
|
label = f"{file.name}"
|
||||||
|
buffer += f"=>/{encoded_path}\t{label}\r\n".encode()
|
||||||
|
|
||||||
|
if len(buffer) >= self.CHUNK_SIZE:
|
||||||
|
data, buffer = buffer[: self.CHUNK_SIZE], buffer[self.CHUNK_SIZE :]
|
||||||
|
yield data
|
||||||
|
|
||||||
|
if buffer:
|
||||||
|
yield buffer
|
|
@ -302,3 +302,30 @@ class GeminiProtocol(LineOnlyReceiver):
|
||||||
pass
|
pass
|
||||||
else:
|
else:
|
||||||
self.server.log_access(message)
|
self.server.log_access(message)
|
||||||
|
|
||||||
|
|
||||||
|
class ReverseProxyGeminiProtocol(GeminiProtocol):
|
||||||
|
def __init__(self, *args, **kwargs):
|
||||||
|
super().__init__(*args, **kwargs)
|
||||||
|
|
||||||
|
def build_environ(self) -> EnvironDict:
|
||||||
|
"""
|
||||||
|
Construct a dictionary that will be passed to the application handler.
|
||||||
|
|
||||||
|
Variable names (mostly) conform to the CGI spec defined in RFC 3875.
|
||||||
|
The TLS variable names borrow from the GLV-1.12556 server.
|
||||||
|
"""
|
||||||
|
url_parts = urllib.parse.urlparse(self.url)
|
||||||
|
environ = {
|
||||||
|
"GEMINI_URL": self.url,
|
||||||
|
"HOSTNAME": self.server.hostname,
|
||||||
|
"QUERY_STRING": url_parts.query,
|
||||||
|
"REMOTE_ADDR": self.client_addr.host,
|
||||||
|
"REMOTE_HOST": self.client_addr.host,
|
||||||
|
"SERVER_NAME": self.server.hostname,
|
||||||
|
"SERVER_PORT": self.server.port,
|
||||||
|
"SERVER_PROTOCOL": "GEMINI",
|
||||||
|
"SERVER_SOFTWARE": f"jetforce/{__version__}",
|
||||||
|
"client_certificate": None,
|
||||||
|
}
|
||||||
|
return environ
|
||||||
|
|
|
@ -6,13 +6,13 @@ import typing
|
||||||
|
|
||||||
from twisted.internet import reactor as _reactor
|
from twisted.internet import reactor as _reactor
|
||||||
from twisted.internet.base import ReactorBase
|
from twisted.internet.base import ReactorBase
|
||||||
from twisted.internet.endpoints import SSL4ServerEndpoint
|
from twisted.internet.endpoints import SSL4ServerEndpoint, TCP4ServerEndpoint
|
||||||
from twisted.internet.protocol import Factory
|
from twisted.internet.protocol import Factory
|
||||||
from twisted.internet.tcp import Port
|
from twisted.internet.tcp import Port
|
||||||
|
|
||||||
from .__version__ import __version__
|
from .__version__ import __version__
|
||||||
from .app.base import ApplicationCallable
|
from .app.base import ApplicationCallable
|
||||||
from .protocol import GeminiProtocol
|
from .protocol import GeminiProtocol, ReverseProxyGeminiProtocol
|
||||||
from .tls import GeminiCertificateOptions, generate_ad_hoc_certificate
|
from .tls import GeminiCertificateOptions, generate_ad_hoc_certificate
|
||||||
|
|
||||||
if sys.stderr.isatty():
|
if sys.stderr.isatty():
|
||||||
|
@ -136,3 +136,24 @@ class GeminiServer(Factory):
|
||||||
self.log_message(f"TLS Private Key File: {self.keyfile}")
|
self.log_message(f"TLS Private Key File: {self.keyfile}")
|
||||||
self.initialize()
|
self.initialize()
|
||||||
self.reactor.run()
|
self.reactor.run()
|
||||||
|
|
||||||
|
|
||||||
|
class ReverseProxyGeminiServer(GeminiServer):
|
||||||
|
protocol_class = ReverseProxyGeminiProtocol
|
||||||
|
endpoint_class = TCP4ServerEndpoint
|
||||||
|
|
||||||
|
def __init__(self, *args, **kwargs):
|
||||||
|
super().__init__(*args, **kwargs, certfile=False)
|
||||||
|
|
||||||
|
def initialize(self) -> None:
|
||||||
|
"""
|
||||||
|
Install the server into the twisted reactor.
|
||||||
|
"""
|
||||||
|
interfaces = [self.host] if self.host else ["0.0.0.0", "::"]
|
||||||
|
for interface in interfaces:
|
||||||
|
endpoint = self.endpoint_class(
|
||||||
|
reactor=self.reactor,
|
||||||
|
port=self.port,
|
||||||
|
interface=interface,
|
||||||
|
)
|
||||||
|
endpoint.listen(self).addCallback(self.on_bind_interface)
|
||||||
|
|
Loading…
Reference in New Issue