mirror of https://github.com/xvxx/phetch
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
436 lines
13 KiB
Rust
436 lines
13 KiB
Rust
//! phetch's Gopher library contains a few phetch-specific features:
|
|
//! the ability to make requests or downloads over TLS or Tor,
|
|
//! cleaning Unicode control characters from Gopher responses, and
|
|
//! URL parsing that recognizes different protocols like telnet and
|
|
//! IPv6 addresses.
|
|
|
|
use std::{
|
|
io::{Read, Result, Write},
|
|
net::TcpStream,
|
|
net::ToSocketAddrs,
|
|
os::unix::fs::OpenOptionsExt,
|
|
time::Duration,
|
|
};
|
|
use termion::input::TermRead;
|
|
|
|
#[cfg(feature = "tor")]
|
|
use tor_stream::TorStream;
|
|
|
|
#[cfg(feature = "tls")]
|
|
use native_tls::TlsConnector;
|
|
|
|
mod r#type;
|
|
pub use self::r#type::Type;
|
|
|
|
/// Some Gopher servers can be kind of slow, we may want to up this or
|
|
/// make it configurable eventually.
|
|
pub const TCP_TIMEOUT_IN_SECS: u64 = 8;
|
|
/// Based on `TCP_TIMEOUT_IN_SECS` but a `Duration` type.
|
|
pub const TCP_TIMEOUT_DURATION: Duration = Duration::from_secs(TCP_TIMEOUT_IN_SECS);
|
|
|
|
trait ReadWrite: Read + Write {}
|
|
impl<T: Read + Write> ReadWrite for T {}
|
|
|
|
/// Wrapper for TLS and regular TCP streams.
|
|
pub struct Stream {
|
|
io: Box<dyn ReadWrite>,
|
|
tls: bool,
|
|
}
|
|
|
|
impl Stream {
|
|
fn is_tls(&self) -> bool {
|
|
self.tls
|
|
}
|
|
}
|
|
|
|
impl Read for Stream {
|
|
fn read(&mut self, buf: &mut [u8]) -> Result<usize> {
|
|
self.io.read(buf)
|
|
}
|
|
}
|
|
|
|
impl Write for Stream {
|
|
fn write(&mut self, buf: &[u8]) -> Result<usize> {
|
|
self.io.write(buf)
|
|
}
|
|
|
|
fn flush(&mut self) -> Result<()> {
|
|
self.io.flush()
|
|
}
|
|
}
|
|
|
|
/// Gopher URL. Returned by `parse_url()`.
|
|
pub struct Url<'a> {
|
|
/// Gopher Type
|
|
pub typ: Type,
|
|
/// Hostname
|
|
pub host: &'a str,
|
|
/// Port. Defaults to 70
|
|
pub port: &'a str,
|
|
/// Selector
|
|
pub sel: &'a str,
|
|
}
|
|
|
|
/// Fetches a gopher URL and returns a tuple of:
|
|
/// (did tls work?, raw Gopher response)
|
|
pub fn fetch_url(url: &str, tls: bool, tor: bool) -> Result<(bool, String)> {
|
|
let u = parse_url(url);
|
|
fetch(u.host, u.port, u.sel, tls, tor)
|
|
}
|
|
|
|
/// Fetches a gopher URL by its component parts and returns a tuple of:
|
|
/// (did tls work?, raw Gopher response)
|
|
pub fn fetch(
|
|
host: &str,
|
|
port: &str,
|
|
selector: &str,
|
|
tls: bool,
|
|
tor: bool,
|
|
) -> Result<(bool, String)> {
|
|
let mut stream = request(host, port, selector, tls, tor)?;
|
|
let mut body = Vec::new();
|
|
stream.read_to_end(&mut body)?;
|
|
let out = clean_response(&String::from_utf8_lossy(&body));
|
|
Ok((stream.is_tls(), out))
|
|
}
|
|
|
|
/// Removes unprintable characters from Gopher response.
|
|
/// https://en.wikipedia.org/wiki/Control_character#In_Unicode
|
|
fn clean_response(res: &str) -> String {
|
|
res.chars()
|
|
.map(|c| match c {
|
|
'\u{007F}' => '?',
|
|
_ if c >= '\u{0080}' && c <= '\u{009F}' => '?',
|
|
c => c,
|
|
})
|
|
.collect()
|
|
}
|
|
|
|
/// Downloads a binary to disk. Allows canceling with Ctrl-c.
|
|
/// Returns a tuple of:
|
|
/// (path it was saved to, the size in bytes)
|
|
pub fn download_url(url: &str, tls: bool, tor: bool) -> Result<(String, usize)> {
|
|
let u = parse_url(url);
|
|
let filename = u
|
|
.sel
|
|
.split_terminator('/')
|
|
.rev()
|
|
.nth(0)
|
|
.ok_or_else(|| error!("Bad download filename: {}", u.sel))?;
|
|
let mut path = std::path::PathBuf::from(".");
|
|
path.push(filename);
|
|
let stdin = termion::async_stdin();
|
|
let mut keys = stdin.keys();
|
|
|
|
let mut stream = request(u.host, u.port, u.sel, tls, tor)?;
|
|
let mut file = std::fs::OpenOptions::new()
|
|
.write(true)
|
|
.create(true)
|
|
.truncate(true)
|
|
.mode(0o770)
|
|
.open(path)?;
|
|
|
|
let mut buf = [0; 1024];
|
|
let mut bytes = 0;
|
|
while let Ok(count) = stream.read(&mut buf) {
|
|
if count == 0 {
|
|
break;
|
|
}
|
|
bytes += count;
|
|
file.write_all(&buf[..count])?;
|
|
if let Some(Ok(termion::event::Key::Ctrl('c'))) = keys.next() {
|
|
return Err(error!("Download cancelled"));
|
|
}
|
|
}
|
|
Ok((filename.to_string(), bytes))
|
|
}
|
|
|
|
/// Make a Gopher request and return a TcpStream ready to be read()'d.
|
|
/// Will attempt a TLS connection first, then retry a regular
|
|
/// connection if it fails.
|
|
pub fn request(host: &str, port: &str, selector: &str, tls: bool, tor: bool) -> Result<Stream> {
|
|
let selector = selector.replace('?', "\t"); // search queries
|
|
let sock = format!("{}:{}", host, port)
|
|
.to_socket_addrs()
|
|
.and_then(|mut socks| socks.next().ok_or_else(|| error!("Can't create socket")))?;
|
|
|
|
// attempt tls connection
|
|
if tls {
|
|
#[cfg(feature = "tls")]
|
|
{
|
|
{
|
|
if let Ok(connector) = TlsConnector::new() {
|
|
let stream = TcpStream::connect_timeout(&sock, TCP_TIMEOUT_DURATION)?;
|
|
stream.set_read_timeout(Some(TCP_TIMEOUT_DURATION))?;
|
|
if let Ok(mut stream) = connector.connect(host, stream) {
|
|
stream.write_all(selector.as_ref());
|
|
stream.write_all("\r\n".as_ref());
|
|
return Ok(Stream {
|
|
io: Box::new(stream),
|
|
tls: true,
|
|
});
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// tls didn't work or wasn't selected, try Tor or default
|
|
if tor {
|
|
#[cfg(feature = "tor")]
|
|
{
|
|
let proxy = std::env::var("TOR_PROXY")
|
|
.unwrap_or_else(|_| "127.0.0.1:9050".into())
|
|
.to_socket_addrs()?
|
|
.nth(0)
|
|
.unwrap();
|
|
let mut stream = match TorStream::connect_with_address(proxy, sock) {
|
|
Ok(s) => s,
|
|
Err(e) => return Err(error!("Tor error: {}", e)),
|
|
};
|
|
stream.write_all(selector.as_ref());
|
|
stream.write_all("\r\n".as_ref());
|
|
return Ok(Stream {
|
|
io: Box::new(stream),
|
|
tls: false,
|
|
});
|
|
}
|
|
}
|
|
|
|
// no tls or tor, try regular connection
|
|
let mut stream = TcpStream::connect_timeout(&sock, TCP_TIMEOUT_DURATION)?;
|
|
stream.set_read_timeout(Some(TCP_TIMEOUT_DURATION))?;
|
|
stream.write_all(selector.as_ref());
|
|
stream.write_all("\r\n".as_ref());
|
|
Ok(Stream {
|
|
io: Box::new(stream),
|
|
tls: false,
|
|
})
|
|
}
|
|
|
|
impl<'a> Url<'a> {
|
|
/// Creates a new Gopher Url quickly from a tuple of Url fields.
|
|
pub fn new(typ: Type, host: &'a str, port: &'a str, sel: &'a str) -> Url<'a> {
|
|
Url {
|
|
typ,
|
|
host,
|
|
port,
|
|
sel,
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Given a Gopher URL, returns a gopher::Type.
|
|
pub fn type_for_url(url: &str) -> Type {
|
|
if url.starts_with("telnet://") {
|
|
return Type::Telnet;
|
|
}
|
|
|
|
if url.starts_with("URL:") || url.starts_with("/URL:") {
|
|
return Type::HTML;
|
|
}
|
|
|
|
if let Some(idx) = url.find('/') {
|
|
if let Some(t) = url.chars().nth(idx + 1) {
|
|
return Type::from(t).unwrap_or(Type::Menu);
|
|
}
|
|
}
|
|
|
|
Type::Menu
|
|
}
|
|
|
|
/// Parses gopher URL into parts.
|
|
/// Returns (Type, host, port, sel)
|
|
pub fn parse_url<'a>(url: &'a str) -> Url<'a> {
|
|
let mut url = url.trim_start_matches("gopher://");
|
|
let mut typ = Type::Menu;
|
|
let mut host;
|
|
let mut port = "70";
|
|
let mut sel = "";
|
|
|
|
// simple URLs, ex: "dog.com"
|
|
if !url.contains(':') && !url.contains('/') {
|
|
return Url::new(Type::Menu, url, "70", "");
|
|
}
|
|
|
|
// telnet urls
|
|
if url.starts_with("telnet://") {
|
|
typ = Type::Telnet;
|
|
url = url.trim_start_matches("telnet://");
|
|
} else if url.contains("://") {
|
|
// non-gopher URLs, stick everything in selector
|
|
return Url::new(Type::HTML, "", "", url);
|
|
}
|
|
|
|
// check selector first
|
|
if let Some(idx) = url.find('/') {
|
|
host = &url[..idx];
|
|
sel = &url[idx..];
|
|
} else {
|
|
host = &url;
|
|
}
|
|
|
|
// ipv6
|
|
if let Some(idx) = host.find('[') {
|
|
if let Some(end) = host[idx + 1..].find(']') {
|
|
host = &host[idx + 1..=end];
|
|
if host.len() > end {
|
|
if let Some(idx) = host[end..].find(':') {
|
|
port = &host[idx + 1..];
|
|
}
|
|
}
|
|
} else {
|
|
return Url::new(Type::Error, "Unclosed ipv6 bracket", "", url);
|
|
}
|
|
} else if let Some(idx) = host.find(':') {
|
|
// two :'s == probably ipv6
|
|
if host.len() > idx + 1 && !host[idx + 1..].contains(':') {
|
|
// regular hostname w/ port -- grab port
|
|
port = &host[idx + 1..];
|
|
host = &host[..idx];
|
|
}
|
|
}
|
|
|
|
// ignore type prefix on selector
|
|
if typ != Type::Telnet {
|
|
let mut chars = sel.chars();
|
|
if let (Some('/'), Some(c)) = (chars.nth(0), chars.nth(0)) {
|
|
if let Some(t) = Type::from(c) {
|
|
typ = t;
|
|
sel = &sel[2..];
|
|
}
|
|
}
|
|
}
|
|
|
|
Url::new(typ, host, port, sel)
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use super::*;
|
|
|
|
#[test]
|
|
fn test_simple_parse() {
|
|
let urls = vec![
|
|
"gopher://gopher.club/1/phlogs/",
|
|
"gopher://sdf.org:7777/1/maps",
|
|
"gopher.floodgap.org",
|
|
"gopher.floodgap.com/0/gopher/relevance.txt",
|
|
"gopher://gopherpedia.com/7/lookup?Gopher",
|
|
"gopher://dead:beef:1234:5678:9012:3456:feed:deed",
|
|
"gopher://[1234:2345:dead:4567:7890:1234:beef:1111]:7443/1/files",
|
|
"gopher://2001:cdba:0000:0000:0000:0000:3257:9121",
|
|
"[2001:cdba::3257:9652]",
|
|
"gopher://9999:aaaa::abab:baba:aaaa:9999",
|
|
"[2001:2099:dead:beef:0000",
|
|
"::1",
|
|
"ssh://kiosk@bitreich.org",
|
|
"https://github.com/xvxx/phetch",
|
|
"telnet://bbs.impakt.net:6502/",
|
|
];
|
|
|
|
let url = parse_url(urls[0]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "gopher.club");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "/phlogs/");
|
|
|
|
let url = parse_url(urls[1]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "sdf.org");
|
|
assert_eq!(url.port, "7777");
|
|
assert_eq!(url.sel, "/maps");
|
|
|
|
let url = parse_url(urls[2]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "gopher.floodgap.org");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[3]);
|
|
assert_eq!(url.typ, Type::Text);
|
|
assert_eq!(url.host, "gopher.floodgap.com");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "/gopher/relevance.txt");
|
|
|
|
let url = parse_url(urls[4]);
|
|
assert_eq!(url.typ, Type::Search);
|
|
assert_eq!(url.host, "gopherpedia.com");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "/lookup?Gopher");
|
|
|
|
let url = parse_url(urls[5]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "dead:beef:1234:5678:9012:3456:feed:deed");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[6]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "1234:2345:dead:4567:7890:1234:beef:1111");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "/files");
|
|
|
|
let url = parse_url(urls[7]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "2001:cdba:0000:0000:0000:0000:3257:9121");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[8]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "2001:cdba::3257:9652");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[9]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "9999:aaaa::abab:baba:aaaa:9999");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[10]);
|
|
assert_eq!(url.typ, Type::Error);
|
|
assert_eq!(url.host, "Unclosed ipv6 bracket");
|
|
assert_eq!(url.port, "");
|
|
assert_eq!(url.sel, "[2001:2099:dead:beef:0000");
|
|
|
|
let url = parse_url(urls[11]);
|
|
assert_eq!(url.typ, Type::Menu);
|
|
assert_eq!(url.host, "::1");
|
|
assert_eq!(url.port, "70");
|
|
assert_eq!(url.sel, "");
|
|
|
|
let url = parse_url(urls[12]);
|
|
assert_eq!(url.typ, Type::HTML);
|
|
assert_eq!(url.host, "");
|
|
assert_eq!(url.port, "");
|
|
assert_eq!(url.sel, "ssh://kiosk@bitreich.org");
|
|
|
|
let url = parse_url(urls[13]);
|
|
assert_eq!(url.typ, Type::HTML);
|
|
assert_eq!(url.host, "");
|
|
assert_eq!(url.port, "");
|
|
assert_eq!(url.sel, "https://github.com/xvxx/phetch");
|
|
|
|
let url = parse_url(urls[14]);
|
|
assert_eq!(url.typ, Type::Telnet);
|
|
assert_eq!(url.host, "bbs.impakt.net");
|
|
assert_eq!(url.port, "6502");
|
|
assert_eq!(url.sel, "/");
|
|
}
|
|
|
|
#[test]
|
|
fn test_type_for_url() {
|
|
assert_eq!(type_for_url("phkt.io"), Type::Menu);
|
|
assert_eq!(type_for_url("phkt.io/1"), Type::Menu);
|
|
assert_eq!(type_for_url("phkt.io/1/"), Type::Menu);
|
|
assert_eq!(type_for_url("phkt.io/0/info.txt"), Type::Text);
|
|
assert_eq!(type_for_url("URL:https://google.com"), Type::HTML);
|
|
assert_eq!(
|
|
type_for_url("telnet://bbs.inter.net:6502/connect"),
|
|
Type::Telnet
|
|
);
|
|
}
|
|
}
|