Compare commits

..

3 Commits

Author SHA1 Message Date
ca9d4cfaf9 readme 2025-04-03 23:19:21 +01:00
1321e0dcaf works ish 2025-04-03 22:15:38 +01:00
a7468d3f40 Gemini version 2025-04-03 21:42:37 +01:00
3 changed files with 167 additions and 179 deletions

View File

@ -1,20 +1,24 @@
# Markdown web browser # Markdown web browser
A web browser that lets you browse 'mttp' websites that use markdown as a superior standard to html A web browser that lets you browse gemini capsules that use gemtext as a superior standard to html.
Fully static!
# Getting a website on this # Requirements
The default port is 3477, though you can use any port as long as you specify it in the url. - gemget
You need a <!DOCTYPE md> tag at the start of any markdown files so the browser knows which files are markdown and which are other generic text files.
# Installing
## Build from source:
- Clone the repo
```cargo run -r```
# Help # Help
Type h in the program to see this text: Type h in the program to see this text:
``` ```
Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser
q: quit q: quit
d: debug info
h: help h: help
r: reload r: reload
s: view source code of page s: view source code of page
i: visit root index of this host eg: root index of mttp://deadvey.com/blog/4.md is just deadvey.com i: visit root index of this host eg: root index of gemini://deadvey.com/blog/4.md is just gemini://deadvey.com
b: go back in history b: go back in history
f: go forward in history f: go forward in history
ox: print the hyprlink of reference x eg: o5 or o24 ox: print the hyprlink of reference x eg: o5 or o24
@ -25,6 +29,8 @@ ox: print the hyprlink of reference x eg: o5 or o24
![screenshot](/images/screenshot.png) ![screenshot](/images/screenshot.png)
# TO DO # TO DO
- Make pages scrollable
- Bookmarks
- Properly comment it because I can't lie I can't even follow it. - Properly comment it because I can't lie I can't even follow it.
- Make it memory safe, it crashes if the input is unexpected. - Make it memory safe, it crashes if the input is unexpected.
- Use treesitter instead of Regex, because, reasons. - Use treesitter instead of Regex, because, reasons.

View File

@ -1,189 +1,72 @@
use std::process::{Command}; use std::process::{Command};
use std::io::{stdin,stdout,Write}; use std::io::{stdin,stdout,Write};
use colored::Colorize; use colored::Colorize;
use regex::Regex;
use url::{Url, ParseError}; use url::{Url, ParseError};
use std::fs;
const DEBUG_MODE: bool = false;
// Import other files
mod parse_gemtext;
fn clear_screen() { fn clear_screen() {
println!("clearing"); if DEBUG_MODE == false
Command::new("clear") {
.status() println!("clearing");
.expect("Failed to clear screen"); Command::new("clear")
} .status()
.expect("Failed to clear screen");
fn parse_markdown(page_content: String) -> (String, Vec<String>) {
let mut parsed_page_content: String = "".to_string();
let mut hyperlink_number_counter: u64 = 0;
let mut links: Vec<String> = Vec::new();
let (screen_width, _screen_height) = termion::terminal_size().unwrap(); // So the horizontal line (<hr/>) spans the whole console
for line in page_content.lines() {
let mut parsed_line: String = line.to_string();
// Bold
let bold_regex = Regex::new(r"((\*\*)|(__))(.*?)((\*\*)|(__))").unwrap();
parsed_line = bold_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[4].bold().to_string()
}).to_string();
// Strikethrough
let strikethrough_regex = Regex::new(r"~~(.*?)~~").unwrap();
parsed_line = strikethrough_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].strikethrough().to_string()
}).to_string();
// Horizontal lines
let hr_regex = Regex::new(r"^(\*\*\*)|(---)|(___)$").unwrap();
parsed_line = hr_regex.replace_all(&parsed_line, |_caps: &regex::Captures| {
let mut result: String = "\n".to_string();
for _x in 0..screen_width/2 {
result += "- ";
}
result += "\n";
result
}).to_string();
// html br tag support
let br_regex = Regex::new(r"(.*?)<br/>(.*?)").unwrap();
parsed_line = br_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}{}{}", &caps[1], "\n", &caps[2])
}).to_string();
// Italics
let italic_regex = Regex::new(r"\*(.*?)\*").unwrap();
parsed_line = italic_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].italic().to_string()
}).to_string();
let italic_regex = Regex::new(r"_(.*?)_").unwrap();
parsed_line = italic_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].italic().to_string()
}).to_string();
// Block quotes
let block_quotes_regex = Regex::new(r"^>(.*)").unwrap();
parsed_line = block_quotes_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!(" | {}", &caps[1])
}).to_string();
// Ordered list
let ordered_list_regex = Regex::new(r"^([ \t]+|^)([0-9]+)\. (.*)").unwrap();
parsed_line = ordered_list_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{} {}. {}", &caps[1], &caps[2], &caps[3])
}).to_string();
// Unordered list ([ ]+|^)- (.*)
let unordered_list_regex = Regex::new(r"^([ \t]+|^)(-|\+|\*).(.*)").unwrap();
parsed_line = unordered_list_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}{}", &caps[1], &caps[3])
}).to_string();
// Inline code
let inline_code_regex = Regex::new(r"`([^`]+?)`").unwrap();
parsed_line = inline_code_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].magenta())
}).to_string();
// HyperLink
let hyperlink_regex = Regex::new(r"(.*?)\[(.*?)\]\((.*?)\)").unwrap();
parsed_line = hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
// Check if the character before the link is not '!'
if !caps[1].ends_with('!') { // caps[1] is everything before the link
let result = format!("{}{}[{}]", &caps[1], &caps[2].blue().underline(), hyperlink_number_counter);
let url = caps[3].to_string();
links.push(url);
hyperlink_number_counter += 1;
result
} else {
// If it's an image (starts with !), return the link as is
let url = caps[3].to_string();
links.push(url);
hyperlink_number_counter += 1;
format!("({})[{}]", &caps[2].green(), hyperlink_number_counter)
}
}).to_string();
let quick_hyperlink_regex = Regex::new(r"<(.*:\/\/.*)>").unwrap();
parsed_line = quick_hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
hyperlink_number_counter += 1;
let url = caps[1].to_string();
links.push(url);
format!("{}[{}]", &caps[1].blue().underline(), hyperlink_number_counter)
}).to_string();
parsed_page_content+=&(parsed_line + "\n");
} }
// multiline code
let multiline_code_regex = Regex::new(r"(?ms)```((.*?\n)+?)```").unwrap();
parsed_page_content = multiline_code_regex.replace_all(&parsed_page_content, |caps: &regex::Captures| {
// Capture the code inside the %% blocks
let code_block = &caps[1];
// Add a tab to each line in the block
let indented_code = code_block
.lines()
.map(|line| format!("\t{}", line)) // Insert tab at the start of each line
.collect::<Vec<String>>()
.join("\n");
// Return the formatted block with magenta color
format!("{}", indented_code.magenta())
}).to_string();
return (parsed_page_content, links);
} }
fn fetch_page(url: &Url) -> String { fn fetch_page(url: &Url) {
let full_url_formatted = format!("{}", url); let full_url_formatted = format!("{}", url);
// Call curl using Com, mand let output = Command::new("gemget")
let output = Command::new("curl") .args([full_url_formatted, "-o".to_string(), "/tmp/page".to_string()])
.arg(full_url_formatted)
.output() .output()
.expect("Failed to execute curl command"); .expect("Failed to execute gemget command");
// Check if the command was successful // Check if the command was successful
if output.status.success() { if ! output.status.success() {
let page: String = String::from_utf8_lossy(&output.stdout).to_string(); println!("{}\n{:?}\n", "Failed to fetch page:".red(), output);
return page
} else {
eprintln!("Error:\n{}", String::from_utf8_lossy(&output.stderr));
let result: String = "error".to_string();
return result
} }
} }
fn render_page(url: Url, source: bool) -> Vec<String> { fn render_page(url: Url, source: bool) -> Vec<String> {
clear_screen(); clear_screen();
let mut content = fetch_page(&url); fetch_page(&url);
let mut links = Vec::new(); let mut links = Vec::new();
let (screen_width, _screen_height) = termion::terminal_size().unwrap(); if let Ok(mut content) = fs::read_to_string::<String>("/tmp/page".to_string()) {
Command::new("rm")
.arg("/tmp/page")
.output()
.expect("Failed to delete tmp page");
let (screen_width, _screen_height) = termion::terminal_size().unwrap();
if source == true { if source == true {
content += &format!("{}", &"Viewing source code".yellow()); content += &format!("{}", &"Viewing source code".yellow());
} }
else if &content[..13] == "<!DOCTYPE md>" { else {
(content, links) = parse_markdown((&content[13..]).to_string()); (content, links) = parse_gemtext::parse_gemtext(content);
} }
else {
content += &format!("{}", &"Warning: This page is invalid markdown, it should contain <!DOCTYPE md> at the very start of the file, showing raw text".yellow());
}
for _i in 0..screen_width { for _i in 0..screen_width {
print!(""); print!("-");
} }
print!("{}\n", url); print!("{}\n", url);
for _i in 0..screen_width { for _i in 0..screen_width {
print!(""); print!("-");
} }
println!("\n\n{}", content); println!("\n\n{}", content);
for _i in 0..screen_width { for _i in 0..screen_width {
print!(""); print!("-");
} }
println!(); println!();
// Return links (you can add link parsing logic) // Return links (you can add link parsing logic)
return links; }
return links;
} }
fn input() -> String{ fn input() -> String{
@ -206,18 +89,14 @@ fn parse_url(user_input: String, previous_url: &Url) -> Result<Url, ParseError>
println!("Contains different scheme or is a path"); println!("Contains different scheme or is a path");
user_input user_input
} }
else if user_input[..1] == *"/" {
format!("http://{}/{}",Url::host_str(previous_url).expect("ivalid").to_string(), user_input)
}
else { else {
println!("prepending scheme to user input"); format!("gemini://{}/{}",Url::host_str(previous_url).expect("ivalid").to_string(), user_input)
format!("http://{}", user_input) // Prepend 'mttp://' if no scheme is found
}; };
println!("Parsing: {}", to_parse); println!("Parsing: {}", to_parse);
if let Ok(mut url) = Url::parse(&to_parse) { if let Ok(mut url) = Url::parse(&to_parse) {
if url.port() == None { if url.port() == None {
let _ = url.set_port(Some(3477)); let _ = url.set_port(Some(1965));
} }
println!("{:?}",url); println!("{:?}",url);
println!("{}",url.as_str()); println!("{}",url.as_str());
@ -235,7 +114,7 @@ fn main() {
println!("Enter a url: "); println!("Enter a url: ");
let user_input = input(); let user_input = input();
if user_input == "q" { if user_input == "q" || user_input == "quit" || user_input == "exit" {
std::process::exit(0); std::process::exit(0);
} }
let mut load_page: bool = true; let mut load_page: bool = true;
@ -243,19 +122,30 @@ fn main() {
let mut historical_position: usize = 0; let mut historical_position: usize = 0;
let mut links: Vec<String> = Vec::new(); let mut links: Vec<String> = Vec::new();
let mut source: bool = false; // Wether to view source of markdown page or rendered version let mut source: bool = false; // Wether to view source of markdown page or rendered version
if let Ok(mut url) = parse_url(user_input, &Url::parse(&"http://deadvey.com").unwrap()) { // Change this and make internal pages ;) if let Ok(mut url) = parse_url(user_input, &Url::parse(&"gemini://geminiprotocol.net").unwrap()) { // Change this and make internal pages ;)
history.push(url.clone()); history.push(url.clone());
'mainloop: loop { 'mainloop: loop {
if load_page { if load_page {
links = render_page(history[historical_position].clone(), source); links = render_page(history[historical_position].clone(), source);
println!("Enter reference number to follow, h for help, or q to quit"); println!("Enter reference number to follow, h for help, or q to quit");
} }
url = history[historical_position].clone();
load_page = false; load_page = false;
let user_input = input(); let user_input = input();
if user_input == "q" { if user_input == "q" {
break 'mainloop; break 'mainloop;
} }
else if user_input == "d" {
println!(
"load_page: {}\nhistory: {:?}\nhistorical_postition: {}\nlinks: {:?}\nsource: {}",
load_page,
history,
historical_position,
links,
source
);
}
else if user_input == "r" { else if user_input == "r" {
load_page = true; load_page = true;
continue; continue;
@ -294,10 +184,11 @@ fn main() {
else if user_input == "h" { else if user_input == "h" {
println!("Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser println!("Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser
q: quit q: quit
d: debug info
h: help h: help
r: reload r: reload
s: view source code of page s: view source code of page
i: visit root index of this host eg: root index of mttp://deadvey.com/blog/4.md is just deadvey.com i: visit root index of this host eg: root index of gemini://deadvey.com/blog/4.md is just gemini://deadvey.com
b: go back in history b: go back in history
f: go forward in history f: go forward in history
ox: print the hyprlink of reference x eg: o5 or o24 ox: print the hyprlink of reference x eg: o5 or o24

91
src/parse_gemtext.rs Normal file
View File

@ -0,0 +1,91 @@
use colored::Colorize;
use regex::Regex;
pub fn parse_gemtext(page_content: String) -> (String, Vec<String>) {
let mut parsed_page_content: String = "".to_string();
let mut hyperlink_number_counter: u64 = 0;
let mut links: Vec<String> = Vec::new();
let mut preformatted_code_toggle = false;
// Regex patterns
let preformatted_text_regex = Regex::new(r"^```(.*)").unwrap();
let header1_regex = Regex::new(r"^# (.*)").unwrap();
let header2_regex = Regex::new(r"^## (.*)").unwrap();
let header3_regex = Regex::new(r"^### (.*)").unwrap();
let block_quotes_regex = Regex::new(r"^>(.*)").unwrap();
let unordered_list_regex = Regex::new(r"^([ \t]+|^)(\*).(.*)").unwrap();
let hyperlink_regex = Regex::new(r"=>\s(\S*)\s(.*)").unwrap();
let quick_hyperlink_regex = Regex::new(r"=>\s(.*)").unwrap();
for line in page_content.lines() {
let mut parsed_line: String = line.to_string();
let mut remove_line = false;
// preformatted text
parsed_line = preformatted_text_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
// Flip the toggle
preformatted_code_toggle = ! preformatted_code_toggle;
if caps[1] == *""
{
remove_line = true;
}
// Remove the ```
format!("{}", &caps[1].magenta())
}).to_string();
if preformatted_code_toggle == false
{
// Headers
parsed_line = header1_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].blue().bold().underline())
}).to_string();
parsed_line = header2_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].blue().bold())
}).to_string();
parsed_line = header3_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].bold())
}).to_string();
// Block quotes
parsed_line = block_quotes_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!(" | {}", &caps[1].red())
}).to_string();
// Unordered list ([ ]+|^)- (.*)
parsed_line = unordered_list_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}{}", &caps[1], &caps[3])
}).to_string();
// HyperLink
parsed_line = hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
// Check if the character before the link is not '!'
let result = format!("[{}] {}", hyperlink_number_counter, &caps[2].blue().underline());
let url = caps[1].to_string();
links.push(url);
hyperlink_number_counter += 1;
result
}).to_string();
parsed_line = quick_hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
hyperlink_number_counter += 1;
let url = caps[1].to_string();
links.push(url);
format!("[{}] {}", hyperlink_number_counter, &caps[1].blue().underline())
}).to_string();
}
else if preformatted_code_toggle == true
{
parsed_line = parsed_line.magenta().to_string();
}
if remove_line == false
{
parsed_page_content+=&(parsed_line + "\n");
}
}
return (parsed_page_content, links);
}