Compare commits

..

28 Commits

Author SHA1 Message Date
ca9d4cfaf9 readme 2025-04-03 23:19:21 +01:00
1321e0dcaf works ish 2025-04-03 22:15:38 +01:00
a7468d3f40 Gemini version 2025-04-03 21:42:37 +01:00
845866ef9d readme 2025-01-26 11:15:34 +00:00
5f856f35fe source code viewing 2025-01-26 02:59:06 +00:00
7b9d2d6fd3 some stuff 2025-01-26 02:39:43 +00:00
f46d3bac42 fixed history functionality, TO DO: arguments, documentation 2025-01-26 02:12:56 +00:00
ced5648c01 url parsing works (FINALLY) 2025-01-26 01:44:24 +00:00
7b07b6f051 done for the day, got a proper url parser 2025-01-22 01:18:30 +00:00
e4b08b45bc ``` 2025-01-21 23:59:18 +00:00
1b8614b956 open http links in web browser now :D 2025-01-21 19:04:40 +00:00
d55d70ec45 <!DOCTYPE md> now required 2025-01-21 18:33:14 +00:00
67a5096267 going back in history sort of works, but is quite buggy 2025-01-13 14:43:00 +00:00
0da9e95b2a sorta done history and going back, but gonna go sleep now, not finished btw 2025-01-13 00:52:58 +00:00
2aa4a82af9 made input's more safe 2025-01-12 23:20:30 +00:00
deadvey
88200eb354 http stuff in regex 2025-01-12 02:29:11 +00:00
deadvey
bb75241a3c ignore swap files ¬_¬! 2025-01-12 02:20:16 +00:00
deadvey
4e7422c478 made code a bit safer, harder to crash 2025-01-12 02:19:05 +00:00
deadvey
3d12793550 added a todo 2025-01-09 01:07:28 +00:00
deadvey
859ec9fcfc error yaps 2025-01-09 00:59:30 +00:00
deadvey
a1dfc6bd04 readme 2025-01-09 00:55:07 +00:00
deadvey
b72d43b250 Sublists work now 2025-01-09 00:47:29 +00:00
deadvey
8e860b89e7 quick links and <br/> support 2025-01-08 23:42:01 +00:00
deadvey
590cd001be few rendering changes 2025-01-08 20:35:59 +00:00
deadvey
a433ad41b5 removed excess reference printing 2025-01-07 22:53:02 +00:00
92bf985a9a Update src/main.rs
Some comment
2025-01-07 23:34:05 +01:00
deadvey
1130e37ec3 I forgot whatt I changed 2025-01-07 22:32:32 +00:00
deadvey
7ec6bf1c47 some changes like horizontal lines --- 2025-01-07 21:14:34 +00:00
7 changed files with 352 additions and 143 deletions

3
.gitignore vendored Normal file
View File

@@ -0,0 +1,3 @@
Cargo.lock
target
*.swp

View File

@@ -6,4 +6,6 @@ edition = "2021"
[dependencies] [dependencies]
colored = "2.2.0" colored = "2.2.0"
regex = "1.11.1" regex = "1.11.1"
termion = "4.0.3"
open = "5.3.2"
url = "2.5.4" url = "2.5.4"

48
README.md Normal file
View File

@@ -0,0 +1,48 @@
# Markdown web browser
A terminal web browser that lets you browse Gemini capsules, which use gemtext as a simpler alternative to HTML.
# Requirements
- gemget
# Installing
## Build from source:
- Clone the repo
```cargo run -r```
# Help
Type h in the program to see this text:
```
Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser
q: quit
d: debug info
h: help
r: reload
s: view source code of page
i: visit root index of this host eg: root index of gemini://deadvey.com/blog/4.md is just gemini://deadvey.com
b: go back in history
f: go forward in history
ox: print the hyprlink of reference x eg: o5 or o24
[url]: follow the inputed url
```
# Example:
![screenshot](/images/screenshot.png)
# TO DO
- Make pages scrollable
- Bookmarks
- Properly comment it because I can't lie I can't even follow it.
- Make it memory safe, it crashes if the input is unexpected.
- Use treesitter instead of Regex, because, reasons.
- "wtf deadvey" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "Don't use Regex to parse **ANYTHING**" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "use treesitter" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "yeah, definitley use treesitter" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "use treesitter" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "or glow" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "I found another markdown to terminal converter" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "ban [for using regex]" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- "use treesitter" - [error](https://git.javalsai.dynv6.net/ErrorNoInternet)
- Get a catchier name, 'markdown web browser' sounds kind of lame.
![error yapping](/images/error_yapping.gif)

BIN
images/error_yapping.gif Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 2.3 MiB

BIN
images/screenshot.png Normal file

Binary file not shown.

After

Width:  |  Height:  |  Size: 880 KiB

View File

@@ -1,135 +1,71 @@
use std::process::{Command}; use std::process::{Command};
use std::io::{stdin,stdout,Write}; use std::io::{stdin,stdout,Write};
use colored::Colorize; use colored::Colorize;
use regex::Regex; use url::{Url, ParseError};
use url::Url; use std::fs;
const DEBUG_MODE: bool = false;
// Import other files
mod parse_gemtext;
fn clear_screen() { fn clear_screen() {
if DEBUG_MODE == false
{
println!("clearing");
Command::new("clear") Command::new("clear")
.spawn() .status()
.expect("Failed to clear screen"); .expect("Failed to clear screen");
} }
fn parse_markdown(page_content: String) -> (String, Vec<String>) {
let mut parsed_page_content: String = "".to_string();
let mut hyperlink_number_counter: u64 = 0;
let mut links: Vec<String> = Vec::new();
for line in page_content.lines() {
let mut parsed_line: String = line.to_string();
// Bold
let bold_regex = Regex::new(r"\*\*(.*?)\*\*").unwrap();
parsed_line = bold_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].bold().to_string()
}).to_string();
let bold_regex = Regex::new(r"__(.*?)__").unwrap();
parsed_line = bold_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].bold().to_string()
}).to_string();
// Italics
let italic_regex = Regex::new(r"\*(.*?)\*").unwrap();
parsed_line = italic_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].italic().to_string()
}).to_string();
let italic_regex = Regex::new(r"_(.*?)_").unwrap();
parsed_line = italic_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
caps[1].italic().to_string()
}).to_string();
// Block quotes
let block_quotes_regex = Regex::new(r"^>(.*)").unwrap();
parsed_line = block_quotes_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!(" | {}", &caps[1].on_black())
}).to_string();
// Ordered list
let ordered_list_regex = Regex::new(r"^([0-9]+)\.(.*)").unwrap();
parsed_line = ordered_list_regex.replace_all(&parsed_line, " $1. $2").to_string();
// Unordered list
let unordered_list_regex = Regex::new(r"^(-|\+|\*).(.*)").unwrap();
parsed_line = unordered_list_regex.replace_all(&parsed_line, " • $2").to_string();
// Inline code
let inline_code_regex = Regex::new(r"`(.*)`").unwrap();
parsed_line = inline_code_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].magenta())
}).to_string();
// HyperLink
let hyperlink_regex = Regex::new(r"\[(.*?)\]\((.*?)\)").unwrap();
parsed_line = hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
let result = format!("{}[{}]", &caps[1].blue().underline(),hyperlink_number_counter);
let url = caps[2].to_string();
links.push(url);
hyperlink_number_counter+=1;
result
}).to_string();
parsed_page_content+=&(parsed_line + "\n");
} }
// multiline code fn fetch_page(url: &Url) {
let multiline_code_regex = Regex::new(r"(?ms)%%%((.*?\n)+?)%%%").unwrap(); let full_url_formatted = format!("{}", url);
parsed_page_content = multiline_code_regex.replace_all(&parsed_page_content, |caps: &regex::Captures| {
// Capture the code inside the %% blocks
let code_block = &caps[1];
// Add a tab to each line in the block let output = Command::new("gemget")
let indented_code = code_block .args([full_url_formatted, "-o".to_string(), "/tmp/page".to_string()])
.lines()
.map(|line| format!("\t{}", line)) // Insert tab at the start of each line
.collect::<Vec<String>>()
.join("\n");
// Return the formatted block with magenta color
format!("{}", indented_code.magenta())
}).to_string();
return (parsed_page_content, links);
}
fn fetch_page(host: &String, port: &String, path: &String) -> String {
let full_url_formatted = format!("{}:{}/{}", host, port, path);
// Call curl using Com, mand
let output = Command::new("curl")
.arg(full_url_formatted)
.output() .output()
.expect("Failed to execute curl command"); .expect("Failed to execute gemget command");
// Check if the command was successful // Check if the command was successful
if output.status.success() { if ! output.status.success() {
let page: String = String::from_utf8_lossy(&output.stdout).to_string(); println!("{}\n{:?}\n", "Failed to fetch page:".red(), output);
return page
} else {
eprintln!("Error:\n{}", String::from_utf8_lossy(&output.stderr));
let result: String = "error".to_string();
return result
} }
} }
fn render_page(host: String, port: String, path: String) -> Vec<String> { fn render_page(url: Url, source: bool) -> Vec<String> {
clear_screen(); clear_screen();
let mut content = fetch_page(&host, &port, &path); fetch_page(&url);
let mut links = Vec::new(); let mut links = Vec::new();
(content, links) = parse_markdown(content); if let Ok(mut content) = fs::read_to_string::<String>("/tmp/page".to_string()) {
print!("{}: {}\n", host, path); Command::new("rm")
for _i in 0..format!("{}: {}", host, path).len() { .arg("/tmp/page")
.output()
.expect("Failed to delete tmp page");
let (screen_width, _screen_height) = termion::terminal_size().unwrap();
if source == true {
content += &format!("{}", &"Viewing source code".yellow());
}
else {
(content, links) = parse_gemtext::parse_gemtext(content);
}
for _i in 0..screen_width {
print!("-"); print!("-");
} }
print!("\n\n{}", content); print!("{}\n", url);
for _i in 0..format!("{}: {}", host, path).len() { for _i in 0..screen_width {
print!("-");
}
println!("\n\n{}", content);
for _i in 0..screen_width {
print!("-"); print!("-");
} }
println!(); println!();
for i in 0..links.len() {
println!("{}: {}", i, links[i].blue().underline()); // Return links (you can add link parsing logic)
} }
println!();
return links; return links;
} }
@@ -146,31 +82,160 @@ fn input() -> String{
return s; return s;
} }
fn main() { fn parse_url(user_input: String, previous_url: &Url) -> Result<Url, ParseError> {
println!("Enter a url: "); println!("user input: {}",user_input);
let mut host: String = input(); println!("previous url: {:?}",previous_url);
let mut port: String = "3477".to_string(); let to_parse = if user_input.contains("://") {
let mut path: String = "/".to_string(); println!("Contains different scheme or is a path");
user_input
'mainloop: loop {
let links = render_page(host.clone(), port.clone(), path.clone());
println!("{}:{}/{}", host, port, path);
println!("Enter link number to follow, or q to quit");
let link_to_follow = input();
if link_to_follow == "q" {
break 'mainloop;
} }
else { else {
let number: usize = link_to_follow.parse::<usize>().unwrap(); format!("gemini://{}/{}",Url::host_str(previous_url).expect("ivalid").to_string(), user_input)
};
let parsed_url = Url::parse(&links[number]).expect("Invalid URL"); println!("Parsing: {}", to_parse);
host = parsed_url.host_str().expect("No host found").to_string(); if let Ok(mut url) = Url::parse(&to_parse) {
port = parsed_url.port().unwrap_or(3477).to_string(); if url.port() == None {
path = parsed_url.path().to_string(); let _ = url.set_port(Some(1965));
println!("{}:{}/{}", host, port, path);
} }
println!("{:?}",url);
println!("{}",url.as_str());
println!("parsed successfully");
return Ok(url)
}
else {
return Err(ParseError::InvalidDomainCharacter)
}
}
fn main() {
clear_screen();
println!("Enter a url: ");
let user_input = input();
if user_input == "q" || user_input == "quit" || user_input == "exit" {
std::process::exit(0);
}
let mut load_page: bool = true;
let mut history: Vec<Url> = Vec::new();
let mut historical_position: usize = 0;
let mut links: Vec<String> = Vec::new();
let mut source: bool = false; // Wether to view source of markdown page or rendered version
if let Ok(mut url) = parse_url(user_input, &Url::parse(&"gemini://geminiprotocol.net").unwrap()) { // Change this and make internal pages ;)
history.push(url.clone());
'mainloop: loop {
if load_page {
links = render_page(history[historical_position].clone(), source);
println!("Enter reference number to follow, h for help, or q to quit");
}
url = history[historical_position].clone();
load_page = false;
let user_input = input();
if user_input == "q" {
break 'mainloop;
}
else if user_input == "d" {
println!(
"load_page: {}\nhistory: {:?}\nhistorical_postition: {}\nlinks: {:?}\nsource: {}",
load_page,
history,
historical_position,
links,
source
);
}
else if user_input == "r" {
load_page = true;
continue;
}
else if user_input == "s" {
source = ! source; // Flip the boolean to toggle source mode
load_page = true;
}
else if user_input == "i" {
let _ = url.set_path("/");
for _i in historical_position+1..history.len() {
history.remove(historical_position+1);
}
history.push(url.clone());
historical_position += 1;
load_page = true;
}
else if user_input == "b" {
if historical_position > 0 {
historical_position -= 1;
load_page = true;
}
else {
println!("At start of history");
}
}
else if user_input == "f" {
if historical_position < history.len()-1 {
historical_position += 1;
load_page = true;
}
else {
println!("At end of history");
}
}
else if user_input == "h" {
println!("Source code: https://git.javalsai.dynv6.net/deadvey/markdown-webbrowser
q: quit
d: debug info
h: help
r: reload
s: view source code of page
i: visit root index of this host eg: root index of gemini://deadvey.com/blog/4.md is just gemini://deadvey.com
b: go back in history
f: go forward in history
ox: print the hyprlink of reference x eg: o5 or o24
[url]: follow the inputed url");
}
else if user_input.chars().nth(0).unwrap() == 'o' {
let number_str = &user_input[1..];
if let Ok(number) = number_str.parse::<usize>() {
println!("{}", links[number]);
} else {
println!("error");
}
}
else if let Ok(number) = user_input.parse::<usize>() {
if number < links.len() {
if let Ok(parsed_value) = parse_url(links[number].clone(), &url.clone()) {
url = parsed_value;
for _i in historical_position+1..history.len() {
history.remove(historical_position+1);
}
history.push(url.clone());
historical_position += 1;
load_page = true;
}
else {
println!("Invalid url\nAttempting to open url in web browser");
}
} else {
println!("Invalid reference id");
}
}
else if let Ok(parsed_value) = parse_url(user_input, &url.clone()) {
url = parsed_value;
for _i in historical_position+1..history.len() {
history.remove(historical_position+1);
}
history.push(url.clone());
historical_position += 1;
load_page = true;
}
else {
println!("Invalid input");
}
}
}
else {
println!("Invalid mttp url, try mttp:// at the start of your input.");
} }
} }

91
src/parse_gemtext.rs Normal file
View File

@@ -0,0 +1,91 @@
use colored::Colorize;
use regex::Regex;
pub fn parse_gemtext(page_content: String) -> (String, Vec<String>) {
let mut parsed_page_content: String = "".to_string();
let mut hyperlink_number_counter: u64 = 0;
let mut links: Vec<String> = Vec::new();
let mut preformatted_code_toggle = false;
// Regex patterns
let preformatted_text_regex = Regex::new(r"^```(.*)").unwrap();
let header1_regex = Regex::new(r"^# (.*)").unwrap();
let header2_regex = Regex::new(r"^## (.*)").unwrap();
let header3_regex = Regex::new(r"^### (.*)").unwrap();
let block_quotes_regex = Regex::new(r"^>(.*)").unwrap();
let unordered_list_regex = Regex::new(r"^([ \t]+|^)(\*).(.*)").unwrap();
let hyperlink_regex = Regex::new(r"=>\s(\S*)\s(.*)").unwrap();
let quick_hyperlink_regex = Regex::new(r"=>\s(.*)").unwrap();
for line in page_content.lines() {
let mut parsed_line: String = line.to_string();
let mut remove_line = false;
// preformatted text
parsed_line = preformatted_text_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
// Flip the toggle
preformatted_code_toggle = ! preformatted_code_toggle;
if caps[1] == *""
{
remove_line = true;
}
// Remove the ```
format!("{}", &caps[1].magenta())
}).to_string();
if preformatted_code_toggle == false
{
// Headers
parsed_line = header1_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].blue().bold().underline())
}).to_string();
parsed_line = header2_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].blue().bold())
}).to_string();
parsed_line = header3_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}", &caps[1].bold())
}).to_string();
// Block quotes
parsed_line = block_quotes_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!(" | {}", &caps[1].red())
}).to_string();
// Unordered list ([ ]+|^)- (.*)
parsed_line = unordered_list_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
format!("{}{}", &caps[1], &caps[3])
}).to_string();
// HyperLink
parsed_line = hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
// Check if the character before the link is not '!'
let result = format!("[{}] {}", hyperlink_number_counter, &caps[2].blue().underline());
let url = caps[1].to_string();
links.push(url);
hyperlink_number_counter += 1;
result
}).to_string();
parsed_line = quick_hyperlink_regex.replace_all(&parsed_line, |caps: &regex::Captures| {
hyperlink_number_counter += 1;
let url = caps[1].to_string();
links.push(url);
format!("[{}] {}", hyperlink_number_counter, &caps[1].blue().underline())
}).to_string();
}
else if preformatted_code_toggle == true
{
parsed_line = parsed_line.magenta().to_string();
}
if remove_line == false
{
parsed_page_content+=&(parsed_line + "\n");
}
}
return (parsed_page_content, links);
}