Skip to content

Commit

Permalink
Merge pull request #2 from coco33920/math
Browse files Browse the repository at this point in the history
[Feature] Add supports for inline math and some env
  • Loading branch information
vanilla-extracts authored Mar 23, 2022
2 parents da64210 + 1915362 commit 6c75f54
Show file tree
Hide file tree
Showing 8 changed files with 333 additions and 217 deletions.
9 changes: 8 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ translates TeX Books (simple one like stories kind of book) to HTML. I use this

## What this project *is not*
The purpose of this project **is not** and never will be a kind of "TeX To HTML" compiler, I do *not* intend to implement the full TeX
and LaTeX specification. As such the support of mathematics is likely **never to be** included here. This is a tool mainly done *for me* for my usage, that is publishing my book on ScribbleHub and the web. I'm sure you can find real compilers if you want to support
and LaTeX specification. This is a tool mainly done *for me* for my usage, that is publishing my book on ScribbleHub and the web. I'm sure you can find real compilers if you want to support
the full specification of TeX and LaTeX

## Support
Expand All @@ -23,6 +23,13 @@ The project currently translate *LaTeX* to human-readable HTML files (the line b
- `textbf` is replaced by `<b>`
- `newline`, `\\`, and `par` puts a `<br>`
- `bigskip` closes the paragraph and open another one.
- Some math
- Inline math with `$`
- Math env
- Align*
- Align
- Equation
- Equation*

## Near Future TODO List
* parsing glossary entries from a glossary file and printing the `gls` with a link to the glossary
Expand Down
2 changes: 1 addition & 1 deletion bin/main.ml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@ let spec = [
]

let execute_command file outname start_chapter =
Htmlfromtexbooks.Parser.print_file_in_html ~min_chap:start_chapter file outname;;
Htmlfromtexbooks.Htmlgen.print_file_in_html ~min_chap:start_chapter file outname;;

let parse_filename file outname start_chapter =
if not (Sys.file_exists file) then (Printf.printf "The %s file do not exists" file; exit 2)
Expand Down
2 changes: 2 additions & 0 deletions lib/dune
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
(include_subdirs unqualified)

(library
(name htmlfromtexbooks)
(libraries str))
218 changes: 218 additions & 0 deletions lib/htmlgen.ml
Original file line number Diff line number Diff line change
@@ -0,0 +1,218 @@
open Parser
open Glossary
open Utils

let url_encoded_str s = s;;

let print_table_of_content ast min_chap =
let count = [|1;1;1;1|] in
let rec aux acc ast =
match ast with
| [] -> acc
| Chapter (s,l)::q ->
let chapnum = count.(0) in
begin
count.(0) <- count.(0) + 1;
count.(1) <- 1;
count.(2) <- 1;
count.(3) <- 1;
end;
let str = aux "" l in
let new_line = if chapnum>=min_chap then Printf.sprintf "<li><a href=\"#c%i\">Chapter %i : %s</a></li>\n"
chapnum (chapnum-min_chap+1) s else "" in
aux (acc^new_line^str) q

| Section (s,l)::q ->
let chapnum,secnum = count.(0),count.(1) in
begin
count.(1) <- count.(1) + 1;
count.(2) <- 1;
count.(3) <- 1;
end;
let str = aux "" l in
let new_line = Printf.sprintf "<li><a href=\"#s%f\">Section %i.%i : %s</a></li>\n"
(2.**(float chapnum)*.3.**(float secnum)) (chapnum-min_chap+1) secnum s in
aux (acc^new_line^str) q

| Subsection (s,l)::q ->
let chapnum,secnum,ssecnum = count.(0),count.(1),count.(2) in
begin
count.(2) <- count.(2) + 1;
count.(3) <- 1;
end;
let str = aux "" l in
let new_line = Printf.sprintf "<li><a href=\"#ss%f\">Subsection %i.%i.%i : %s</a></li>\n"
(2.**(float chapnum)*.3.**(float secnum)*.5.**(float ssecnum)) (chapnum-min_chap+1) secnum ssecnum s in
aux (acc^new_line^str) q

| Subsubsection (s,l)::q ->
let chapnum,secnum,ssecnum,sssecnum = count.(0),count.(1),count.(2),count.(3) in
begin
count.(3) <- count.(3) + 1;
end;
let str = aux "" l in
let new_line = Printf.sprintf "<li><a href=\"#sss%f\">Subsubsection %i.%i.%i.%i : %s</a></li>\n"
(2.**(float chapnum)*.3.**(float secnum)*.5.**(float ssecnum)*.7.**(float sssecnum)) (chapnum-min_chap+1) secnum ssecnum sssecnum s in
aux (acc^new_line^str) q
| Env (_,l)::q -> let a = aux acc l in aux (acc^a) q
| _::q -> aux acc q
in (aux "" ast);;

let parse_to_html ?(min_chap=1) write_before ast=
let count = [|1;1;1;1|] in
let rec aux ?(write=write_before) acc ast =
match ast with
| [] -> acc
| Nul::q -> aux acc q
| Line s::q ->
let line= if write then Printf.sprintf "%s\n" s else ""
in aux ~write:write (acc^line) q
| Math s::q ->
let url = Printf.sprintf "https://latex.codecogs.com/svg.image?%s"s in
let url = url_encoded_str url in
let line = if write then Printf.sprintf "<img src=\"%s\"/>\n" url else ""
in aux ~write:write (acc^line) q
| AtomicCmd (s,_)::q ->
let new_line = (match s with
| "par" -> "<br/>\n"
| "bigskip" -> "</p>\n\n<p>\n"
| "\\" -> "<br/>\n"
| "printglossaries" -> ""
| "sep" -> "<div class=\"center\"><b>***</b></div>"
| "item" -> "·"
| "newline" -> "<br/>\n"
| "ast" -> "*"
| e ->
(try
let structure = Hashtbl.find commands e in
let str = aux ~write:write acc structure
in str
with _ -> ""))
in let new_acc = if write then acc^new_line^"\n" else ""
in aux ~write:write new_acc q

| OneArgCmd (s,_,l)::q ->
let str = aux "" l in
let new_line = (match s with
| "par" -> "<br/>\n"
| "bigskip" -> "</p>\n\n<p>\n"
| "\\" -> "<br/>\n"
| "printglossaries" -> ""
| "item" -> "·"
| "sep" -> "<div class=\"center\"><b>***</b></div>"
| "newline" -> "<br/>\n"
| "ast" -> "*"
| "gls" ->
(match l with
| [] -> ""
| Line s::_ ->
let name,_ = recognize_gls s in Printf.sprintf "<a href=\"#%s\">%s</a> " s name
| _::_ -> "")
| "textit" -> (Printf.sprintf "<i>%s</i>" str)
| "textbf" -> (Printf.sprintf "<b>%s</b>" str)
| "url" -> (Printf.sprintf "<a href=\"%s\">%s</a>" (Str.global_replace (Str.regexp "\n") "" str) str)
| e ->
(try
let structure = Hashtbl.find commands e in
let str = aux ~write:write acc structure
in str
with _ -> ""))
in let new_acc = if write then acc^(new_line) else ""
in aux ~write:write new_acc q

| Chapter (s,l)::q ->
let chapnum = count.(0) in
begin
count.(0) <- count.(0) + 1;
count.(1) <- 1;
count.(2) <- 1;
count.(3) <- 1;
end;
let str = aux ~write:(chapnum>=min_chap) "" l in
let new_line = if chapnum>=min_chap then Printf.sprintf "<h1 id=\"c%i\">Chapter %i : %s</h1><br/>\n"
chapnum (chapnum-min_chap+1) s else "" in
aux ~write:write (acc^new_line^str) q

| Section (s,l)::q ->
let chapnum,secnum = count.(0),count.(1) in
begin
count.(1) <- count.(1) + 1;
count.(2) <- 1;
count.(3) <- 1;
end;
let str = aux ~write:write "" l in
let new_line = Printf.sprintf "<h2 id=\"s%f\">Section %i.%i : %s</h2><br/>\n"
(2.**(float chapnum)*.3.**(float secnum)) (chapnum-min_chap+1) secnum s in
aux ~write:write (acc^new_line^str) q

| Subsection (s,l)::q ->
let chapnum,secnum,ssecnum = count.(0),count.(1),count.(2) in
begin
count.(2) <- count.(2) + 1;
count.(3) <- 1;
end;
let str = aux ~write:write "" l in
let new_line = Printf.sprintf "<h3 id=\"ss%f\">Subsection %i.%i.%i : %s</h3><br/>\n"
(2.**(float chapnum)*.3.**(float secnum)*.5.**(float ssecnum)) (chapnum-min_chap+1) secnum ssecnum s in
aux ~write:write (acc^new_line^str) q

| Subsubsection (s,l)::q ->
let chapnum,secnum,ssecnum,sssecnum = count.(0),count.(1),count.(2),count.(3) in
begin
count.(3) <- count.(3) + 1;
end;
let str = aux ~write:write "" l in
let new_line = Printf.sprintf "<h4 id=\"sss%f\">Subsubsection %i.%i.%i.%i : %s</h4><br/>\n"
(2.**(float chapnum)*.3.**(float secnum)*.5.**(float ssecnum)*.7.**(float sssecnum)) (chapnum-min_chap+1) secnum ssecnum sssecnum s in
aux ~write:write (acc^new_line^str) q

| Env (s,l)::q ->
let str = aux ~write:write "" l in
let new_line = (match s with
| "document" -> str
| "center" -> Printf.sprintf "<div style=\"margin: auto; text-align: center;\">\n%s\n</div>" str
| _ -> str)
in aux ~write:write (acc^new_line^"\n") q
| _::q -> aux acc q
in aux "" ast;;


let prepare_body name str toc =
let line = "<title>" ^ name ^ "</title>\n"
in let line = line ^ "<body>\n"
in let line = line ^ "<style>\n.center {\nmargin:auto;\ntext-align:center;\n}\n </style>"
in let line = line ^ "<div class=\"center\">\n"
in let line = line ^ (Printf.sprintf "<h1>%s</h1>\n" name)
in let line = line ^ "<h2>Table of Content</h2>\n"
in let line = line ^ "<ul>\n"
in let line = line ^ toc ^ "\n"
in let line = line ^ "</ul>\n"
in let line = line ^ "</div>\n"
in let line = line ^ str ^ "\n"
in let line = line ^ (prints_glossary ()) ^ "\n"
in let line = line ^ "</body>"
in line;;


let pre_parse_file file =
let str = read_file file in
let str = String.concat "\n" str in
let a = parse_string str
in let p,doc = separate_preamble a
in read_preamble p;
let doc = separate_sections doc
in let doc = calculate_environments doc
in let doc = Mathgen.re_calculate_env doc in
(match (Hashtbl.find_opt preamble "glossary") with
| Some s -> init_glossary s
| None -> (););
doc;;


let print_file_in_html ?(min_chap=1) ?(write_before=false) file outname =
let a = pre_parse_file file in
let html = parse_to_html ~min_chap:min_chap write_before a in
let toc = print_table_of_content a min_chap in
let name = try Hashtbl.find preamble "title" with _ -> "Generic" in
prepare_body name html toc
|> write_to_file outname;;
53 changes: 53 additions & 0 deletions lib/mathgen.ml
Original file line number Diff line number Diff line change
@@ -0,0 +1,53 @@
open Parser

let generate_latex_command s l =
let line = "\\"^s in
let args = String.concat "," l in
let line = if args="" then line else Printf.sprintf "%s[%s]" line args in
line;;



let generate_latex l =
let rec unparse acc l =
match l with
| [] -> String.concat " " acc
| Line s::q -> unparse (s::acc) q
| AtomicCmd (s,l)::q ->
let line = generate_latex_command s l in
unparse (line::acc) q
| OneArgCmd (s,l,l2)::q ->
let line = generate_latex_command s l in
let line = Printf.sprintf "%s{%s}" line (unparse [] l2) in
unparse (line::acc) q
| MultipleArgCmd (s,l,l2)::q ->
let line = generate_latex_command s l in
let l = List.map (unparse []) l2 in
let line = Printf.sprintf "%s{%s}" line (String.concat "\n" l) in
unparse (line::acc) q
| _::q -> unparse acc q
in unparse [] l;;

let env_de_latexer env =
match env with
| e -> e;;

let re_calculate_env ast =
let rec aux acc ast =
match ast with
| [] -> acc
| Env (s,n)::q when s="align"
-> aux (Math(Printf.sprintf "\\begin{align}%s\\end{align}" (generate_latex n))::acc) q
| Env (s,n)::q when s="align*"
-> aux (Math(Printf.sprintf "\\begin{align*}%s\\end{align*}" (generate_latex n))::acc) q
| Env (s,n)::q when s="equation"
-> aux (Math(Printf.sprintf "\\begin{equation}%s\\end{equation}" (generate_latex n))::acc) q
| Env (s,n)::q when s="equation*"
-> aux (Math(Printf.sprintf "\\begin{equation*}%s\\end{equation*}" (generate_latex n))::acc) q
| Env(s,n)::q
-> let ast = aux [] n in
let ast = List.rev ast
in let env = Env(s,ast)
in aux (env::acc) q
| e::q -> aux (e::acc) q
in List.rev (aux [] ast);;
Loading

0 comments on commit 6c75f54

Please sign in to comment.