2020-12-21 13:12:05 +01:00
|
|
|
# lib_src2md.rb
|
2021-01-11 03:15:04 +01:00
|
|
|
require 'pathname'
|
2020-12-21 13:12:05 +01:00
|
|
|
|
2021-03-03 15:45:54 +01:00
|
|
|
# The method 'src2md' converts .src.md file into .md file.
|
2021-04-27 14:08:30 +02:00
|
|
|
# The .md file is the final format for GFM, or intermediate markdown file for html and/or latex.
|
2021-01-11 03:15:04 +01:00
|
|
|
# - Links to relative URL are removed for latex. Otherwise, it remains.
|
|
|
|
# See "Hyperref and relative link" below for further explanation.
|
|
|
|
# - Width and height for images are removed for markdown and html. it remains for latex.
|
|
|
|
# ![sample](sample_image){width=10cm height=5cm} => ![sample](sample_image) for markdown and html
|
|
|
|
|
|
|
|
# ---- Hyperref and relative link ----
|
|
|
|
# Hyperref package makes internal link possible.
|
|
|
|
# The target of the link is made with '\hypertarget' command.
|
|
|
|
# And the link is made with '\hyperlink' command.
|
|
|
|
# For example,
|
|
|
|
# (sec11.tex)
|
|
|
|
# \hyperlink{tfeapplication.c}{Section 13}
|
|
|
|
# ... ...
|
|
|
|
# (sec13.tex)
|
|
|
|
# \hypertarget{tfeapplication.c}{%
|
|
|
|
# \section{tfeapplication.c}\label{tfeapplication.c}}
|
2021-04-27 14:08:30 +02:00
|
|
|
# If you click on the text 'Section 13' in sec11.tex, then you will move to 'tfeapplication.c' in sec13.tex.
|
2021-01-11 03:15:04 +01:00
|
|
|
|
|
|
|
# The following lines are the original one in sec11.md and the result in sec11.tex, which is generated by pandoc.
|
|
|
|
# (sec11.md)
|
|
|
|
# All the source files are listed in [Section 13](sec13.tex).
|
|
|
|
# (sec11.tex)
|
|
|
|
# All the source files are listed in \href{sec13.tex}{Section 13}.
|
|
|
|
# Therefore, if you want to correct the link in sec11.tex, you need to do the followings.
|
|
|
|
# 1. Look at the first line of sec13.md and get the section heading (tfeapplication.c).
|
|
|
|
# 2. substitute "\hyperlink{tfeapplication.c}{Section 13}" for "\href{sec13.tex}{Section 13}".
|
|
|
|
|
|
|
|
# The following lines are another conversion case by pandoc.
|
|
|
|
# (sec7.md)
|
|
|
|
# The source code of `tfe3.c` is stored in [src/tfe](../src/tfe) directory.
|
|
|
|
# (sec7.tex)
|
|
|
|
# The source code of \texttt{tfe3.c} is stored in \href{../src/tfe}{src/tfe} directory.
|
2021-04-20 14:36:12 +02:00
|
|
|
# The pdf file generated by lualatex recognizes that the link 'href{../src/tfe}' points a pdf file '../src/tfe.pdf'.
|
2021-01-11 03:15:04 +01:00
|
|
|
# To avoid generating such incorrect links, it is good to remove the links from the original markdown file.
|
|
|
|
|
2021-04-27 14:08:30 +02:00
|
|
|
# If the target is full URL, which means absolute URL begins with "http(s)", no problem happens.
|
2021-01-11 03:15:04 +01:00
|
|
|
|
2021-03-03 15:45:54 +01:00
|
|
|
# This script just remove the links if its target is relative URL if the target is latex.
|
2021-01-11 03:15:04 +01:00
|
|
|
# If you want to revive the link with relative URL, refer the description above.
|
|
|
|
|
2021-01-25 10:35:49 +01:00
|
|
|
# This script uses "fenced code blocks" for verbatim lines.
|
|
|
|
# It is available in GFM and pandoc's markdown but not in original markdown.
|
|
|
|
# Two characters backtick (`) and tilde (~) are possible for fences.
|
|
|
|
# This script uses tilde because info string cannot contain any backticks for the backtick code fence.
|
|
|
|
# Info string follows opening fence and it is usually a language name.
|
2021-03-03 15:45:54 +01:00
|
|
|
|
|
|
|
# GFM has fence code block as follows.
|
2021-01-25 10:35:49 +01:00
|
|
|
# ~~~C
|
|
|
|
# int main (int argc, char **argv) {
|
|
|
|
# ........
|
|
|
|
# ~~~
|
|
|
|
# Then the contents are highlighted based on C language syntax.
|
2021-03-03 15:45:54 +01:00
|
|
|
# This script finds the language by the suffix of the file name.
|
2021-01-25 10:35:49 +01:00
|
|
|
# .c => C, .h => C, .rb => ruby, Rakefile, => ruby, .xml => xml, .ui => xml, .y => bison, .lex => lex, .build => meson, .md => markdown
|
|
|
|
# Makefile => makefile
|
|
|
|
|
2021-03-03 15:45:54 +01:00
|
|
|
# Pandoc's markdown is a bit different.
|
|
|
|
# ~~~{.C .numberLines}
|
|
|
|
# int main (int argc, char **argv) {
|
|
|
|
# ........
|
|
|
|
# ~~~
|
|
|
|
# Then the contents are highlighted based on C language syntax and line numbers are added.
|
|
|
|
# Pandoc supports C, ruby, xml, bison, lex, markdown and makefile languages, but doesn't meson.
|
|
|
|
#
|
|
|
|
# After a markdown file is converted to a latex file, listings package is used by lualatex to convert it to a pdf file.
|
|
|
|
# Listings package supports only C, ruby, xml and make.
|
|
|
|
# Bison, lex, markdown and meson aren't supported.
|
|
|
|
|
2021-04-27 14:08:30 +02:00
|
|
|
# file_table contains paths of source, GFM, html and latex.
|
|
|
|
# It is possible to get the relationship between source file and created GFM/html/latex file.
|
|
|
|
|
|
|
|
# type is "gfm", "html" or "latex".
|
|
|
|
# Caller can specify the target type.
|
|
|
|
|
|
|
|
def src2md srcmd, md, file_table=nil, type="gfm"
|
2021-02-08 14:24:54 +01:00
|
|
|
# parameters:
|
|
|
|
# srcmd: .src.md file's path. source
|
|
|
|
# md: .md file's path. destination
|
2020-12-21 13:12:05 +01:00
|
|
|
src_buf = IO.readlines srcmd
|
|
|
|
src_dir = File.dirname srcmd
|
2021-01-11 03:15:04 +01:00
|
|
|
md_dir = File.dirname md
|
2021-03-12 06:45:24 +01:00
|
|
|
type_dir = File.basename md_dir # type of the target. gfm, html or latex
|
|
|
|
if type_dir == "gfm" || type_dir == "html" || type_dir == "latex"
|
|
|
|
type = type_dir
|
|
|
|
end
|
2021-01-11 03:15:04 +01:00
|
|
|
|
2021-03-03 15:45:54 +01:00
|
|
|
# phase 1
|
|
|
|
# @@@if - @@@elif - @@@else - @@@end
|
|
|
|
md_buf = []
|
|
|
|
if_stat = 0
|
|
|
|
src_buf.each do |line|
|
|
|
|
if line =~ /^@@@if *(\w+)/ && if_stat == 0
|
|
|
|
if_stat = type == $1 ? 1 : -1
|
|
|
|
elsif line =~ /^@@@elif *(\w+)/
|
|
|
|
if if_stat == 1
|
|
|
|
if_stat = -2
|
|
|
|
elsif if_stat == -1
|
|
|
|
if_stat = type == $1 ? 3 : -3
|
|
|
|
elsif if_stat == -2
|
|
|
|
# if_stat is kept to be -2
|
|
|
|
elsif if_stat == 3
|
|
|
|
if_stat = -2
|
|
|
|
elsif if_stat == -3
|
|
|
|
if_stat = type == $1 ? 3 : -3
|
|
|
|
end
|
|
|
|
elsif line =~ /^@@@else/
|
|
|
|
if if_stat == 1
|
|
|
|
if_stat = -2
|
|
|
|
elsif if_stat == -1
|
|
|
|
if_stat = 2
|
|
|
|
elsif if_stat == -2
|
|
|
|
# if_stat is kept to be -2
|
|
|
|
elsif if_stat == 3
|
|
|
|
if_stat = -2
|
|
|
|
elsif if_stat == -3
|
|
|
|
if_stat = 2
|
|
|
|
end
|
|
|
|
elsif line =~ /^@@@end/
|
|
|
|
if_stat = 0
|
|
|
|
elsif if_stat >= 0
|
|
|
|
md_buf << line
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
# phase 2
|
|
|
|
# @@@include and @@@shell
|
|
|
|
src_buf = md_buf
|
2020-12-21 13:12:05 +01:00
|
|
|
md_buf = []
|
2021-02-08 14:24:54 +01:00
|
|
|
include_flag = ""
|
|
|
|
shell_flag = false
|
2020-12-21 13:12:05 +01:00
|
|
|
src_buf.each do |line|
|
2021-02-08 14:24:54 +01:00
|
|
|
if include_flag == "-N" || include_flag == "-n"
|
|
|
|
if line == "@@@\n"
|
2021-03-03 15:45:54 +01:00
|
|
|
include_flag = ""
|
|
|
|
elsif line =~ /^\s*(\S*)\s*(.*)$/
|
2021-02-08 14:24:54 +01:00
|
|
|
c_file = $1
|
|
|
|
c_functions = $2.strip.split(" ")
|
|
|
|
if c_file =~ /^\// # absolute path
|
2021-02-17 15:59:50 +01:00
|
|
|
c_file_buf = File.readlines(c_file)
|
2021-02-08 14:24:54 +01:00
|
|
|
else #relative path
|
2021-02-17 15:59:50 +01:00
|
|
|
c_file_buf = File.readlines(src_dir+"/"+c_file)
|
2020-12-21 13:12:05 +01:00
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
if c_functions.empty? # no functions are specified
|
|
|
|
tmp_buf = c_file_buf
|
|
|
|
else
|
|
|
|
tmp_buf = []
|
|
|
|
spc = false
|
|
|
|
c_functions.each do |c_function|
|
|
|
|
from = c_file_buf.find_index { |line| line =~ /^#{c_function} *\(/ }
|
|
|
|
if ! from
|
2021-03-03 15:45:54 +01:00
|
|
|
warn "lib_src2md: ERROR in #{srcmd}: Didn't find #{c_function} in #{c_file}."
|
2020-12-21 13:12:05 +01:00
|
|
|
break
|
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
to = from
|
|
|
|
while to < c_file_buf.size do
|
|
|
|
if c_file_buf[to] == "}\n"
|
|
|
|
break
|
|
|
|
end
|
|
|
|
to += 1
|
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
if to >= c_file_buf.size
|
|
|
|
warn "lib_src2md: ERROR in #{srcmd}: function #{c_function} didn't end in #{c_file}."
|
|
|
|
break
|
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
n = from-1
|
|
|
|
if spc
|
|
|
|
tmp_buf << "\n"
|
|
|
|
else
|
|
|
|
spc = true
|
|
|
|
end
|
|
|
|
while n <= to do
|
|
|
|
tmp_buf << c_file_buf[n]
|
|
|
|
n += 1
|
|
|
|
end
|
2020-12-21 13:12:05 +01:00
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
if type == "gfm"
|
|
|
|
md_buf << "~~~#{lang(c_file, "gfm")}\n"
|
|
|
|
elsif type == "html"
|
|
|
|
language = lang(c_file, "pandoc")
|
|
|
|
if include_flag == "-n"
|
|
|
|
if language != ""
|
|
|
|
md_buf << "~~~{.#{language} .numberLines}\n"
|
|
|
|
else
|
|
|
|
md_buf << "~~~{.numberLines}\n"
|
|
|
|
end
|
|
|
|
else
|
|
|
|
if lang(c_file, "pandoc") != ""
|
|
|
|
md_buf << "~~~{.#{language}}\n"
|
|
|
|
else
|
|
|
|
md_buf << "~~~\n"
|
|
|
|
end
|
|
|
|
end
|
|
|
|
elsif type =="latex"
|
|
|
|
language = lang(c_file, "pandoc")
|
|
|
|
if include_flag == "-n"
|
|
|
|
if language == "C" || language == "ruby" || language == "xml" || language == "makefile"
|
|
|
|
md_buf << "~~~{.#{language} .numberLines}\n"
|
|
|
|
else
|
|
|
|
md_buf << "~~~{.numberLines}\n"
|
|
|
|
end
|
|
|
|
else
|
|
|
|
if language == "C" || language == "ruby" || language == "xml" || language == "makefile"
|
|
|
|
md_buf << "~~~{.#{language}}\n"
|
|
|
|
else
|
|
|
|
md_buf << "~~~\n"
|
|
|
|
end
|
|
|
|
end
|
2021-03-12 06:45:24 +01:00
|
|
|
else
|
|
|
|
md_buf << "~~~\n"
|
2021-03-03 15:45:54 +01:00
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
ln_width = tmp_buf.size.to_s.length
|
|
|
|
n = 1
|
|
|
|
tmp_buf.each do |l|
|
2021-03-03 15:45:54 +01:00
|
|
|
if type == "gfm" && include_flag == "-n"
|
2021-02-08 14:24:54 +01:00
|
|
|
l = sprintf("%#{ln_width}d %s", n, l)
|
2020-12-21 13:12:05 +01:00
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
md_buf << l
|
2021-02-08 14:24:54 +01:00
|
|
|
n += 1
|
2020-12-21 13:12:05 +01:00
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
md_buf << "~~~\n"
|
2020-12-21 13:12:05 +01:00
|
|
|
end
|
2021-02-08 14:24:54 +01:00
|
|
|
elsif shell_flag
|
|
|
|
if line == "@@@\n"
|
2021-03-03 15:45:54 +01:00
|
|
|
md_buf << "~~~\n"
|
2021-02-08 14:24:54 +01:00
|
|
|
shell_flag = false
|
|
|
|
else
|
2021-03-03 15:45:54 +01:00
|
|
|
md_buf << "$ #{line}"
|
2021-02-08 14:24:54 +01:00
|
|
|
`cd #{src_dir}; #{line.chomp}`.each_line do |l|
|
2021-03-03 15:45:54 +01:00
|
|
|
md_buf << l
|
2021-02-08 14:24:54 +01:00
|
|
|
end
|
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
elsif line == "@@@include\n" || line =~ /^@@@include *-n/
|
|
|
|
include_flag = "-n"
|
|
|
|
elsif line =~ /^@@@include *-N/
|
|
|
|
include_flag = "-N"
|
|
|
|
elsif line == "@@@shell\n"
|
|
|
|
md_buf << "~~~\n"
|
|
|
|
shell_flag = true
|
|
|
|
else
|
2021-04-27 14:08:30 +02:00
|
|
|
line = change_rel_link(line, src_dir, md_dir, file_table, type)
|
2021-03-03 15:45:54 +01:00
|
|
|
if type == "latex" # remove relative link
|
2021-04-22 04:48:18 +02:00
|
|
|
if ! (line =~ /\[[^\]]*\]\(http[^)]*\)/)
|
|
|
|
line.gsub!(/^([^!]*)\[([^\]]*)\]\([^\)]*\)/,"\\1\\2")
|
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
else # type == "gfm" or "html", then remove size option from link to image files.
|
|
|
|
line.gsub!(/(!\[[^\]]*\]\([^\)]*\)) *{width *= *\d*(|\.\d*)cm *height *= *\d*(|\.\d*)cm}/,"\\1")
|
2021-01-11 03:15:04 +01:00
|
|
|
end
|
2021-03-03 15:45:54 +01:00
|
|
|
md_buf << line
|
2021-01-11 03:15:04 +01:00
|
|
|
end
|
|
|
|
end
|
2020-12-21 13:12:05 +01:00
|
|
|
IO.write(md,md_buf.join)
|
|
|
|
end
|
|
|
|
|
2021-01-25 10:35:49 +01:00
|
|
|
# Change the base of relative links from org_dir to new_dir
|
2021-04-27 14:08:30 +02:00
|
|
|
def change_rel_link line, org_dir, new_dir, file_table=nil, type="gfm"
|
|
|
|
i = [nil, "gfm", "html", "latex"].find_index(type)
|
|
|
|
raise "Illegal type (#{type}).\n" unless i == 1 || i == 2 || i == 3
|
2021-01-25 10:35:49 +01:00
|
|
|
p_new_dir = Pathname.new new_dir
|
2021-01-11 03:15:04 +01:00
|
|
|
left = ""
|
|
|
|
right = line
|
2021-01-24 08:50:52 +01:00
|
|
|
while right =~ /(!?\[[^\]]*\])\(([^\)]*)\)/
|
2021-02-06 09:26:57 +01:00
|
|
|
left += $`
|
2021-01-11 03:15:04 +01:00
|
|
|
right = $'
|
|
|
|
name = $1
|
|
|
|
link = $2
|
2021-04-27 14:08:30 +02:00
|
|
|
if file_table
|
|
|
|
file_table.each do |tbl|
|
|
|
|
if tbl[0] == link
|
|
|
|
link = tbl[i]
|
|
|
|
break
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
if ! (link =~ /^(http|\/)/)
|
2021-01-25 10:35:49 +01:00
|
|
|
p_link = Pathname.new "#{org_dir}/#{link}"
|
|
|
|
link = p_link.relative_path_from(p_new_dir).to_s
|
2021-01-11 03:15:04 +01:00
|
|
|
end
|
|
|
|
left += "#{name}(#{link})"
|
|
|
|
end
|
|
|
|
left + right
|
|
|
|
end
|
|
|
|
|
2021-03-03 15:45:54 +01:00
|
|
|
def lang file, type_of_md
|
2021-01-25 10:35:49 +01:00
|
|
|
tbl = {".c" => "C", ".h" => "C", ".rb" => "ruby", ".xml" => "xml", ".ui" => "xml",
|
|
|
|
".y" => "bison", ".lex" => "lex", ".build" => "meson", ".md" => "markdown" }
|
|
|
|
name = File.basename file
|
|
|
|
if name == "Makefile"
|
|
|
|
return "makefile"
|
|
|
|
elsif name == "Rakefile"
|
|
|
|
return "ruby"
|
|
|
|
else
|
|
|
|
suffix = File.extname name
|
|
|
|
tbl.each do |key, val|
|
|
|
|
if suffix == key
|
2021-03-03 15:45:54 +01:00
|
|
|
return val if type_of_md == "gfm"
|
|
|
|
return val if type_of_md == "pandoc" && val != "meson"
|
2021-01-25 10:35:49 +01:00
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
return ""
|
|
|
|
end
|