gh-md-toc 6.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229
  1. #!/usr/bin/env bash
  2. #
  3. # Steps:
  4. #
  5. # 1. Download corresponding html file for some README.md:
  6. # curl -s $1
  7. #
  8. # 2. Discard rows where no substring 'user-content-' (github's markup):
  9. # awk '/user-content-/ { ...
  10. #
  11. # 3.1 Get last number in each row like ' ... </span></a>sitemap.js</h1'.
  12. # It's a level of the current header:
  13. # substr($0, length($0), 1)
  14. #
  15. # 3.2 Get level from 3.1 and insert corresponding number of spaces before '*':
  16. # sprintf("%*s", substr($0, length($0), 1)*3, " ")
  17. #
  18. # 4. Find head's text and insert it inside "* [ ... ]":
  19. # substr($0, match($0, /a>.*<\/h/)+2, RLENGTH-5)
  20. #
  21. # 5. Find anchor and insert it inside "(...)":
  22. # substr($0, match($0, "href=\"[^\"]+?\" ")+6, RLENGTH-8)
  23. #
  24. gh_toc_version="0.5.0"
  25. gh_user_agent="gh-md-toc v$gh_toc_version"
  26. #
  27. # Download rendered into html README.md by its url.
  28. #
  29. #
  30. gh_toc_load() {
  31. local gh_url=$1
  32. if type curl &>/dev/null; then
  33. curl --user-agent "$gh_user_agent" -s "$gh_url"
  34. elif type wget &>/dev/null; then
  35. wget --user-agent="$gh_user_agent" -qO- "$gh_url"
  36. else
  37. echo "Please, install 'curl' or 'wget' and try again."
  38. exit 1
  39. fi
  40. }
  41. #
  42. # Converts local md file into html by GitHub
  43. #
  44. # ➥ curl -X POST --data '{"text": "Hello world github/linguist#1 **cool**, and #1!"}' https://api.github.com/markdown
  45. # <p>Hello world github/linguist#1 <strong>cool</strong>, and #1!</p>'"
  46. gh_toc_md2html() {
  47. local gh_file_md=$1
  48. URL=https://api.github.com/markdown/raw
  49. TOKEN="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)/token.txt"
  50. if [ -f "$TOKEN" ]; then
  51. URL="$URL?access_token=$(cat $TOKEN)"
  52. fi
  53. curl -s --user-agent "$gh_user_agent" \
  54. --data-binary @"$gh_file_md" -H "Content-Type:text/plain" \
  55. $URL
  56. }
  57. #
  58. # Is passed string url
  59. #
  60. gh_is_url() {
  61. case $1 in
  62. https* | http*)
  63. echo "yes";;
  64. *)
  65. echo "no";;
  66. esac
  67. }
  68. #
  69. # TOC generator
  70. #
  71. gh_toc(){
  72. local gh_src=$1
  73. local gh_src_copy=$1
  74. local gh_ttl_docs=$2
  75. local need_replace=$3
  76. if [ "$gh_src" = "" ]; then
  77. echo "Please, enter URL or local path for a README.md"
  78. exit 1
  79. fi
  80. # Show "TOC" string only if working with one document
  81. if [ "$gh_ttl_docs" = "1" ]; then
  82. echo "Table of Contents"
  83. echo "================="
  84. echo ""
  85. gh_src_copy=""
  86. fi
  87. if [ "$(gh_is_url "$gh_src")" == "yes" ]; then
  88. gh_toc_load "$gh_src" | gh_toc_grab "$gh_src_copy"
  89. if [ "$need_replace" = "yes" ]; then
  90. echo
  91. echo "!! '$gh_src' is not a local file"
  92. echo "!! Can't insert the TOC into it."
  93. echo
  94. fi
  95. else
  96. local toc=`gh_toc_md2html "$gh_src" | gh_toc_grab "$gh_src_copy"`
  97. echo "$toc"
  98. if [ "$need_replace" = "yes" ]; then
  99. local ts="<\!--ts-->"
  100. local te="<\!--te-->"
  101. local dt=`date +'%F_%H%M%S'`
  102. local ext=".orig.${dt}"
  103. local toc_path="${gh_src}.toc.${dt}"
  104. local toc_footer="<!-- Added by: `whoami`, at: `date --iso-8601='minutes'` -->"
  105. # http://fahdshariff.blogspot.ru/2012/12/sed-mutli-line-replacement-between-two.html
  106. # clear old TOC
  107. sed -i${ext} "/${ts}/,/${te}/{//!d;}" "$gh_src"
  108. # create toc file
  109. echo "${toc}" > "${toc_path}"
  110. echo -e "\n${toc_footer}\n" >> "$toc_path"
  111. # insert toc file
  112. if [[ "`uname`" == "Darwin" ]]; then
  113. sed -i "" "/${ts}/r ${toc_path}" "$gh_src"
  114. else
  115. sed -i "/${ts}/r ${toc_path}" "$gh_src"
  116. fi
  117. echo
  118. echo "!! TOC was added into: '$gh_src'"
  119. echo "!! Origin version of the file: '${gh_src}${ext}'"
  120. echo "!! TOC added into a separate file: '${toc_path}'"
  121. echo
  122. fi
  123. fi
  124. }
  125. #
  126. # Grabber of the TOC from rendered html
  127. #
  128. # $1 — a source url of document.
  129. # It's need if TOC is generated for multiple documents.
  130. #
  131. gh_toc_grab() {
  132. # if closed <h[1-6]> is on the new line, then move it on the prev line
  133. # for example:
  134. # was: The command <code>foo1</code>
  135. # </h1>
  136. # became: The command <code>foo1</code></h1>
  137. sed -e ':a' -e 'N' -e '$!ba' -e 's/\n<\/h/<\/h/g' |
  138. # find strings that corresponds to template
  139. grep -E -o '<a.*id="user-content-[^"]*".*</h[1-6]' |
  140. # remove code tags
  141. sed 's/<code>//' | sed 's/<\/code>//' |
  142. # now all rows are like:
  143. # <a id="user-content-..." href="..."><span ...></span></a> ... </h1
  144. # format result line
  145. # * $0 — whole string
  146. echo -e "$(awk -v "gh_url=$1" '{
  147. print sprintf("%*s", substr($0, length($0), 1)*3, " ") "* [" substr($0, match($0, /a>.*<\/h/)+2, RLENGTH-5)"](" gh_url substr($0, match($0, "href=\"[^\"]+?\" ")+6, RLENGTH-8) ")"}' | sed 'y/+/ /; s/%/\\x/g')"
  148. }
  149. #
  150. # Returns filename only from full path or url
  151. #
  152. gh_toc_get_filename() {
  153. echo "${1##*/}"
  154. }
  155. #
  156. # Options hendlers
  157. #
  158. gh_toc_app() {
  159. local app_name="gh-md-toc"
  160. local need_replace="no"
  161. if [ "$1" = '--help' ] || [ $# -eq 0 ] ; then
  162. echo "GitHub TOC generator ($app_name): $gh_toc_version"
  163. echo ""
  164. echo "Usage:"
  165. echo " $app_name [--insert] src [src] Create TOC for a README file (url or local path)"
  166. echo " $app_name - Create TOC for markdown from STDIN"
  167. echo " $app_name --help Show help"
  168. echo " $app_name --version Show version"
  169. return
  170. fi
  171. if [ "$1" = '--version' ]; then
  172. echo "$gh_toc_version"
  173. return
  174. fi
  175. if [ "$1" = "-" ]; then
  176. if [ -z "$TMPDIR" ]; then
  177. TMPDIR="/tmp"
  178. elif [ -n "$TMPDIR" -a ! -d "$TMPDIR" ]; then
  179. mkdir -p "$TMPDIR"
  180. fi
  181. local gh_tmp_md
  182. gh_tmp_md=$(mktemp $TMPDIR/tmp.XXXXXX)
  183. while read input; do
  184. echo "$input" >> "$gh_tmp_md"
  185. done
  186. gh_toc_md2html "$gh_tmp_md" | gh_toc_grab ""
  187. return
  188. fi
  189. if [ "$1" = '--insert' ]; then
  190. need_replace="yes"
  191. shift
  192. fi
  193. for md in "$@"
  194. do
  195. echo ""
  196. gh_toc "$md" "$#" "$need_replace"
  197. done
  198. echo ""
  199. echo "Created by [gh-md-toc](https://github.com/ekalinin/github-markdown-toc)"
  200. }
  201. #
  202. # Entry point
  203. #
  204. gh_toc_app "$@"