#!/usr/bin/env tclsh
# string.tcl --
#
#	Utilities for manipulating strings, words, single lines,
#	paragraphs, ...
#
# Copyright (c) 2000 by Ajuba Solutions.
# Copyright (c) 2000 by Eric Melski
# Copyright (c) 2002 by Joe English
# Copyright (c) 2001-2014 by Andreas Kupries
#
# See the file "license.terms" for information on usage and redistribution
# of this file, and for a DISCLAIMER OF ALL WARRANTIES.
#
# RCS: @(#) $Id: string.tcl,v 1.2 2008/03/22 16:03:11 mic42 Exp $

# ### ### ### ######### ######### #########
## Requirements

package require Tcl 8.2

namespace eval ::textutil::string {}

# ### ### ### ######### ######### #########
## API implementation

# @c Removes the last character from the given string.
#
# @a string: The string to manipulate.
#
# @r The string without its last character. An empty or
# @r one-character string yields the empty string.
#
# @i chopping

proc ::textutil::string::chop {string} {
    # The last index to keep is length-2; for strings shorter than two
    # characters this is negative and [string range] returns "".
    return [string range $string 0 [expr {[string length $string]-2}]]
}

# @c Removes the first character from the given string.
# @c Convenience procedure.
#
# @a string: string to manipulate.
#
# @r The string without its first character.
#
# @i tail

proc ::textutil::string::tail {string} {
    return [string range $string 1 end]
}

# @c Capitalizes first character of the given string.
# @c Complementary procedure to the un-capitalizing procedure.
#
# @a string: string to manipulate.
#
# @r The string with its first character capitalized.
# @r All other characters are returned unchanged.
#
# @i capitalize

proc ::textutil::string::cap {string} {
    return [string toupper [string index $string 0]][string range $string 1 end]
}

# @c unCapitalizes first character of the given string.
# @c Complementary procedure to
# NOTE(review): the remainder of this comment and the procedure it
# documents are missing from this copy of the file.

" incr index } {^[ ]{0,3}#{1,6}} { # ATX STYLE HEADINGS set h_level 0 set h_result {} while {$index < $no_lines && ![is_empty_line $line]} { incr index if {!$h_level} { regexp {^\s*#+} $line m set h_level [string length [string trim $m]] } lappend h_result $line set line [lindex $lines $index] } set h_result [\ parse_inline [\ regsub -all {^\s*#+\s*|\s*#+\s*$} [join $h_result \n] {} \ ]\ ] append result "$h_result" } {^[ ]{0,3}\>} { # BLOCK QUOTES set bq_result {} while {$index < $no_lines} { incr index lappend bq_result [regsub {^[ ]{0,3}\>[ ]?} $line {}] if {[is_empty_line [lindex $lines $index]]} { set eoq 0 for {set peek $index} {$peek < $no_lines} {incr peek} { set line [lindex $lines $peek] if {![is_empty_line $line]} { if {![regexp {^[ ]{0,3}\>} $line]} { set eoq 1 } break } } if {$eoq} { break } } set line [lindex $lines $index] } set bq_result [string trim [join $bq_result \n]] append result

\n \ [apply_templates bq_result] \ \n

} {^\s{4,}\S+} { # CODE BLOCKS set code_result {} while {$index < $no_lines} { incr index lappend code_result [html_escape [\ regsub {^ } $line {}]\ ] set eoc 0 for {set peek $index} {$peek < $no_lines} {incr peek} { set line [lindex $lines $peek] if {![is_empty_line $line]} { if {![regexp {^\s{4,}} $line]} { set eoc 1 } break } } if {$eoc} { break } set line [lindex $lines $index] } set code_result [join $code_result \n] append result

 $code_result \n

} {^(?:(?:`{3,})|(?:~{3,}))\{?(\S+)?\}?\s*$} { # FENCED CODE BLOCKS set code_result {} if {[string index $line 0] eq {`}} { set end_match {^`{3,}\s*$} } else { set end_match {^~{3,}\s*$} } # # A language specifier might be provided # immediately after the leading delimiters. # # ```tcl # # The language specifier is used for two purposes: # a) As a CSS class name # (useful e.g. for highlight.js) # b) As a name for a source code to HTML converter. # When such a converter is registered, # the codeblock will be sent through this converter. # set lang_specifier [string tolower [lindex $matches end]] if {$lang_specifier ne ""} { set code_CCS_class " class='$lang_specifier'" incr ::Markdown::lang_counter($lang_specifier) } else { set code_CCS_class "" } while {$index < $no_lines} { incr index set line [lindex $lines $index] if {[regexp $end_match $line]} { incr index break } lappend code_result $line } set code_result [join $code_result \n] # # If there is a converter registered, apply it on # the resulting snippet. # if {[info exists ::Markdown::converter($lang_specifier)]} { set code_result [{*}$::Markdown::converter($lang_specifier) $code_result] } else { set code_result [html_escape $code_result] } append result \ "

" \
			 \
			$code_result \

} {^[ ]{0,3}(?:\*|-|\+) |^[ ]{0,3}\d+\. } { # LISTS set list_result {} # continue matching same list type if {[regexp $ol_match $line]} { set list_type ol set list_match $ol_match } else { set list_type ul set list_match $ul_match } set last_line AAA while {$index < $no_lines} \ { if {![regexp $list_match [lindex $lines $index]]} { break } set item_result {} set in_p 1 set p_count 1 if {[is_empty_line $last_line]} { incr p_count } set last_line $line set line [regsub "$list_match\\s*" $line {}] # prevent recursion on same line set line [regsub {\A(\d+)\.(\s+)} $line {\1\\.\2}] set line [regsub {\A(\*|\+|-)(\s+)} $line {\\\1\2}] lappend item_result $line for {set peek [expr $index + 1]} {$peek < $no_lines} {incr peek} { set line [lindex $lines $peek] if {[is_empty_line $line]} { set in_p 0 }\ elseif {[regexp {^ } $line]} { if {!$in_p} { incr p_count } set in_p 1 }\ elseif {[regexp $list_match $line]} { if {!$in_p} { incr p_count } break }\ elseif {!$in_p} { break } set last_line $line lappend item_result [regsub {^ } $line {}] } set item_result [join $item_result \n] if {$p_count > 1} { set item_result [apply_templates item_result li] } else { if {[regexp -lineanchor \ {(\A.*?)((?:^[ ]{0,3}(?:\*|-|\+) |^[ ]{0,3}\d+\. ).*\Z)} \ $item_result \ match para rest]} \ { set item_result [parse_inline $para] append item_result [apply_templates rest] } else { set item_result [parse_inline $item_result] } } lappend list_result "

$item_result

" set index $peek } append result <$list_type>\n \ [join $list_result \n] \ \n\n } {^<(?:p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|script|noscript|form|fieldset|iframe|math|ins|del)} { # HTML BLOCKS set re_htmltag {<(/?)(\w+)(?:\s+\w+=(?:\"[^\"]+\"|'[^']+'))*\s*>} set buffer {} while {$index < $no_lines} \ { while {$index < $no_lines} \ { incr index append buffer $line \n if {[is_empty_line $line]} { break } set line [lindex $lines $index] } set tags [regexp -inline -all $re_htmltag $buffer] set stack_count 0 foreach {match type name} $tags { if {$type eq {}} { incr stack_count +1 } else { incr stack_count -1 } } if {$stack_count == 0} { break } } append result $buffer } {(?:^\s{0,3}|[^\\]+)\|} { # SIMPLE TABLES set cell_align {} set row_count 0 while {$index < $no_lines} \ { # insert a space between || to handle empty cells set row_cols [regexp -inline -all {(?:[^|]|\\\|)+} \ [regsub -all {\|(?=\|)} [string trim $line] {| }] \ ] if {$row_count == 0} \ { set sep_cols [lindex $lines [expr $index + 1]] # check if we have a separator row if {[regexp {^\s{0,3}\|?(?:\s*:?-+:?(?:\s*$|\s*\|))+} $sep_cols]} \ { set sep_cols [regexp -inline -all {(?:[^|]|\\\|)+} \ [string trim $sep_cols]] foreach {cell_data} $sep_cols \ { switch -regexp $cell_data { {:-*:} { lappend cell_align center } {:-+} { lappend cell_align left } {-+:} { lappend cell_align right } default { lappend cell_align {} } } } incr index } append result "\n" append result "\n" append result " \n" if {$cell_align ne {}} { set num_cols [llength $cell_align] } else { set num_cols [llength $row_cols] } for {set i 0} {$i < $num_cols} {incr i} \ { if {[set align [lindex $cell_align $i]] ne {}} { append result " "\n" } append result " \n" append result "\n" } else { if {$row_count == 1} { append result "\n" } append result " \n" if {$cell_align ne {}} { set num_cols [llength $cell_align] } else { set num_cols [llength $row_cols] } for {set i 0} {$i < $num_cols} {incr i} \ { if {[set align [lindex $cell_align $i]] ne 
{}} { append result " "\n" } append result " \n" } incr row_count set line [lindex $lines [incr index]] if {![regexp {(?:^\s{0,3}|[^\\]+)\|} $line]} { switch $row_count { 1 { append result "

" } else { append result "	" } append result [parse_inline [string trim \ [lindex $row_cols $i]]]
" } else { append result "	" } append result [parse_inline [string trim \ [lindex $row_cols $i]]]

\n" } default { append result "\n" append result "\n" } } break } } } default { # PARAGRAPHS AND SETTEXT STYLE HEADERS set p_type p set p_result {} while {($index < $no_lines) && ![is_empty_line $line]} \ { incr index switch -regexp $line { {^[ ]{0,3}=+$} { set p_type h1 break } {^[ ]{0,3}-+$} { set p_type h2 break } {^[ ]{0,3}(?:\*|-|\+) |^[ ]{0,3}\d+\. } { if {$parent eq {li}} { incr index -1 break } else { lappend p_result $line } } {^[ ]{0,3}-[ ]*-[ ]*-[- ]*$} - {^[ ]{0,3}_[ ]*_[ ]*_[_ ]*$} - {^[ ]{0,3}\*[ ]*\*[ ]*\*[\* ]*$} - {^[ ]{0,3}#{1,6}} \ { incr index -1 break } default { lappend p_result $line } } set line [lindex $lines $index] } set p_result [\ parse_inline [\ string trim [join $p_result \n]\ ]\ ] if {[is_empty_line [regsub -all {} $p_result {}]]} { # Do not make a new paragraph for just comments. append result $p_result } else { append result "<$p_type>$p_result" } } } } return $result } ## \private proc parse_inline {text} { set text [regsub -all -lineanchor {[ ]{2,}$} $text
] set index 0 set result {} set re_backticks {\A`+} set re_whitespace {\s} set re_inlinelink {\A\!?\[((?:[^\]]|\[[^\]]*?\])+)\]\s*$\s*((?:[^\s$]+|$[^\s$]+\))+)?(\s+([\"'])(.*)?\4)?\s*\)} set re_reflink {\A\!?\[((?:[^\]]|\[[^\]]*?\])+)\](?:\s*\[((?:[^\]]|\[[^\]]*?\])*)\])?} set re_htmltag {\A|\A<\w+(?:\s+\w+=(?:\"[^\"]+\"|\'[^\']+\'))*\s*/?>} set re_autolink {\A<(?:(\S+@\S+)|(\S+://\S+))>} set re_comment {\A} set re_entity {\A\&\S+;} while {[set chr [string index $text $index]] ne {}} { switch $chr { "\\" { # ESCAPES set next_chr [string index $text [expr $index + 1]] if {[string first $next_chr {\`*_\{\}[]()#+-.!>|}] != -1} { set chr $next_chr incr index } } {_} - {*} { # EMPHASIS if {[regexp $re_whitespace [string index $result end]] && [regexp $re_whitespace [string index $text [expr $index + 1]]]} \ { #do nothing } \ elseif {[regexp -start $index \ "\\A(\\$chr{1,3})((?:\[^\\$chr\\\\]|\\\\\\$chr)*)\\1" \ $text m del sub]} \ { switch [string length $del] { 1 { append result "[parse_inline $sub]" } 2 { append result "[parse_inline $sub]" } 3 { append result "[parse_inline $sub]" } } incr index [string length $m] continue } } {`} { # CODE regexp -start $index $re_backticks $text m set start [expr $index + [string length $m]] if {[regexp -start $start -indices $m $text m]} { set stop [expr [lindex $m 0] - 1] set sub [string trim [string range $text $start $stop]] append result "[html_escape $sub]" set index [expr [lindex $m 1] + 1] continue } } {!} - {[} { # LINKS AND IMAGES if {$chr eq {!}} { set ref_type img } else { set ref_type link } set match_found 0 if {[regexp -start $index $re_inlinelink $text m txt url ign del title]} { # INLINE incr index [string length $m] set url [html_escape [string trim $url {<> }]] set txt [parse_inline $txt] set title [parse_inline $title] set match_found 1 } elseif {[regexp -start $index $re_reflink $text m txt lbl]} { if {$lbl eq {}} { set lbl [regsub -all {\s+} $txt { }] } set lbl [string tolower $lbl] if {[info exists 
::Markdown::_references($lbl)]} { lassign $::Markdown::_references($lbl) url title set url [html_escape [string trim $url {<> }]] set txt [parse_inline $txt] set title [parse_inline $title] # REFERENCED incr index [string length $m] set match_found 1 } } # PRINT IMG, A TAG if {$match_found} { if {$ref_type eq {link}} { if {$title ne {}} { append result "$txt" } else { append result "$txt" } } else { if {$title ne {}} { append result " $\"$txt\"$ " } else { append result " $\"$txt\"/$ " } } continue } } {<} { # HTML TAGS, COMMENTS AND AUTOLINKS if {[regexp -start $index $re_comment $text m]} { append result $m incr index [string length $m] continue } elseif {[regexp -start $index $re_autolink $text m email link]} { if {$link ne {}} { set link [html_escape $link] append result "$link" } else { set mailto_prefix "mailto:" if {![regexp "^${mailto_prefix}(.*)" $email mailto email]} { # $email does not contain the prefix "mailto:". set mailto "mailto:$email" } append result "$email" } incr index [string length $m] continue } elseif {[regexp -start $index $re_htmltag $text m]} { append result $m incr index [string length $m] continue } set chr [html_escape $chr] } {&} { # ENTITIES if {[regexp -start $index $re_entity $text m]} { append result $m incr index [string length $m] continue } set chr [html_escape $chr] } {>} - {'} - "\"" { # OTHER SPECIAL CHARACTERS set chr [html_escape $chr] } default {} } append result $chr incr index } return $result } ## \private proc is_empty_line {line} { return [regexp {^\s*$} $line] } ## \private proc html_escape {text} { return [string map {& & < < > > \" "} $text] } } package provide Markdown 1.1 ############################################################################## # # Author : Dr. Detlef Groth # Created By : Dr. 
Detlef Groth # Created : Sat Mar 7 22:17:34 2020 # Last Modified : <201109.1846> # # Description : plugin f�r mkdoc to convert Roxygen2 documention # nach Markdown # # ############################################################################## # # Copyright (c) 2020 Dr. Detlef Groth. # # # License: MIT # ############################################################################## package provide mkdoc::rox2md 0.1 namespace eval ::mkdoc {} proc ::mkdoc::rox2md {infile outfile} { set pkgname [lindex [split [file dirname $infile] "/"] end-1] set basename [file rootname [file tail [file tail $infile]]] # converts an R roxgene2 format into markdown # todo: # - html mode # - rox2html # - name tag, multiple files from same R file set filename $infile set res "" set nblock 0 set ddict [dict create] ;# all other parts set fdict [dict create] ;# first title part array set c [list title "" description "" details "" examples "" \ section "" usage "" seealso "" references "" return "" \ keywords "" param "" funcname "" alias "" args "" type ""] if [catch {open $filename r} infh] { puts stderr "Cannot open $filename: $infh" exit } else { set region "START" while {[gets $infh line] >= 0} { if {[regexp {^\s*#'.+%} $line]} { set line [regsub -all {\\%} $line "%"] } if {[regexp {^\s*#'\s+@title (.+)} $line -> title]} { incr nblock if {$nblock == 2} { set dkey [regsub {\$} $c(funcname) "_"] foreach key [array names c] { dict set fdict $dkey $key $c($key) set c($key) "" } } elseif {$nblock > 2} { set dkey [regsub {\$} $c(funcname) "_"] foreach key [array names c] { dict set ddict $dkey $key $c($key) set c($key) "" } } append c(title) "$title\n" #puts $out "# $title" set region TITLE } elseif {[regexp {^\s*#'\s+@description (.+)} $line -> descr]} { set region DESCRIPTION #puts $out "\n## DESCRIPTION\n\n> $descr" append c(description) "$descr\n" } elseif {[regexp {^\s*#'\s+@section\s+Details:(.*)} $line -> det]} { set region DETAILS #puts $out "\n## DETAILS\n\n> $det" append 
c(details) "$det\n" } elseif {[regexp {^\s*#'\s+@details (.*)} $line -> det]} { set region DETAILS #puts $out "\n## DETAILS\n\n> $det" append c(details) "$det\n" } elseif {[regexp {^\s*#'\s+@section (.*):} $line -> section]} { set region SECTION #puts $out "\n## [string toupper $section]\n\n" append c(section) "\n## [string toupper $section]\n\n" } elseif {[regexp {^\s*#'\s+@usage (.+)} $line -> txt]} { set region USAGE #puts $out "\n## USAGE\n\n> $txt" append c(usage) " $txt\n" } elseif {[regexp {^\s*#'\s+@(return|format) (.*)} $line -> flag text]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" } set region RETURN #puts $out "\n## VALUE\n\n> $txt" append c(return) "- $text\n" } elseif {[regexp {^\s*#'\s+@references *(.*)} $line -> txt]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" } set region REFERENCES #puts $out "\n## REFERENCES\n\n> $txt" append c(references) "$txt\n" } elseif {[regexp {^\s*#'\s+@seealso\s*(.*)} $line -> txt]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" } set region SEEALSO #puts $out "\n## SEE ALSO\n\n> $txt" append c(seealso) "$txt\n" } elseif {[regexp {^\s*#'\s+@keywords\s*(.*)} $line -> txt]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" } set region KEYWORDS #puts $out "\n## KEYWORDS\n\n> $txt" append c(keywords) "\n## KEYWORDS\n\n> $txt\n" } elseif {[regexp {^\s*#'\s+@examples\s*(.*)} $line -> txt]} { set region EXAMPLES #puts $out "\n## EXAMPLES\n\n```$txt" append c(examples) "```$txt\n" } elseif {[regexp {^\s*#'\s+@author\s*(.*)} $line -> txt]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" } set region AUTHORS #puts $out "\n## AUTHORS\n\n> $txt" append c(author) "$txt\n" } elseif {[regexp {^\s*#'\s+@param\s+([^\s]+)\s(.+)} $line -> param descr]} { if {$region ne "PARAM"} { set region PARAM #puts $out "\n*ARGUMENTS*\n> " } #puts $out "- *$param*: $descr" append c(param) "- *$param*: $descr\n" 
} elseif {[regexp {\s*#'\s+@([a-z]+)} $line -> txt]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" set region [string toupper $txt] } # puts $out "$txt" } elseif {[regexp {\s*#'\s+\\(describe|enumerate)} $line -> reg]} { set iregion $reg set sec [string tolower $region] append c($sec) "\n" continue } elseif {[regexp {\s*#' \}\s*$} $line] || [regexp {\s*#'\s+\\dontrun} $line]} { # skip dontrun finish regions etc continue } elseif {[regexp {\s*#'\s+\\item{(.+)}{(.+)}} $line -> item text]} { set sec [string tolower $region] if {$iregion eq "enumerate"} { #puts $out "1. *${item}* - $text" append c($sec) "1. ${item} - $text\n" } else { #puts $out "- *${item}* - $text" append c($sec) "- ${item} - $text\n" } } elseif {[regexp {\s*#'\s+\\item\s+(.+)} $line -> text]} { set sec [string tolower $region] if {$region eq "enumerate"} { #puts $out "1. $text" append c($sec) "1. $text\n" } else { #puts $out "- $text" append c($sec) "- $text\n" } } elseif {$region eq "DETAILS" && [regexp {\s*#'\s+([A-Za-z0-9]+.+)} $line -> text]} { set sec [string tolower $region] append c($sec) "$text\n" } elseif {$region eq "DETAILS" && [regexp {\s*#'\s*$} $line]} { set sec [string tolower $region] append c($sec) "\n" } elseif {[regexp {\s*#'\s*(.+)} $line -> text]} { if {$region ne "IGNORE"} { set sec [string tolower $region] #puts $out "$text" set text [regsub -all {\\code\{([^\}]+)\}} $text "`\\1`"] append c($sec) "$text\n" } } elseif {![regexp {\s*#'} $line]} { if {$region eq "EXAMPLES"} { #puts $out "```" append c(examples) "```\n" set region START } # puts $out "$txt" } if {$region ne "START"} { if {[regexp {^([a-zA-Z][^- =<]+)\s*(=|<-)} $line -> funcname] || [regexp {^\s*(NULL)} $line -> funcname]} { if {[regexp function $line]} { set c(type) function } else { set c(type) object } if {[regexp {$(.*)$\s*\{} $line -> args]} { if {$args eq ""} { append c(args) " " } else { append c(args) $args } set region START } elseif {[regexp {$(.+)} $line -> args]} { append 
c(args) $args set region ARGS } set c(funcname) $funcname } elseif {$region eq "ARGS" && [regexp {\s+(.+)$\s*\{} $line -> args]} { append c(args) $args set region START } elseif {$region eq "ARGS" && [regexp {\s+(.+)} $line -> args]} { append c(args) $args } } } close $infh # last entry set dkey [regsub {\$} $c(funcname) "_"] if {$nblock == 0} { puts stderr "Error: No documentation with roxygen2 tags found with $infile" return } foreach key [array names c] { if {$nblock == 1} { dict set fdict $dkey $key $c($key) } elseif {$nblock > 1} { dict set ddict $dkey $key $c($key) } set c($key) "" } set keys [list title funcname description] set out [open $outfile w 0600] set key [lindex [dict keys $fdict] 0] if {[dict get [dict get $fdict $key] type] eq "function"} { set mode S3 set top false set ddict [dict merge $fdict $ddict] } else { set mode OOP set top true mkdoc::roxout $out $pkgname $basename [dict get $fdict $key] $top } set x 0 foreach key [lsort [dict keys $ddict]] { if {[incr x] == 1 && $mode eq "OOP"} { puts $out "\n\n## METHODS\n\n" } mkdoc::roxout $out $pkgname $basename [dict get $ddict $key] false } close $out } } proc ::mkdoc::roxlink { } { uplevel 1 { if {[regexp {\\link\[([^\]]+?):([^\]]+?)(_.+)\]\{(.+?)\}} $line -> pkg bname link text]} { if {$pkg eq $pkgname && $basename eq $bname} { set line [regsub -all {\\link\[[^\]]+?:([^\]]+?)\]\{(.+?)\}} $line "\[\\2](#\\1)"] } elseif {$pkg eq $pkgname} { set line [regsub -all {\\link\[.+?:(.+)\]\{(.+?)\}} $line "\[\\2](${bname}.html#\\1)"] } else { set line [regsub -all {\\link\[.+?:(.+)\]\{(.+?)\}} $line "\[\\2](../../$pkg/${bname}.html#\\1)"] } } if {[regexp {\\link\[(.+):([^-]+)-class\]\{(.+?)\}} $line -> pkg bname link text]} { if {$pkg eq $pkgname && $basename eq $bname} { #puts stderr true set line [regsub -all {\\link\[.+?:([^-]+?)-class\]\{(.+?)\}} $line "\[\\2](#\\1)"] #puts $line } elseif {$pkg eq $pkgname} { set line [regsub -all {\\link\[.+?:(.+)-class\]\{(.+?)\}} $line "\[\\2](${bname}.html)"] } 
else { set line [regsub -all {\\link\[.+?:(.+)\]\{(.+?)\}} $line "\[\\2](../../$pkg/${bname}.html#\\1)"] } } set line [regsub -all {\\link\{(https?:.+?)\}} $line "\[\\1](\\1)"] set line [regsub -all {\\link\[.+?:(.+)\]\{(.+?)\}} $line "\[\\2](#\\1)"] set line [regsub -all {\\link\{(.+?)\}} $line "\[\\1\](\\1.html)"] set line [regsub -all {\\code\{(.+?)\}} $line "`\\1`"] } } proc ::mkdoc::roxtext { } { uplevel 1 { set item "> -" foreach line [split $det "\n"] { mkdoc::roxlink if {!$top && [regexp {^\s*$} $line]} { # new list items on empty line set item "> -" } elseif {!$top && $item eq "> -"} { set line "$item $line" set line [regsub {> - - } $line "> - "] puts $out $line set item "" } else { puts $out $line } } } } proc ::mkdoc::roxout {out pkgname basename cdict {top true}} { if {$top} { puts $out "# [dict get $cdict title]" puts $out "## NAME\n" if {[dict get $cdict funcname] ne "NULL"} { puts -nonewline $out "[dict get $cdict funcname] - " } puts $out "[dict get $cdict title]\n" } else { puts $out "\n## %} [dict get $cdict funcname] "\\1pipe"] "_"] _] {}]\">[dict get $cdict funcname]\n" } if {[dict exists $cdict description]} { if {$top} { puts $out "## DESCRIPTION\n" } else { puts $out "> " } puts $out "[dict get $cdict description]\n" } if {!$top} { puts -nonewline $out "> *Usage:* \n\n > - [dict get $cdict funcname]" if {[dict get $cdict args] ne ""} { puts $out " ([dict get $cdict args])\n" } else { puts $out "\n" } } if {[dict exists $cdict param] && [dict get $cdict param] ne ""} { if {$top} { puts $out "## Arguments\n\n" } else { puts $out "\n> *Arguments:*\n> " } set par [dict get $cdict param] set par [regsub -all {\\dots} $par "..."] puts $out $par } if {[dict exists $cdict return] && [dict get $cdict return] ne ""} { if {$top} { puts $out "## VALUE\n\n" } else { puts $out "\n> *Return value:*\n> " } set det [dict get $cdict return] mkdoc::roxtext } if {[dict exists $cdict details] && [dict get $cdict details] ne ""} { if {$top} { puts $out "## 
DETAILS\n" } set det [dict get $cdict details] if {!$top} { puts -nonewline $out "\n> *Details:*\n\n" } mkdoc::roxtext } foreach k [list references seealso] { if {[dict exists $cdict $k] && [dict get $cdict $k] ne ""} { set h [regsub "seealso" $k "See also"] set h [regsub "references" $h "References"] if {$top} { puts $out "\n## [string toupper $h]\n" } else { puts -nonewline $out "\n> *${h}:*\n\n> -" } set see [dict get $cdict $k] set it "" foreach line [split $see "\n"] { if {[regexp {^\s*$} $line]} { continue } if {!$top && [regexp {^\s*$} $line]} { set it "> - " } mkdoc::roxlink #set line [regsub -all {\\link\[.+?:(.+)\]\{(.+?)\}} $line "\[\\2\](#\\1)"] #set line [regsub -all {\\link\{(.+?)\}} $line "\[\\1\](#\\1)"] set line [regsub -all {\\code\{(.+)\}} $line "\\1"] if {![regexp {^\s*$} $line]} { puts $out "$it $line" } else { puts $out "" } } } } if {[dict exists $cdict examples] && [dict get $cdict examples] ne ""} { if {$top} { puts $out "## EXAMPLES\n" puts $out [dict get $cdict examples] } else { puts $out "\n> *Examples:*\n" set ex [regsub -all {```} [dict get $cdict examples] {> ```}] puts $out $ex } } if {[dict exists $cdict author] && [dict get $cdict author] ne ""} { if {$top} { puts $out "## AUTHOR(S)\n" } else { puts $out "> *Author(s):*\n\n> " } set auths [dict get $cdict author] foreach auth [split $auths "\n"] { if {[regexp {[a-z]} $auth]} { puts $out "- $auth" } } } } #!/bin/sh # A Tcl comment, whose contents don't matter \ exec tclsh "$0" "$@" ############################################################################## # Author : Dr. Detlef Groth # Created : Fri Nov 15 10:20:22 2019 # Last Modified : <201109.1919> # # Description : Command line utility and package to extract Markdown documentation # from programming code if embedded as after comment sequence #' # manual pages and installation of Tcl files as Tcl modules. 
# Copy and adaptation of dgw/dgwutils.tcl # # History : 2019-11-08 version 0.1 # 2019-11-28 version 0.2 # 2020-02-26 version 0.3 # ############################################################################## # # Copyright (c) 2019 Dr. Detlef Groth, E-mail: detlef(at)dgroth(dot)de # # This library is free software; you can use, modify, and redistribute it # for any purpose, provided that existing copyright notices are retained # in all copies and that this notice is included verbatim in any # distributions. # # This software is distributed WITHOUT ANY WARRANTY; without even the # implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. # ############################################################################## #' #' --- #' title: mkdoc::mkdoc __PKGVERSION__ #' author: Dr. Detlef Groth, Schwielowsee, Germany #' documentclass: scrartcl #' geometry: #' - top=20mm #' - right=20mm #' - left=20mm #' - bottom=30mm #' --- #' #' ## NAME #' #' **mkdoc::mkdoc** - Tcl package and command line application to extract and format #' embedded programming documentation from source code files written in Markdown and #' optionally converts them into HTML. #' #' ## TABLE OF CONTENTS #' #' - [SYNOPSIS](#synopsis) #' - [DESCRIPTION](#description) #' - [COMMAND](#command) #' - [mkdoc::mkdoc](#mkdoc) #' - [mkdoc::run](#run) #' - [EXAMPLE](#example) #' - [BASIC FORMATTING](#format) #' - [INSTALLATION](#install) #' - [SEE ALSO](#see) #' - [CHANGES](#changes) #' - [TODO](#todo) #' - [AUTHOR](#authors) #' - [LICENSE AND COPYRIGHT](#license) #' #' ## SYNOPSIS #' #' Usage as package: #' #' ``` #' package require mkdoc::mkdoc #' mkdoc::mkdoc inputfile outputfile ?-html|-md|-pandoc -css file.css? #' ``` #' #' Usage as command line application for extraction of Markdown comments prefixed with `#'`: #' #' ``` #' mkdoc inputfile outputfile ?--html|--md|--pandoc --css file.css? 
#' ``` #' #' Usage as command line application for conversion of Markdown to HTML: #' #' ``` #' mkdoc inputfile.md outputfile.html ?--css file.css? #' ``` #' #' ## DESCRIPTION #' #' **mkdoc::mkdoc** extracts embedded Markdown documentation from source code files and as well converts Markdown output to HTML if desired. #' The documentation inside the source code must be prefixed with the `#'` character sequence. #' The file extension of the output file determines the output format. File extensions can bei either `.md` for Markdown output or `.html` for html output. The latter requires the tcllib Markdown extension to be installed. If the file extension of the inputfile is *.md* and file extension of the output files is *.html* there will be simply a conversion from a Markdown to a HTML file. #' #' The file `mkdoc.tcl` can be as well directly used as a console application. An explanation on how to do this, is given in the section [Installation](#install). #' #' ## COMMAND #' #' #' **mkdoc::mkdoc** *infile outfile ?-mode -css file.css?* #' #' > Extracts the documentation in Markdown format from *infile* and writes the documentation #' to *outfile* either in Markdown or HTML format. #' #' > - *-infile filename* - file with embedded markdown documentation #' - *-outfile filename* - name of output file extension #' - *-html* - (mode) outfile should be a html file, not needed if the outfile extension is html #' - *-md* - (mode) outfile should be a Markdown file, not needed if the outfile extension is md #' - *-pandoc* - (mode) outfile should be a pandoc Markdown file with YAML header, needed even if the outfile extension is md #' - *-css cssfile* if outfile mode is html uses the given *cssfile* #' #' > If the *-mode* flag (one of -html, -md, -pandoc) is not given, the output format is taken from the file extension of the output file, either *.html* for HTML or *.md* for Markdown format. 
This deduction from the filetype can be overwritten giving either `-html` or `-md` as command line flags. If as mode `-pandoc` is given, the Markdown markup code as well contains the YAML header. #' If infile has the extension .md than conversion to html will be performed, outfile file extension #' In this case must be .html. If output is html a *-css* flag can be given to use the given stylesheet file instead of the default style sheet embedded within the mkdoc code. #' #' > Example: #' #' > ``` #' package require mkdoc::mkdoc #' mkdoc::mkdoc mkdoc.tcl mkdoc.html #' mkdoc::mkdoc mkdoc.tcl mkdoc.rmd -md #' > ``` package require Tcl 8.4 if {[package provide Markdown] eq ""} { package require Markdown } package provide mkdoc::mkdoc 0.4 package provide mkdoc [package present mkdoc::mkdoc] namespace eval mkdoc { variable mkdocfile [info script] variable htmltemplate { $document(title) $document(style) } variable htmltitle {

$document(title)

$document(author)

$document(date)

} $line]} { set synopsis false } if {[regexp -nocase {^

.*Synopsis} $line]} { set synopsis true } if {$synopsis && [regexp {

} $line]} {
                    set line [regsub {} $line ""]
                }
                append html "$line\n"
            }
            set out [open $outfile w 0644]
            if {$extract} {
                puts $out $header
                puts $out $htmltitle
            } else {
                set header [subst -nobackslashes -nocommands $header]
                puts $out $header
            }
            puts $out $html
            puts $out "\n"
            close $out
            puts stderr "Success: file $outfile was written!"
        } elseif {$mode eq "pandoc"} {
            set out [open $outfile w 0644]
            puts $out $YAML
            puts $out $mdhtml
            close $out
            
        } else {
            set out [open $outfile w 0644]
            puts $out $mdheader
            puts $out $mdhtml
            close $out
        }
    }
}
#' 
#' 
#' **mkdoc::run** *infile* 
#' 
#' > Sources the code in *infile* and then runs the example code found in the
#'    embedded Markdown documentation of that file. Below follows an example section which can be
#'    run with `tclsh mkdoc.tcl mkdoc.tcl -run`
#' 
#' ## EXAMPLE
#' 
#' ```
#' puts "Hello mkdoc package"
#' puts "I am in the example section"
#' ```
#' 
# mkdoc::run --
#
#   Sources a Tcl file and then executes the first example code block found
#   in its embedded `#'` documentation.
#
#   The file is scanned line by line for a level-2 or level-3 Markdown
#   heading (inside a `#'` comment) whose text contains "Example"
#   (case-insensitive). The next code fence (```) opens the example; every
#   following `#'` line is collected with its `#'` prefix and one whitespace
#   character removed, until the closing fence is reached. The collected
#   code is then evaluated in the global namespace.
#
# Arguments:
#   argv    list whose first element is the name of the file to process
#
# Results:
#   None. Nothing is evaluated when no complete (opened and closed) example
#   block is found. Errors raised by the sourced file or by the example code
#   propagate to the caller. If the file cannot be opened for reading, a
#   message is written to stderr and the process exits.
proc mkdoc::run {argv} {
    set filename [lindex $argv 0]
    source $filename
    # Name of a specific demo to run; it is always empty in this procedure,
    # so the "# demo:" branch below is currently never taken.
    set extext ""
    set example false   ;# an example heading was seen, waiting for the fence
    set excode false    ;# inside the example code fence
    set code ""         ;# initialised so that an empty example block is a no-op
    set complete false  ;# the closing fence was reached
    if {[catch {open $filename r} infh]} {
        puts stderr "Cannot open $filename: $infh"
        exit
    }
    while {[gets $infh line] >= 0} {
        # `.*` (rather than `.+`) lets a plain "## Example" heading match,
        # as well as headings with text or markup before the word.
        if {$extext eq "" && [regexp -nocase \
                {^\s*#'\s+#{2,3}\s.*Example} $line]} {
            set example true
        } elseif {$extext ne "" && \
                [regexp -nocase "^\\s*#'.*\\s# demo: $extext" $line]} {
            set excode true
        } elseif {$example && [regexp {^\s*#'\s+>?\s*```} $line]} {
            # opening fence of the example block
            set example false
            set excode true
        } elseif {$excode && [regexp {^\s*#'\s+>?\s*```} $line]} {
            # closing fence: stop reading, evaluate after the file is closed
            set complete true
            break
        } elseif {$excode && [regexp {^\s*#'\s(.+)} $line -> c]} {
            append code "$c\n"
        }
    }
    # Close before evaluating, so the channel is not leaked when the example
    # code raises an error.
    close $infh
    if {$complete} {
        namespace eval :: $code
    }
    # Best-effort teardown, presumably for examples that use Tk: process idle
    # events, wait one second and destroy the root window. Any error (e.g.
    # when no `destroy` command exists) is deliberately ignored.
    catch {
        update idletasks
        after 1000
        destroy .
    }
}
# Command line entry point: only active when argv0 exists and equals the
# name of the script currently being evaluated.
if {[info exists argv0] && [info script] eq $argv0} {
    # Informational flags are handled first and end the script.
    if {[lsearch $argv {--version}] >= 0} {
        puts [package provide mkdoc::mkdoc]
        return
    }
    if {[lsearch $argv {--license}] >= 0} {
        puts "MIT License - see manual page"
        return
    }
    if {[lsearch $argv {--help}] >= 0 || [llength $argv] < 2} {
        # Usage text, emitted line by line exactly as listed.
        puts [join [list \
            "mkdoc - extract documentation in Markdown and convert it optionally into HTML" \
            "        Author/Copyright: @ Detlef Groth, Caputh, Germany, 2019-2020" \
            "        License: MIT" \
            "\nUsage:  [info script] inputfile outputfile ?--html|--md|--pandoc --version --run --css file.css?\n" \
            "     inputfile: the inputfile with embedded Markdown text after #' comments" \
            "     outputfile: should have either the extension html or md " \
            "        for automatic selection of the correct output format." \
            "        Deduction of output format can be suppressed by given mode flags:" \
            "     --html, --md or --pandoc" \
            "        --html give HTML output even if outputfile extension is not html" \
            "        --md   give Markdown output event if outputfile extension is not md" \
            "        --pandoc command line argument will emmit as well the YAML header" \
            "          header which is a Markdown extension." \
            "     --css file.css: use the given stylesheet filename instead of the" \
            "           inbuild default on" \
            "     --help: shows this help page" \
            "     --version: returns the package version" \
            "     --run: runs the example section in the inout file" \
            "  Example: extract mkdoc's own embedded documentation as html:" \
            "       tclsh mkdoc.tcl mkdoc.tcl mkdoc.html" \
        ] \n]
        #        puts "        The -rox2md flag extracts roxygen2 R documentation from R script files"
        #        puts "        and converts them into markdown"
    } elseif {[llength $argv] > 2} {
        # Everything after the two file names is handed over as one list.
        mkdoc::mkdoc [lindex $argv 0] [lindex $argv 1] [lrange $argv 2 end]
    } elseif {[lsearch $argv {--run}] == 1} {
        # Exactly two arguments with --run in second position.
        mkdoc::run $argv
    } else {
        # Exactly two arguments: input file and output file.
        mkdoc::mkdoc [lindex $argv 0] [lindex $argv 1]
    }
}

#'
#' ## BASIC FORMATTING
#' 
#' For a complete list of Markdown formatting commands consult the basic Markdown syntax at [https://daringfireball.net](https://daringfireball.net/projects/markdown/syntax). 
#' Here just the most basic essentials  to create documentation are described.
#' Please note that formatting blocks in Markdown are separated by an empty line; an empty line in this documenting mode is a line prefixed with `#'` and nothing thereafter.
#'
#' **Title and Author**
#' 
#' Title and author can be set at the beginning of the documentation in a so called YAML header. 
#' This header will be as well used by the document converter [pandoc](https://pandoc.org)  to handle various options for later processing if you extract not HTML but Markdown code from your documentation.
#'
#' A YAML header starts and ends with three hyphens. Here is the YAML header of this document:
#' 
#' ```
#' #' ---
#' #' title: mkdoc - Markdown extractor and formatter
#' #' author: Dr. Detlef Groth, Schwielowsee, Germany
#' #' ---
#' ```
#' 
#' Those four lines produce the two lines on top of this document. You can extend the header if you would like to process your document after extracting the Markdown with other tools, for instance with Pandoc.
#' 
#' You can also specify a style sheet other than the default by adding
#' the following style information:
#'
#' ```
#' #' ---
#' #' title: mkdoc - Markdown extractor and formatter
#' #' author: Dr. Detlef Groth, Schwielowsee, Germany
#' #' output:
#' #'   html_document:
#' #'     css: tufte.css
#' #' ---
#' ```
#' 
#' Please note, that the indentation is required and it is two spaces.
#'
#' **Headers**
#'
#' Headers are prefixed with the hash symbol, single hash stands for level 1 heading, double hashes for level 2 heading, etc.
#' Please note that the embedded style sheet centers level 1 and level 3 headers; these are intended to be used
#' for the page title (h1), author (h3) and date information (h3) on top of the page.
#' ```
#' #' ## Section title
#' #'
#' #' Some free text that follows after the required empty 
#' #' line above ...
#' ```
#'
#' This produces a level 2 header. Please note, if you have a section named `synopsis`, the code fragments thereafter will be highlighted differently from the other code fragments. You should only use level 2 and 3 headers for the documentation. Level 1 headers are reserved for the title.
#' 
#' **Lists**
#'
#' Lists can be given either using hyphens or stars at the beginning of a line.
#'
#' ```
#' #' - item 1
#' #' - item 2
#' #' - item 3
#' ```
#' 
#' Here the output:
#'
#' - item 1
#' - item 2
#' - item 3
#' 
#' A special list on top of the help page could be the table of contents list. Here is an example:
#'
#' ```
#' #' ## Table of Contents
#' #'
#' #' - [Synopsis](#synopsis)
#' #' - [Description](#description)
#' #' - [Command](#command)
#' #' - [Example](#example)
#' #' - [Authors](#author)
#' ```
#'
#' This will produce in HTML mode a clickable hyperlink list. You should however create
#' the name targets using html code like so:
#'
#' ```
#' ## <a name='synopsis'>Synopsis</a>
#' ```
#' 
#' **Hyperlinks**
#'
#' Hyperlinks are written with the following markup code:
#'
#' ```
#' [Link text](URL)
#' ```
#' 
#' Let's link to the Tcler's Wiki:
#' ```
#' [Tcler's Wiki](https://wiki.tcl-lang.org/)
#' ```
#' 
#' produces: [Tcler's Wiki](https://wiki.tcl-lang.org/)
#'
#' **Indentations**
#'
#' Indentations are achieved using the greater sign:
#' 
#' ```
#' #' Some text before
#' #'
#' #' > this will be indented
#' #'
#' #' This will be not indented again
#' ```
#' 
#' Here the output:
#'
#' Some text before
#' 
#' > this will be indented
#' 
#' This will be not indented again
#'
#' Also lists can be indented:
#' 
#' ```
#' > - item 1
#'   - item 2
#'   - item 3
#' ```
#'
#' produces:
#'
#' > - item 1
#'   - item 2
#'   - item 3
#'
#' **Fontfaces**
#' 
#' Italic font face can be requested by using single stars or underlines at the beginning 
#' and at the end of the text. Bold is achieved by duplicating those symbols.
#' Monospace font appears within backticks.
#' Here an example:
#' 
#' ```
#' I am _italic_ and I am __bold__! But I am programming code: `ls -l`
#' ```
#'
#' > I am _italic_ and I am __bold__! But I am programming code: `ls -l`
#' 
#' **Code blocks**
#'
#' Code blocks can be started using either three or more spaces after the #' sequence 
#' or by embracing the code block with triple backticks on top and on bottom. Here an example:
#' 
#' ```
#' #' ```
#' #' puts "Hello World!"
#' #' ```
#' ```
#'
#' Here the output:
#'
#' ```
#' puts "Hello World!"
#' ```
#'
#' **Images**
#'
#' If you insist on images in your documentation, images can be embedded in Markdown with a syntax close to links.
#' The links here however start with an exclamation mark:
#' 
#' ```
#' ![image caption](filename.png)
#' ```
#' 
#' The source code of mkdoc.tcl is a good example for usage of this source code 
#' annotation tool. Don't overuse the possibilities of Markdown, sometimes less is more. 
#' Write clearly and concisely, and don't use fancy visual effects.
#' 
#' **Includes**
#' 
#' In contrast to standard Markdown, mkdoc also supports includes. Using the `#' #include "filename.md"` syntax
#' it is possible to include other Markdown files. This might be useful, for instance, to include the same
#' header or footer in a set of related files.
#'
#' ## INSTALLATION
#' 
#' The mkdoc::mkdoc package can be installed either as command line application or as a Tcl module. It requires the Markdown package from tcllib to be installed.
#' 
#' Installation as command line application can be done by copying the `mkdoc.tcl` as 
#' `mkdoc` to a directory which is in your executable path. You should make this file executable using `chmod`. There is also a standalone script which does not need an already installed tcllib package. You can download this script, named `mkdoc-version.app`, from the [chiselapp release page](https://chiselapp.com/user/dgroth/repository/tclcode/wiki?name=releases).
#' 
#' Installation as Tcl module is achieved by copying the file `mkdoc.tcl` to a place 
#' which is in your Tcl module path, for instance as `mkdoc/mkdoc-0.1.tm`. See the [tm manual page](https://www.tcl.tk/man/tcl8.6/TclCmd/tm.htm).
#'
#' ## SEE ALSO
#' 
#' - [tcllib](https://core.tcl-lang.org/tcllib/doc/trunk/embedded/index.md) for the Markdown and the textutil packages
#' - [dgtools](https://chiselapp.com/user/dgroth/repository/tclcode) project for example help page
#' - [pandoc](https://pandoc.org) - a universal document converter
#' - [Ruff!](https://github.com/apnadkarni/ruff) Ruff! documentation generator for Tcl using Markdown syntax as well

#' 
#' ## CHANGES
#'
#' - 2019-11-19 Release 0.1
#' - 2019-11-22 Adding direct conversion from Markdown files to HTML files.
#' - 2019-11-27 Documentation fixes
#' - 2019-11-28 Kit version
#' - 2019-11-28 Release 0.2 to fossil
#' - 2019-12-06 Partial R-Roxygen/Markdown support
#' - 2020-01-05 Documentation fixes and version information
#' - 2020-02-02 Adding include syntax
#' - 2020-02-26 Adding stylesheet option --css 
#' - 2020-02-26 Adding files pandoc.css and dgw.css
#' - 2020-02-26 Making standalone file using pkgDeps and mk_tm
#' - 2020-02-26 Release 0.3 to fossil
#' - 2020-02-27 support for \_\_DATE\_\_, \_\_PKGNAME\_\_, \_\_PKGVERSION\_\_ macros  in Tcl code based on package provide line
#' - 2020-09-01 Roxygen2 plugin
#' - 2020-11-09 argument --run support
#' - 2020-11-10 Release 0.4
#' 
#'
#' ## TODO
#'
#' - extract Roxygen2 documentation codes from R files (done)
#' - standalone files using mk_tm module maker (done, just using cat ;)
#' - support for \_\_PKGVERSION\_\_ and \_\_PKGNAME\_\_ replacements at least in Tcl files and via command line for other file types (done)
#'
#' ## AUTHOR(s)
#'
#' The **mkdoc::mkdoc** package was written by Dr. Detlef Groth, Schwielowsee, Germany.
#'
#' ## LICENSE AND COPYRIGHT
#'
#' Markdown extractor and converter mkdoc::mkdoc, version __PKGVERSION__
#'
#' Copyright (c) 2019-20  Dr. Detlef Groth, E-mail: 
#' 
#' This library is free software; you can use, modify, and redistribute it
#' for any purpose, provided that existing copyright notices are retained
#' in all copies and that this notice is included verbatim in any
#' distributions.
#' 
#' This software is distributed WITHOUT ANY WARRANTY; without even the
#' implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#'