#+TITLE: sdp defaults #+AUTHOR: Ralph Amissah #+EMAIL: ralph.amissah@gmail.com #+STARTUP: indent #+LANGUAGE: en #+OPTIONS: H:3 num:nil toc:t \n:nil @:t ::t |:t ^:nil _:nil -:t f:t *:t <:t #+OPTIONS: TeX:t LaTeX:t skip:nil d:nil todo:t pri:nil tags:not-in-toc #+OPTIONS: author:nil email:nil creator:nil timestamp:nil #+PROPERTY: header-args :padline no :exports code :noweb yes #+EXPORT_SELECT_TAGS: export #+EXPORT_EXCLUDE_TAGS: noexport #+FILETAGS: :sdp:rel:ao: #+TAGS: assert(a) class(c) debug(d) mixin(m) sdp(s) tangle(T) template(t) WEB(W) noexport(n) [[./sdp.org][sdp]] [[./][org/]] * 0. ao regex & defaults ** 0. defaults :defaults: [[./sdp.org][sdp]] [[./][org/]] *** 0. defaults: :defaults: #+name: tangle_defaults #+BEGIN_SRC d :tangle ../src/sdp/ao_defaults.d /++ default settings +/ template SiSUregisters() { <> <> } <> <> <> <> <> #+END_SRC *** imports #+name: ao_defaults_imports #+BEGIN_SRC d private import std.algorithm, std.array, std.container, std.exception, std.file, std.getopt, std.json, std.path, std.process, std.range, std.regex, std.stdio, std.string, std.traits, std.typecons, std.uni, std.utf, std.conv : to; #+END_SRC *** settings metadata associative array indexes :settings: ***** conf associative array #+name: ao_defaults_template_registers #+BEGIN_SRC d string[string][string] conf_aa() { auto conf_ = [ "webserv": [ "url_root" : "", "path" : "~/sdp_www" , "images" : "" , "cgi" : "/usr/local/lib/sdp-cgi" ], "webserv_cgi": [ "host" : "localhost", "base_path" : "", "port" : "8081", "user" : "", "file_links" : "www.sisudoc.org" ], "processing": [ "path" : "~", "dir" : "_sisu_processing", "concord_max" : "400000" ], "flag": [ "act0" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --xhtml --xml-sax --xml-dom --sqlite --manifest --verbose", "act1" : "--digest --text --html --manifest", "act2" : "--digest --text --html --epub --pdf --manifest", "act3" : "--digest --qrcode --text --html --epub --concordance --pdf --manifest", 
"act4" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --manifest", "act5" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --sqlite --manifest", "act6" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --xhtml --xml-sax --xml-dom --sqlite --manifest", "act7" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --xhtml --xml-sax --xml-dom --sqlite --source --sisupod --manifest", "act8" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --xhtml --xml-sax --xml-dom --pg --update --manifest", "act9" : "--digest --qrcode --text --html --epub --concordance --pdf --odf --docbook --xhtml --xml-sax --xml-dom --pg --update --source --sisupod --manifest" ], "default": [ "papersize" : "a4,letter", "text_wrap" : "78", "emphasis" : "bold", "language" : "en", "digest" : "sha256" ], "permission": [ "share_source" : "" ], "program_select": [ "editor" : "vim", "epub_viewer" : "ebook-viewer", "html_viewer" : "xombrero", "odf_viewer" : "lowriter", "pdf_viewer" : "evince", "xml_viewer" : "xml-viewer" ], "search": [ "flag" : "", "action" : "", "db" : "", "title" : "" ] ]; return conf_; } #+END_SRC ***** make associative array #+name: ao_defaults_template_registers #+BEGIN_SRC d string[string][string] make_aa() { auto make_ = [ "make": [ "bold" : "", "breaks" : "", "cover_image" : "", "css" : "", "emphasis" : "", "footer" : "", "headings" : "", "home_button_image" : "", "home_button_text" : "", "italics" : "", "num_top" : "", "num_depth" : "", "substitute" : "", "texpdf_font" : "" ] ]; return make_; } #+END_SRC ***** meta (metadata) associative array #+name: ao_defaults_template_registers #+BEGIN_SRC d string[string][string] meta_aa() { auto meta_ = [ "classify": [ "dewey" : "", "keywords" : "", "loc" : "", "subject" : "", "topic_register" : "" ], "creator": [ "author" : "", "author_email" : "", "illustrator" : "", "translator" : "" ], "date": [ 
"added_to_site" : "", "available" : "", "created" : "", "issued" : "", "modified" : "", "published" : "", "valid" : "" ], "identifier": [ "isbn" : "", "oclc" : "", "pg" : "" ], "links": [ "link" : "" ], "notes": [ "abstract" : "", "description" : "" ], "original": [ "language" : "", "source" : "", "title" : "" ], "publisher": [ "name" : "" ], "rights": [ "copyright" : "", "cover" : "", "illustrations" : "", "license" : "" ], "title": [ "edition" : "", "full" : "", "language" : "", "main" : "", "note" : "", "sub" : "", "subtitle" : "" ] ]; return meta_; } #+END_SRC *** metadata associative array indexes :header: #+name: ao_defaults_template_registers #+BEGIN_SRC d auto ptr_head_main = [ "classify", "creator", "date", "identifier", "links", "make", /+ make +/ "original", "notes", "rights", "title" ]; auto ptr_head_sub_classify = [ "dewey", "keywords", "loc", "subject", "topic_register" ]; auto ptr_head_sub_creator = [ "author", "author_email", "cover", "illustrator", "translator" ]; auto ptr_head_sub_date = [ "added_to_site", "available", "created", "issued", "modified", "published", "valid" ]; auto ptr_head_sub_identifier = [ "isbn", "oclc", "pg" ]; /+ make +/ auto ptr_head_sub_make = [ "cover_image", "home_button_image", "home_button_text", "footer", "headings", "num_top", "num_depth", "breaks", "substitute", "bold", "italics", "emphasis", "texpdf_font", "css" ]; auto ptr_head_sub_notes = [ "abstract", "description" ]; auto ptr_head_sub_original = [ "language", "source", "title" ]; auto ptr_head_sub_publisher = [ "name" ]; auto ptr_head_sub_rights = [ "copyright", "cover", "illustrations", "license" ]; auto ptr_head_sub_title = [ "edition", "full", "language", "main", "note", "sub" ]; auto config_jsonstr = `{ }`; #+END_SRC **** notes headers #+name: ao_defaults_template #+BEGIN_SRC d /+ /+ unify internal representation of header info for native & sdlang document headers represent either using struct, hashes or possibly json sdp internal representation should be 
identical for native & sdlang variants +/ header. ├── make // make instructions │   ├── bold │   ├── breaks │   ├── cover_image │   ├── css │   ├── emphasis │   ├── footer │   ├── headings │   ├── home_button_image │   ├── home_button_text │   ├── italics │   ├── num_top │   ├── substitute │   └── texpdf_font └── meta // metadata    ├── author // move author to creator:author    ├── classify    │   ├── dewey    │   ├── keyword    │   ├── loc    │   ├── subject    │   └── topic_register    ├── creator    │   ├── author │ │ ├── [ [first_name: x0, last_name: y0], [first_name: x1, last_name: y1] ] │ │ └── [ full_name0, full_name1 ]    │   ├── author_email    │   ├── illustrator    │   └── translator    ├── date    │   ├── added_to_site    │   ├── available    │   ├── created    │   ├── issued    │   ├── modified    │   ├── published    │   └── valid    ├── identifier    │   ├── isbn    │   ├── oclc    │   └── pg    ├── links    ├── notes    │   ├── abstract    │   └── description    ├── original    │   ├── language    │   ├── source    │   └── title    ├── publisher    │   └── name    ├── rights    │   ├── copyright    │   ├── cover    │   ├── illustrations    │   └── license    └── title // move title: to title:main    ├── edition    ├── [ full (main + sub) ]    ├── language    ├── main    ├── note    ├── sub    └── subtitle // move title:subtitle to title:sub 61 leaves +/ #+END_SRC *** template: flags regex initialize :regex_flags: #+name: ao_defaults_template_init_flags #+BEGIN_SRC d template SiSUrgxInitFlags() { /+ regex flags +/ int[string] flags_type_init() { int[string] flags_type_init = [ "make_headings" : 0, "header_make" : 0, "header_meta" : 0, "heading" : 0, "biblio_section" : 0, "glossary_section" : 0, "blurb_section" : 0, "para" : 0, "blocks" : 0, // 0..2 generic "code" : 0, // 0..2 "poem" : 0, // 0..2 "table" : 0, // 0..2 "group" : 0, // 0..2 "block" : 0, // 0..2 "quote" : 0, // 0..2 "verse_new" : 0, "curly_code" : 0, "curly_poem" : 0, "curly_group" : 0, 
"curly_block" : 0, "curly_quote" : 0, "curly_table" : 0, "curly_table_special_markup" : 0, "tic_code" : 0, "tic_poem" : 0, "tic_group" : 0, "tic_block" : 0, "tic_quote" : 0, "tic_table" : 0, "ocn_status" : 0, // 0 obj_cite_number; 1 no obj_cite_number; 2 no obj_cite_number & dummy headings "ocn_status_multi_obj" : 0, // 0 obj_cite_number; 1 no obj_cite_number; 2 no obj_cite_number & dummy headings "book_index" : 0, ]; return flags_type_init; } } #+END_SRC #+name: ao_defaults_template_node #+BEGIN_SRC d template SiSUnode() { string[string] node_metadata_heading_str() { auto _node = [ "is" : "", "ocn" : "", "marked_up_lev" : "", "segment_anchor_tag" : "", "attrib" : "", ]; return _node; } int[string] node_metadata_heading_int() { auto _node = [ "ocn" : 0, "ptr_doc_object" : 0, "ptr_html_segnames" : 0, "ptr_heading" : 0, "heading_lev_markup" : 9, "heading_lev_collapsed" : 9, "parent_ocn" : 0, "parent_lev_markup" : 9, ]; return _node; } string[string] node_metadata_para_str() { auto _node = [ "is" : "", "ocn" : "", "attrib" : "", ]; return _node; } int[string] node_metadata_para_int() { auto _node = [ "ocn" : 0, "indent_base" : 0, "indent_hang" : 0, "bullet" : 0, // bool (0|1) ]; return _node; } } #+END_SRC *** template: bibliography :biblio: #+name: ao_defaults_template_biblio #+BEGIN_SRC d template SiSUbiblio() { // required: deemed_author (author || editor); year; fulltitle; struct BibJsnStr { auto biblio_entry_tags_jsonstr() { string x = `{ "is" : "", "sortby_deemed_author_year_title" : "", "deemed_author" : "", "author_raw" : "", "author" : "", "author_arr" : [ "" ], "editor_raw" : "", "editor" : "", "editor_arr" : [ "" ], "title" : "", "subtitle" : "", "fulltitle" : "", "language" : "", "trans" : "", "src" : "", "journal" : "", "in" : "", "volume" : "", "edition" : "", "year" : "", "place" : "", "publisher" : "", "url" : "", "pages" : "", "note" : "", "short_name" : "", "id" : "" }`; // is: book, article, magazine, newspaper, blog, other return x; } } } #+END_SRC 
** 1. ctRegex :regex: [[./sdp.org][sdp]] [[./][org/]] http://dlang.org/phobos/std_regex.html - Plain string, in which case it's compiled to bytecode before matching. - Regex!char (wchar/dchar) that contains a pattern in the form of compiled bytecode. - StaticRegex!char (wchar/dchar) that contains a pattern in the form of compiled native machine code. *** 0. rgx code template: :ao_rgx: #+name: tangle_ao_rgx #+BEGIN_SRC d :tangle ../src/sdp/ao_rgx.d /++ regex: regular expressions used in sisu document parser +/ template SiSUrgxInit() { private import ao_defaults; struct Rgx { <> <> } } #+END_SRC *** misc :misc: #+name: ao_rgx #+BEGIN_SRC d /+ misc +/ static true_dollar = ctRegex!(`\$`, "gm"); static flag_action = ctRegex!(`^(--[a-z][a-z0-9-]+)$`); static flag_action_str = ctRegex!(` (--[a-z][a-z0-9-]+)`); static within_quotes = ctRegex!(`"(.+?)"`); static make_heading_delimiter = ctRegex!(`[;][ ]*`); static arr_delimiter = ctRegex!(`[ ]*[;][ ]*`); static name_delimiter = ctRegex!(`^([^,]+)[ ]*,[ ]+(.+?)$`); static book_index_go = ctRegex!("(?P(?P[0-9]+)(?:-[0-9]+)?)"); static book_index_go_scroll = ctRegex!("(?P(?P[0-9]+)(?:-[0-9]+)?)"); static book_index_go_seg = ctRegex!("(?P(?P[0-9]+)(?:-[0-9]+)?):(?P[a-z0-9_-]+)"); static book_index_go_seg_ = ctRegex!("(?P(?P[0-9]+)(?:-[0-9]+)?)(:(?P[a-z0-9_-]+))?"); static book_index_go_seg_anchorless = ctRegex!("(?P(?P[0-9]+)(?:-[0-9]+)?)"); static trailing_comma = ctRegex!(",[ ]*$"); static trailing_linebreak = ctRegex!(",[ ]{1,2}\\\\\\\\\n[ ]{4}$","m"); static newline_eol_delimiter = ctRegex!("\n"); static newline_eol_strip_preceding = ctRegex!("[ ]*\n"); static newline_eol_delimiter_only = ctRegex!("^\n"); static line_delimiter_ws_strip = ctRegex!("[ ]*\n[ ]*"); static para_delimiter = ctRegex!("\n[ ]*\n+"); static table_col_delimiter = ctRegex!("[ ]*\n+", "mg"); static table_row_delimiter = ctRegex!("\n[ ]*\n+", "mg"); static table_row_delimiter_special = ctRegex!("[ ]*\n", "mg"); // static table_col_delimiter_special = 
ctRegex!("[ ]*[|][ ]*", "mg"); // static levels_markup = ctRegex!(`^[A-D1-4]$`); static levels_numbered = ctRegex!(`^[0-9]$`); static levels_numbered_headings = ctRegex!(`^[0-7]$`); static numeric = ctRegex!(`[ 0-9,.-]+`); static numeric_col = ctRegex!(`^[ 0-9,.$£₤Є€€¥-]+$`); #+END_SRC *** comments :comment: #+name: ao_rgx #+BEGIN_SRC d /+ comments +/ static comment = ctRegex!(`^%+ `); static comments = ctRegex!(`^%+ |^%+$`); #+END_SRC *** native headers **** native header :native:header: #+name: ao_rgx #+BEGIN_SRC d /+ header +/ static main_headers = ctRegex!(`^(?:creator|title|rights|date|original|classify|identifier|notes|publisher|make|links)$`, "m"); static native_header = ctRegex!(`^@([a-z_]+):(?:\s|$)`); static native_header_make = ctRegex!(`^@(make):(?:\s|$)`); static native_header_meta = ctRegex!(`^@(?:creator|title|rights|date|original|classify|identifier|notes|publisher|links):(?:\s|$)`); static native_header_main = ctRegex!(`^@(?P
[a-z_]+):\s*(?P.*)`, "m"); static native_header_sub = ctRegex!(`^[ ]*:(?P[a-z_]+):\s+(?P.+)`, "m"); static native_header_meta_title = ctRegex!(`^@title:\s`, "m"); static variable_doc_title = ctRegex!(`@title`); static variable_doc_author = ctRegex!(`@author|@creator`); static raw_author_munge = ctRegex!(`(\S.+?),\s+(.+)`,"i"); #+END_SRC **** subheader :native:subheader: #+name: ao_rgx #+BEGIN_SRC d /+ head +/ static native_subhead_creator = ctRegex!(`^(?:author|translator|illustrator)$`, "m"); static native_subhead_title = ctRegex!(`^(?:main|sub(?:title)?|full|language|edition|note)$`, "m"); static native_subhead_rights = ctRegex!(`^(?:copyright|illustrations|license|cover)$`, "m"); static native_subhead_date = ctRegex!(`^(?:published|created|issued|available|valid|modified|added_to_site)$`, "m"); static native_subhead_original = ctRegex!(`^(?:title|language|source)$`, "m"); static native_subhead_classify = ctRegex!(`^(?:topic_register|subject|keywords|loc|dewey)$`, "m"); static native_subhead_identifier = ctRegex!(`^(?:oclc|pg|isbn)$`, "m"); static native_subhead_notes = ctRegex!(`^(?:abstract|description)$`, "m"); static native_subhead_publisher = ctRegex!(`^(?:name)$`, "m"); static native_subhead_make = ctRegex!(`^(?:cover_image|home_button_image|home_button_text|footer|headings|num_top|num_depth|breaks|substitute|bold|italics|emphasis|texpdf_font|css)$`, "m"); #+END_SRC *** heading & paragraph operators :paragraph:operator: #+name: ao_rgx #+BEGIN_SRC d /+ heading & paragraph operators +/ static heading_a = ctRegex!(`^:?[A][~] `, "m"); static heading = ctRegex!(`^:?([A-D1-4])[~]([a-z0-9_.-]*[?]?)\s+`,"i"); static heading_seg_and_above = ctRegex!(`^:?([A-D1])[~]([a-z0-9_.-]*[?]?)\s+`,"i"); static heading_marker = ctRegex!(`^:?([A-D1-4])[~]`); static heading_anchor_tag = ctRegex!(`^:?[A-D1-4][~]([a-z0-9_.-]+) `,"i"); static heading_identify_anchor_tag = ctRegex!(`^:?[A-D1-4][~]\s+(?:(?:(?:chapter|article|section|clause)\s+[0-9.]+)|(?:[0-9]+))`,"i"); // unless 
dob.obj =~/^:?[A-D1-4]~\s+(?:|(?:chapter|article|section|clause)\s+)([0-9.]+)/i /+ anchor-tag extraction: the captured number is one or more digit groups joined by literal dots (e.g. 1.2.3); the separator is written [.] because an unescaped . accepts any character (so "1914 1918" would be captured as a single number) +/ static heading_extract_named_anchor_tag = ctRegex!(`^:?[A-D1-4][~]\s+(chapter|article|section|clause)\s+((?:[0-9]+[.])*[0-9]+)(?:[.:;, ]|$)`,"i"); static heading_extract_unnamed_anchor_tag = ctRegex!(`^:?[A-D1-4][~]\s+((?:[0-9]+[.])*[0-9]+)(?:[.:;, ]|$)`); static heading_marker_missing_tag = ctRegex!(`^:?([A-D1-4])[~] `); static heading_title = ctRegex!(`^:?[A-D1-4][~][a-z0-9_.-]*[?]?\s+(.+?)$`); static heading_all = ctRegex!(`^:?([A-D1-4])[~]([a-z0-9_.-]*[?]?)\s+(.+?)$`); // test, particularly [2] name/hashtag which may or may not be, does this affect title [3] static heading_backmatter = ctRegex!(`^:?1[~][!](glossary|bibliography|biblio|blurb)\s+`,"i"); static heading_biblio = ctRegex!(`^:?(1)[~][!](biblio(?:graphy)?|references?)`); static heading_glossary = ctRegex!(`^:?(1)[~][!](glossary)`); static heading_blurb = ctRegex!(`^:?(1)[~][!](blurb)`); static heading_biblio_glossary = ctRegex!(`^:?(?:(1)[~][!](?:(?:biblio(?:graphy)?|references?)|glossary)|[A-D1][~])`); static heading_biblio_blurb = ctRegex!(`^:?(?:(1)[~][!](?:(?:biblio(?:graphy)?|references?)|blurb)|[A-D1][~])`); static heading_blurb_glossary = ctRegex!(`^:?(?:(1)[~][!](?:blurb|glossary)|[A-D1][~])`); static para_bullet = ctRegex!(`^_[*] `); static para_bullet_indent = ctRegex!(`^_([1-9])[*] `); static para_indent = ctRegex!(`^_([1-9]) `); static para_indent_hang = ctRegex!(`^_([0-9])_([0-9]) `); static para_attribs = ctRegex!(`^_(?:(?:[0-9])(?:_([0-9]))?|(?:[1-9])?[*]) `); #+END_SRC *** blocked markup **** blocked markup :block:tic: #+name: ao_rgx #+BEGIN_SRC d /+ blocked markup +/ static block_open = ctRegex!("^((code([.][a-z][0-9a-z_]+)?|poem|group|block|quote|table)[{].*?$)|^`{3} (code([.][a-z][0-9a-z_]+)?|poem|group|block|quote|table)|^[{]table(~h)?(?P(?:[ ]+[0-9]+;)+)[}]"); static block_poem_open = ctRegex!("^((poem[{].*?$)|`{3} poem)"); #+END_SRC *** blocked markup tics :block:tic: #+name: ao_rgx #+BEGIN_SRC d /+
blocked markup tics: a block opens with three backticks, a space and the block type; it closes with a line holding only three backticks +/ static block_tic_open = ctRegex!("^`{3} (code([.][a-z][0-9a-z_]+)?|poem|group|block|quote|table)"); static block_tic_code_open = ctRegex!("^`{3} (?:code)(?:[.]([a-z][0-9a-z_]+))?(?:[ ]+([#]))?"); static block_tic_poem_open = ctRegex!("^`{3} (poem)"); static block_tic_group_open = ctRegex!("^`{3} (group)"); static block_tic_block_open = ctRegex!("^`{3} (block)"); static block_tic_quote_open = ctRegex!("^`{3} (quote)"); static block_tic_table_open = ctRegex!("^`{3} table(.*)"); static block_tic_close = ctRegex!("^(`{3})$","m"); #+END_SRC **** blocked markup curly :block:curly: #+name: ao_rgx #+BEGIN_SRC d /+ blocked markup curly: a block opens with the block type followed by "{" and closes with "}" followed by the block type +/ static block_curly_open = ctRegex!(`^((code([.][a-z][0-9a-z_]+)?|poem|group|block|quote|table)[{].*?$)`); static block_curly_code_open = ctRegex!(`^(?:code(?:[.]([a-z][0-9a-z_]+))?[{]([#]?)\s*$)`); static block_curly_code_close = ctRegex!(`^([}]code)`); static block_curly_poem_open = ctRegex!(`^(poem[{].*?$)`); static block_curly_poem_close = ctRegex!(`^([}]poem)`); static block_curly_group_open = ctRegex!(`^(group[{].*?$)`); static block_curly_group_close = ctRegex!(`^([}]group)`); static block_curly_block_open = ctRegex!(`^(block[{].*?$)`); static block_curly_block_close = ctRegex!(`^([}]block)`); static block_curly_quote_open = ctRegex!(`^(quote[{].*?$)`); static block_curly_quote_close = ctRegex!(`^([}]quote)`); static block_curly_table_open = ctRegex!(`^table[{](.*)`); static block_curly_table_close = ctRegex!(`^([}]table)`); static block_curly_table_special_markup = ctRegex!(`^[{]table((~h)?(?P(?:[ ]+[0-9]+;)+))[}]`, "mg"); // special table block markup #+END_SRC **** block sub-matches :block:curly: #+name: ao_rgx #+BEGIN_SRC d static table_head_instructions = ctRegex!(`(?Ph)?(?:[ ]+c(?P[0-9]);)?(?P(?:[ ]+[0-9]+[lr]?;)+)`); static table_col_widths_and_alignment = ctRegex!(`(?P[0-9]+)(?P[lr]?)`); static table_col_widths = ctRegex!(`(?P[0-9]+)`); static table_col_align = ctRegex!(`(?P[lr]?)`); static
table_col_align_match = ctRegex!(`(?P[lr])`); static table_col_separator = ctRegex!(`┊`); static table_col_separator_nl = ctRegex!(`[┊]$`, "mg"); #+END_SRC *** inline markup footnotes endnotes :inline:footnote: #+name: ao_rgx #+BEGIN_SRC d /+ inline markup footnotes endnotes +/ static inline_notes_curly_gen = ctRegex!(`~\{.+?\}~`, "m"); static inline_notes_curly = ctRegex!(`~\{\s*(.+?)\}~`, "mg"); static inline_curly_delimiter_open_and_close_regular = ctRegex!(`~\{\s*|\s*\}~`, "m"); static inline_notes_delimiter_curly_regular = ctRegex!(`~\{[ ]*(.+?)\}~`, "m"); static inline_notes_curly_sp = ctRegex!(`~\{[*+]+\s+(.+?)\}~`, "m"); static inline_notes_curly_sp_asterisk = ctRegex!(`~\{[*]+\s+(.+?)\}~`, "m"); static inline_notes_curly_sp_plus = ctRegex!(`~\{[+]+\s+(.+?)\}~`, "m"); static inline_note_curly_delimiters = ctRegex!(`(~\{[*+]?\s*)(.+?)(\}~)`, "mg"); static inline_notes_square = ctRegex!(`~\[\s*(.+?)\]~`, "mg"); static inline_text_and_note_square_sp = ctRegex!(`(.+?)~\[[*+]+\s+(.+?)\]~`, "mg"); static inline_text_and_note_square = ctRegex!(`(.+?)~\[\s*(.+?)\]~`, "mg"); static inline_note_square_delimiters = ctRegex!(`(~\[\s*)(.+?)(\]~)`, "mg"); static inline_curly_delimiter_open_regular = ctRegex!(`~\{\s*`, "m"); static inline_curly_delimiter_open_symbol_star = ctRegex!(`~\{[*]\s`, "m"); // static inline_curly_delimiter_open_symbol_plus = ctRegex!(`~\{[+]\s`, "m"); // static inline_curly_delimiter_open_star_or_plus = ctRegex!(`~\{[+*]`, "m"); // static inline_curly_delimiter_close_regular = ctRegex!(`\s*\}~`, "m"); static inline_text_and_note_curly = ctRegex!(`(?P.+?)(?:(?:[~])[{][*+ ]*)(?P.+?)(?:[}][~])`, "mg"); static note_ref = ctRegex!(`^\S+?noteref_([0-9]+)`, "mg"); // {^{73.}^}#noteref_73 #+END_SRC **** links/ urls :inline:footnote: #+name: ao_rgx #+BEGIN_SRC d static inline_url_generic = ctRegex!(`(?:^|[}(\[ ])(?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)[a-zA-Z0-9_#]`, "mg"); static inline_url = 
ctRegex!(`((?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)[a-zA-Z0-9_]\S*)`, "mg"); static inline_link_naked_url = ctRegex!(`(?P^|[ ])(?P(?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)\S+?)(?P[.,;:?!'"]?(?:[ ]|$))`, "mg"); static inline_link_markup_regular = ctRegex!(`(?P^|[ ])\{\s*(?P.+?)\s*\}(?P(?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)\S+?)(?P[.,;:?!]?(?:[ ]|$))`, "mg"); static inline_link_endnote_url_helper_punctuated = ctRegex!(`\{~\^\s+(?P.+?)\}(?P(?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)\S+?)(?P[.,;:?!]?(?:[ ]|$))`, "mg"); static inline_link_endnote_url_helper = ctRegex!(`\{~\^\s+(?P.+?)\}(?P(?:(?:https?|git):\/\/|¤?\.\.\/|¤?\.\/|¤|#)\S+)`, "mg"); #+END_SRC **** images :images: #+name: ao_rgx #+BEGIN_SRC d static image = ctRegex!(`([a-zA-Z0-9._-]+?\.(?:png|gif|jpg))`, "mg"); #+END_SRC **** inline markup book index :inline:bookindex: #+name: ao_rgx #+BEGIN_SRC d /+ inline markup book index +/ static book_index = ctRegex!(`^=\{\s*(.+?)\}$`, "m"); static book_index_open = ctRegex!(`^=\{\s*([^}]+?)$`); static book_index_close = ctRegex!(`^(.*?)\}$`, "m"); // strip #+END_SRC *** no obj_cite_number object :ocn:off:object: #+name: ao_rgx #+BEGIN_SRC d /+ no obj_cite_number object +/ static obj_cite_number_off = ctRegex!(`~#$`, "m"); static obj_cite_number_off_dh = ctRegex!(`-#$`, "m"); static obj_cite_number_off_all = ctRegex!(`[~-]#$`, "m"); #+END_SRC *** no obj_cite_number block :ocn:off:block: #+name: ao_rgx #+BEGIN_SRC d /+ no obj_cite_number block +/ static obj_cite_number_off_block = ctRegex!(`^--~#$`); static obj_cite_number_off_block_dh = ctRegex!(`^---#$`); static obj_cite_number_off_block_close = ctRegex!(`^--\+#$`); static obj_cite_number_block_marks = ctRegex!(`^--[+~-]#$`); #+END_SRC *** ignore outside code blocks :block:code: #+name: ao_rgx #+BEGIN_SRC d /+ ignore outside code blocks +/ static skip_from_regular_parse = ctRegex!(`^(--[+~-]#|-[\\]{2}-|=[.\\]{2}=)$`); // not structural info #+END_SRC *** line & page breaks :break: #+name: ao_rgx #+BEGIN_SRC d 
/+ line & page breaks +/ static break_line_within_object = ctRegex!(`[\\]{2}( |$)`); static break_page = ctRegex!(`^-[\\]{2}-$`); static break_page_new = ctRegex!(`^=[\\]{2}=$`); static break_page_line_across = ctRegex!(`^=[.]{2}=$`); static break_string = ctRegex!(`』`); static parent = ctRegex!(`([0-7]):([0-9]+)`); #+END_SRC *** json :json: #+name: ao_rgx #+BEGIN_SRC d /+ json +/ static tailing_comma = ctRegex!(`,$`, "m"); #+END_SRC *** biblio tags :biblio:tags: #+name: ao_rgx #+BEGIN_SRC d /+ biblio tags: capture 1 is the tag (full name or abbreviation), capture 2 the entry text after the colon; "editor" is accepted alongside editor_raw/editor_arr, mirroring author_raw/author/author_arr, so that an "editor: ..." line is not silently skipped +/ static biblio_tags = ctRegex!(`^(is|au|author_raw|author|author_arr|editor_raw|editor|ed|editor_arr|ti|title|subtitle|fulltitle|lng|language|trans|src|jo|journal|in|vol|volume|edn|edition|yr|year|pl|place|pb|pub|publisher|url|pg|pages|note|short_name|id):\s+(.+)`); static biblio_abbreviations = ctRegex!(`^(au|ed|ti|lng|jo|vol|edn|yr|pl|pb|pub|pg|pgs|sn)$`); #+END_SRC *** bookindex split :bookindex:split: #+name: ao_rgx #+BEGIN_SRC d /+ bookindex split +/ static bi_main_terms_split = ctRegex!(`\s*;\s*`); static bi_main_term_plus_rest_split = ctRegex!(`\s*:\s*`); static bi_sub_terms_plus_obj_cite_number_offset_split = ctRegex!(`\s*\|\s*`); static bi_term_and_obj_cite_numbers_match = ctRegex!(`^(.+?)\+(\d+)`); #+END_SRC *** language codes :language:codes: #+name: ao_rgx #+BEGIN_SRC d /+ language codes +/ auto language_codes = ctRegex!("(am|bg|bn|br|ca|cs|cy|da|de|el|en|eo|es|et|eu|fi|fr|ga|gl|he|hi|hr|hy|ia|is|it|ja|ko|la|lo|lt|lv|ml|mr|nl|no|nn|oc|pl|pt|pt_BR|ro|ru|sa|se|sk|sl|sq|sr|sv|ta|te|th|tk|tr|uk|ur|vi|zh)"); auto language_code_and_filename = ctRegex!("(am|bg|bn|br|ca|cs|cy|da|de|el|en|eo|es|et|eu|fi|fr|ga|gl|he|hi|hr|hy|ia|is|it|ja|ko|la|lo|lt|lv|ml|mr|nl|no|nn|oc|pl|pt|pt_BR|ro|ru|sa|se|sk|sl|sq|sr|sv|ta|te|th|tk|tr|uk|ur|vi|zh)/[A-Za-z0-9._-].+?[.](?:sst|ssm)$"); #+END_SRC * 1. output regex & defaults ** 0. defaults :defaults: *** 0.
defaults: :defaults: #+name: tangle_defaults #+BEGIN_SRC d :tangle ../src/sdp/defaults.d /++ default settings +/ <> <> <> <> #+END_SRC *** imports #+name: defaults_imports #+BEGIN_SRC d private import std.algorithm, std.array, std.container, std.exception, std.file, std.getopt, std.json, std.path, std.process, std.range, std.regex, std.stdio, std.string, std.traits, std.typecons, std.uni, std.utf, std.conv : to; #+END_SRC *** TODO template: dir paths :dir:path: #+name: defaults_template_paths #+BEGIN_SRC d template SiSUpaths() { #+END_SRC **** base #+name: defaults_template_paths #+BEGIN_SRC d struct DirPaths { string base_filename(string fn_src) { return baseName(stripExtension(fn_src)); } } #+END_SRC **** sisupod ***** pod #+name: defaults_template_paths #+BEGIN_SRC d struct SiSUpodPaths { string base_filename(string fn_src) { return baseName(stripExtension(fn_src)); } string sisupod_filename(string fn_src) { return "sisupod".chainPath(base_filename(fn_src) ~ ".zip").array; } string base(string fn_src) { return "sisupod".chainPath(base_filename(fn_src)).array; } } #+END_SRC ***** pod zipped #+name: defaults_template_paths #+BEGIN_SRC d struct SiSUpodPathsZipped { auto spod_pths = SiSUpodPaths(); string base_filename(string fn_src) { return spod_pths.base_filename(fn_src); } string sisupod_filename(string fn_src) { return spod_pths.sisupod_filename(fn_src); } string base(string fn_src) { return spod_pths.base(fn_src); } auto doc_root(string fn_src) { return "doc"; } auto doc(string fn_src) { return doc_root(fn_src); } auto doc_lng(string fn_src, string lng) { return doc_root(fn_src).chainPath(lng).array; } auto conf(string fn_src) { return doc_root(fn_src).chainPath("_sisu").array; } auto image(string fn_src) { return conf(fn_src).chainPath("image").array; } auto css(string fn_src) { return conf(fn_src).chainPath("css").array; } auto fn_doc(string fn_src, string lng) { return (doc_lng(fn_src, lng)).chainPath(baseName(fn_src)).array; } auto fn_doc_insert(string 
fn_src, string fn_insert, string lng) { return (doc_lng(fn_src, lng)).chainPath(baseName(fn_insert)).array; } } #+END_SRC ***** pod unzipped archive #+name: defaults_template_paths #+BEGIN_SRC d struct SiSUpodPathsFilesystemArchive { auto spod_pths = SiSUpodPaths(); string base_filename(string fn_src) { return spod_pths.base_filename(fn_src); } string sisupod_filename(string fn_src) { return spod_pths.sisupod_filename(fn_src); } string base(string fn_src) { return spod_pths.base(fn_src); } auto doc_root(string fn_src) { return base(fn_src).chainPath("doc").array; } auto doc(string fn_src) { return doc_root(fn_src); } auto doc_lng(string fn_src, string lng) { return doc_root(fn_src).chainPath(lng).array; } auto conf(string fn_src) { return doc_root(fn_src).chainPath("_sisu").array; } auto image(string fn_src) { return conf(fn_src).chainPath("image").array; } auto css(string fn_src) { return conf(fn_src).chainPath("css").array; } auto fn_doc(string fn_src, string lng) { return (doc_lng(fn_src, lng)).chainPath(baseName(fn_src)).array; } auto fn_doc_insert(string fn_src, string fn_insert, string lng) { return (doc_lng(fn_src, lng)).chainPath(baseName(fn_insert)).array; } } #+END_SRC **** html5 #+name: defaults_template_paths #+BEGIN_SRC d struct HtmlPaths { string base_filename(string fn_src) { return baseName(stripExtension(fn_src)); } string base() { return "en".chainPath("html").array; } string seg(string fn_src) { return base.chainPath(base_filename(fn_src)).array; } string fn_scroll(string fn_src) { return base.chainPath(base_filename(fn_src) ~ ".html").array; } string fn_seg(string fn_src, string seg_filename) { return seg(fn_src).chainPath(seg_filename ~ ".html").array; } } #+END_SRC **** epub3 #+name: defaults_template_paths #+BEGIN_SRC d struct Epub3paths { string dirtop() { return "".chainPath("").array; } string base_filename(string fn_src) { return baseName(stripExtension(fn_src)); } string base() { return "en".chainPath("epub3").array; } string 
epub_file(string fn_src) { return base.chainPath(base_filename(fn_src) ~ ".epub").array; } string docdir(string fn_src) { return base.chainPath(base_filename(fn_src)).array; } string doc_meta_inf(string fn_src) { return dirtop.chainPath("META-INF").array; } string doc_oebps(string fn_src) { return dirtop.chainPath("OEBPS").array; } string doc_oebps_css(string fn_src) { return doc_oebps(fn_src).chainPath("css").array; } string doc_oebps_image(string fn_src) { return doc_oebps(fn_src).chainPath("image").array; } /+ NOTE(review): the EPUB OCF container expects its media-type file to be named "mimetype" (singular); confirm how the caller uses this "mimetypes" path +/ string fn_mimetypes(string fn_src) { return dirtop.chainPath("mimetypes").array; } string fn_dmi_container_xml(string fn_src) { return doc_meta_inf(fn_src).chainPath("container.xml").array; } string fn_oebps_toc_nav_xhtml(string fn_src) { return doc_oebps(fn_src).chainPath("toc_nav.xhtml").array; } string fn_oebps_toc_ncx(string fn_src) { return doc_oebps(fn_src).chainPath("toc.ncx").array; } string fn_oebps_content_opf(string fn_src) { return doc_oebps(fn_src).chainPath("content.opf").array; } string fn_oebps_content_xhtml(string fn_src, string seg_filename) { return doc_oebps(fn_src).chainPath(seg_filename ~ ".xhtml").array; } debug(epub_output) { /+ debug-only layout: every dbg_* path is rooted at docdir(fn_src), whereas the paths above are rooted at dirtop; nested dbg_* helpers therefore chain from dbg_doc_meta_inf / dbg_doc_oebps, not from their dirtop-rooted counterparts +/ string dbg_doc_meta_inf(string fn_src) { return docdir(fn_src).chainPath("META-INF").array; } string dbg_doc_oebps(string fn_src) { return docdir(fn_src).chainPath("OEBPS").array; } string dbg_doc_oebps_css(string fn_src) { return dbg_doc_oebps(fn_src).chainPath("css").array; } string dbg_doc_oebps_image(string fn_src) { return dbg_doc_oebps(fn_src).chainPath("image").array; } string dbg_fn_mimetypes(string fn_src) { return docdir(fn_src).chainPath("mimetypes").array; } string dbg_fn_dmi_container_xml(string fn_src) { return dbg_doc_meta_inf(fn_src).chainPath("container.xml").array; } string dbg_fn_oebps_toc_nav_xhtml(string fn_src) { return dbg_doc_oebps(fn_src).chainPath("toc_nav.xhtml").array; } string dbg_fn_oebps_toc_ncx(string fn_src) { return dbg_doc_oebps(fn_src).chainPath("toc.ncx").array; } string 
dbg_fn_oebps_content_opf(string fn_src) { return dbg_doc_oebps(fn_src).chainPath("content.opf").array; } string dbg_fn_oebps_content_xhtml(string fn_src, string seg_filename) { return dbg_doc_oebps(fn_src).chainPath(seg_filename ~ ".xhtml").array; } } } } #+END_SRC ** 1. ctRegex :regex: [[./sdp.org][sdp]] [[./][org/]] http://dlang.org/phobos/std_regex.html - Plain string, in which case it's compiled to bytecode before matching. - Regex!char (wchar/dchar) that contains a pattern in the form of compiled bytecode. - StaticRegex!char (wchar/dchar) that contains a pattern in the form of compiled native machine code. *** 0. code template: :rgx: #+name: tangle_ao_rgx #+BEGIN_SRC d :tangle ../src/sdp/output_rgx.d /++ regex: regular expressions used in sisu document parser +/ template SiSUoutputRgxInit() { private import defaults; struct Rgx { <> <> } } #+END_SRC *** special characters **** xhtml special characters #+name: sp_ch_xhtml_rgx #+BEGIN_SRC d static xhtml_ampersand = ctRegex!(`[&]`); // & static xhtml_less_than = ctRegex!(`[<]`); // < static xhtml_greater_than = ctRegex!(`[>]`); // > static xhtml_line_break = ctRegex!(` [\\]{2}`); //
#+END_SRC

* 2. defaults shared by ao & output (generic)
** 0. defaults :defaults:
*** template: internal markup :markup:

#+name: defaults_template_markup
#+BEGIN_SRC d
/++
  Marker characters and small helpers used for internal (program) markup.
+/
template InternalMarkup() {
  struct InlineMarkup {
    /+ endnote delimiters; source markup en_a: '~{' '}~', en_b: '~[' ']~' +/
    auto en_a_o = "【"; auto en_a_c = "】";
    auto en_b_o = "〖"; auto en_b_c = "〗";
    /+ link text delimiters +/
    auto lnk_o = "┥"; auto lnk_c = "┝";
    // auto lnk_o = "⌠"; auto lnk_c = "⌡"; // '⌈' '⌋' '⌠' '⌡' #Mx[:lnk_o= '◁'; Mx[:lnk_c= '▷' #‹ ›
    /+ url delimiters +/
    auto url_o = "┤"; auto url_c = "├";
    auto mark_internal_site_lnk = "¤";
    auto nbsp = "░";
    /+ breaks +/
    auto br_line = "┘"; // "╱"; // lB ▌ 9612 ┘ ¶
    auto br_nl = "┙"; // "╲"; // lB ▌ 』 ┘
    auto br_paragraph = "┚"; // "█"; // FB █ 9608 # PP ∥ 8741 #▐ #'┘' #'¶' #FB █ 9608 lB ▌ 9612 RB ▐ 9616
    auto br_obj = "break_obj";
    auto br_page_line = "┼"; // "▭";
    auto br_page = "┿"; // "┼";
    auto br_page_new = "╂"; // "╋";
    /+ table marks +/
    auto tc_s = "┊"; // "┴"; //"『"; // "┏" ┓
    auto tc_o = "┏"; //"『"; // "┏" ┓
    // NOTE(review): tc_c uses the same glyph as br_paragraph ("┚"); confirm this is intended
    auto tc_c = "┚"; // "』"; // "┚" table row mark #Mx[:tc_c]="』\n"
    auto tc_p = "┆"; // table col/misc mark
    /++
      Returns `_indent_spaces` repeated `indent` times
      (by default two nbsp marker characters per indent level).
    +/
    string indent_by_spaces_provided(int indent, string _indent_spaces ="░░") {
      return replicate(_indent_spaces, indent);
    }
    /++
      Returns `_character` repeated `number` times.
    +/
    string repeat_character_by_number_provided(C,N)(C _character ="-", N number=10) {
      return replicate(_character, number);
    }
  }
}
#+END_SRC

*** template language codes

#+name: defaults_template_language_codes
#+BEGIN_SRC d
template SiSUlanguageCodes() {
  /+ language codes +/
  struct Lang {
    /++
      Language table keyed by language code. Each entry holds:
      "c" code, "n" name (English), "t" name as given for the language
      itself, "xlp" a further per-language identifier.
      NOTE(review): "xlp" looks like the XeLaTeX/polyglossia language
      name - confirm.
    +/
    string[string][string] codes() {
      auto _lang_codes = [
        "am":    [ "c": "am",    "n": "Amharic",            "t": "Amharic",                      "xlp": "amharic"     ],
        "bg":    [ "c": "bg",    "n": "Bulgarian",          "t": "Български (Bəlgarski)",        "xlp": "bulgarian"   ],
        "bn":    [ "c": "bn",    "n": "Bengali",            "t": "Bengali",                      "xlp": "bengali"     ],
        "br":    [ "c": "br",    "n": "Breton",             "t": "Breton",                       "xlp": "breton"      ],
        "ca":    [ "c": "ca",    "n": "Catalan",            "t": "catalan",                      "xlp": "catalan"     ],
        "cs":    [ "c": "cs",    "n": "Czech",              "t": "česky",                        "xlp": "czech"       ],
        "cy":    [ "c": "cy",    "n": "Welsh",              "t": "Welsh",                        "xlp": "welsh"       ],
        "da":    [ "c": "da",    "n": "Danish",             "t": "dansk",                        "xlp": "danish"      ],
        "de":    [ "c": "de",    "n": "German",             "t": "Deutsch",                      "xlp": "german"      ],
        "el":    [ "c": "el",    "n": "Greek",              "t": "Ελληνικά (Ellinika)",          "xlp": "greek"       ],
        "en":    [ "c": "en",    "n": "English",            "t": "English",                      "xlp": "english"     ],
        "eo":    [ "c": "eo",    "n": "Esperanto",          "t": "Esperanto",                    "xlp": "esperanto"   ],
        "es":    [ "c": "es",    "n": "Spanish",            "t": "español",                      "xlp": "spanish"     ],
        "et":    [ "c": "et",    "n": "Estonian",           "t": "Estonian",                     "xlp": "estonian"    ],
        "eu":    [ "c": "eu",    "n": "Basque",             "t": "basque",                       "xlp": "basque"      ],
        "fi":    [ "c": "fi",    "n": "Finnish",            "t": "suomi",                        "xlp": "finnish"     ],
        "fr":    [ "c": "fr",    "n": "French",             "t": "français",                     "xlp": "french"      ],
        "ga":    [ "c": "ga",    "n": "Irish",              "t": "Irish",                        "xlp": "irish"       ],
        "gl":    [ "c": "gl",    "n": "Galician",           "t": "Galician",                     "xlp": "galician"    ],
        "he":    [ "c": "he",    "n": "Hebrew",             "t": "Hebrew",                       "xlp": "hebrew"      ],
        "hi":    [ "c": "hi",    "n": "Hindi",              "t": "Hindi",                        "xlp": "hindi"       ],
        "hr":    [ "c": "hr",    "n": "Croatian",           "t": "Croatian",                     "xlp": "croatian"    ],
        "hy":    [ "c": "hy",    "n": "Armenian",           "t": "Armenian",                     "xlp": "armenian"    ],
        "ia":    [ "c": "ia",    "n": "Interlingua",        "t": "Interlingua",                  "xlp": "interlingua" ],
        "is":    [ "c": "is",    "n": "Icelandic",          "t": "Icelandic",                    "xlp": "icelandic"   ],
        "it":    [ "c": "it",    "n": "Italian",            "t": "Italiano",                     "xlp": "italian"     ],
        "ja":    [ "c": "ja",    "n": "Japanese",           "t": "日本語 (Nihongo)",             "xlp": "japanese"    ],
        "ko":    [ "c": "ko",    "n": "Korean",             "t": "Korean",                       "xlp": "korean"      ],
        "la":    [ "c": "la",    "n": "Latin",              "t": "Latin",                        "xlp": "latin"       ],
        "lo":    [ "c": "lo",    "n": "Lao",                "t": "Lao",                          "xlp": "lao"         ],
        "lt":    [ "c": "lt",    "n": "Lithuanian",         "t": "Lithuanian",                   "xlp": "lithuanian"  ],
        "lv":    [ "c": "lv",    "n": "Latvian",            "t": "Latvian",                      "xlp": "latvian"     ],
        "ml":    [ "c": "ml",    "n": "Malayalam",          "t": "Malayalam",                    "xlp": "malayalam"   ],
        "mr":    [ "c": "mr",    "n": "Marathi",            "t": "Marathi",                      "xlp": "marathi"     ],
        "nl":    [ "c": "nl",    "n": "Dutch",              "t": "Nederlands",                   "xlp": "dutch"       ],
        "no":    [ "c": "no",    "n": "Norwegian",          "t": "norsk",                        "xlp": "norsk"       ],
        "nn":    [ "c": "nn",    "n": "Norwegian Nynorsk",  "t": "nynorsk",                      "xlp": "nynorsk"     ],
        "oc":    [ "c": "oc",    "n": "Occitan",            "t": "Occitan",                      "xlp": "occitan"     ],
        "pl":    [ "c": "pl",    "n": "Polish",             "t": "polski",                       "xlp": "polish"      ],
        "pt":    [ "c": "pt",    "n": "Portuguese",         "t": "Português",                    "xlp": "portuges"    ],
        "pt_BR": [ "c": "pt_BR", "n": "Portuguese Brazil",  "t": "Brazilian Português",          "xlp": "brazilian"   ],
        "ro":    [ "c": "ro",    "n": "Romanian",           "t": "română",                       "xlp": "romanian"    ],
        "ru":    [ "c": "ru",    "n": "Russian",            "t": "Русский (Russkij)",            "xlp": "russian"     ],
        "sa":    [ "c": "sa",    "n": "Sanskrit",           "t": "Sanskrit",                     "xlp": "sanskrit"    ],
        "se":    [ "c": "se",    "n": "Sami",               "t": "Samin",                        "xlp": "samin"       ],
        "sk":    [ "c": "sk",    "n": "Slovak",             "t": "slovensky",                    "xlp": "slovak"      ],
        "sl":    [ "c": "sl",    "n": "Slovenian",          "t": "Slovenian",                    "xlp": "slovenian"   ],
        "sq":    [ "c": "sq",    "n": "Albanian",           "t": "Albanian",                     "xlp": "albanian"    ],
        "sr":    [ "c": "sr",    "n": "Serbian",            "t": "Serbian",                      "xlp": "serbian"     ],
        "sv":    [ "c": "sv",    "n": "Swedish",            "t": "svenska",                      "xlp": "swedish"     ],
        "ta":    [ "c": "ta",    "n": "Tamil",              "t": "Tamil",                        "xlp": "tamil"       ],
        "te":    [ "c": "te",    "n": "Telugu",             "t": "Telugu",                       "xlp": "telugu"      ],
        "th":    [ "c": "th",    "n": "Thai",               "t": "Thai",                         "xlp": "thai"        ],
        "tk":    [ "c": "tk",    "n": "Turkmen",            "t": "Turkmen",                      "xlp": "turkmen"     ],
        "tr":    [ "c": "tr",    "n": "Turkish",            "t": "Türkçe",                       "xlp": "turkish"     ],
        "uk":    [ "c": "uk",    "n": "Ukrainian",          "t": "українська (ukrajins\"ka)",    "xlp": "ukrainian"   ],
        "ur":    [ "c": "ur",    "n": "Urdu",               "t": "Urdu",                         "xlp": "urdu"        ],
        // "us" is an alias entry: its "c" value is "en"
        "us":    [ "c": "en",    "n": "English (American)", "t": "English",                      "xlp": "english"     ],
        "vi":    [ "c": "vi",    "n": "Vietnamese",         "t": "Vietnamese",                   "xlp": "vietnamese"  ],
        "zh":    [ "c": "zh",    "n": "Chinese",            "t": "中文",                         "xlp": "chinese"     ],
        // fallback entry
        "xx":    [ "c": "xx",    "n": "Default",            "t": "English",                      "xlp": "english"     ],
      ];
      return _lang_codes;
    }
    /++
      Keys of the table above, in table order, including the "us" alias and
      the "xx" fallback.
      NOTE(review): "en" is listed twice (position 11 and second to last);
      left untouched in case callers depend on positions - confirm.
    +/
    string[] code_arr_ptr() {
      auto _lang_codes = [
        "am", "bg", "bn", "br", "ca", "cs", "cy", "da", "de", "el",
        "en", "eo", "es", "et", "eu", "fi", "fr", "ga", "gl", "he",
        "hi", "hr", "hy", "ia", "is", "it", "ja", "ko", "la", "lo",
        "lt", "lv", "ml", "mr", "nl", "no", "nn", "oc", "pl", "pt",
        "pt_BR", "ro", "ru", "sa", "se", "sk", "sl", "sq", "sr", "sv",
        "ta", "te", "th", "tk", "tr", "uk", "ur", "us", "vi", "zh",
        "en", "xx",
      ];
      return _lang_codes;
    }
    /++
      Language codes proper: no "us" alias, no "xx" fallback, no duplicates.
    +/
    string[] code_arr() {
      auto _lang_codes = [
        "am", "bg", "bn", "br", "ca", "cs", "cy", "da", "de", "el",
        "en", "eo", "es", "et", "eu", "fi", "fr", "ga", "gl", "he",
        "hi", "hr", "hy", "ia", "is", "it", "ja", "ko", "la", "lo",
        "lt", "lv", "ml", "mr", "nl", "no", "nn", "oc", "pl", "pt",
        "pt_BR", "ro", "ru", "sa", "se", "sk", "sl", "sq", "sr", "sv",
        "ta", "te", "th", "tk", "tr", "uk", "ur", "vi", "zh"
      ];
      return _lang_codes;
    }
    /++
      Regex alternation source built from code_arr: "(am|bg|...|zh)".
      NOTE(review): "pt" comes before "pt_BR" in the alternation, so an
      unanchored match on "pt_BR" may stop at "pt" - confirm callers anchor.
    +/
    auto codes_() {
      return "(" ~ join(code_arr,"|") ~ ")";
    }
    /++
      Run-time compiled regex of codes_.
    +/
    auto codes_regex() {
      return regex(codes_);
    }
  }
}
#+END_SRC

** 1. ctRegex :regex:
*** misc generic

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ whitespace, line breaks and nbsp markers +/
    // NOTE(review): named groups are written as (?P<name>...); confirm the names match those read by callers
    static newline                                        = ctRegex!("\n", "mg");
    static strip_br                                       = ctRegex!("^<br>\n|<br>\n*$");
    static space                                          = ctRegex!(`[ ]`, "mg");
    static spaces_line_start                              = ctRegex!(`^(?P<opening_spaces>[ ]+)`, "mg");
    static spaces_multiple                                = ctRegex!(`(?P<multiple_spaces>[ ]{2,})`, "mg"); // could be issues for endnotes
    static two_spaces                                     = ctRegex!(`[ ]{2}`, "mg");
    static nbsp_char                                      = ctRegex!(`░`, "mg");
    static nbsp_chars_line_start                          = ctRegex!(`^░+`, "mg");
    // NOTE(review): matches the literal entity text "&nbsp;" followed by a space - confirm intended pattern
    static nbsp_and_space                                 = ctRegex!(`&nbsp;[ ]`, "mg");
    static nbsp_char_and_space                            = ctRegex!(`░[ ]`, "mg");
#+END_SRC

*** filename (and path) matching (including markup insert file) :insert:file:path:filename:

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ source file names: .sst (text), .ssm (master), .ssi (insert) +/
    // NOTE(review): group names (path, filename, fn_src, fn_base, fn_src_suffix) to be confirmed against callers
    static src_pth                                        = ctRegex!(`^(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]ss[tm])$`);
    static src_fn                                         = ctRegex!(`^([a-zA-Z0-9._-]+/)*(?P<fn_src>(?P<fn_base>[a-zA-Z0-9._-]+)[.](?P<fn_src_suffix>ss[tm]))$`);
    static src_fn_master                                  = ctRegex!(`^(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]ssm)$`);
    static src_fn_text                                    = ctRegex!(`^(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]sst)$`);
    static src_fn_insert                                  = ctRegex!(`^(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]ssi)$`);
    static src_fn_find_inserts                            = ctRegex!(`^(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]ss[im])$`);
    /+ insert line in markup: "<< path/file.ssi" or "<< path/file.sst" +/
    static insert_src_fn_ssi_or_sst                       = ctRegex!(`^<<\s*(?P<path>[a-zA-Z0-9._-]+/)*(?P<filename>[a-zA-Z0-9._-]+[.]ss[ti])$`);
#+END_SRC

*** inline markup
**** inline (internal program) markup footnotes endnotes :inline:footnote:

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ inline markup footnotes endnotes +/
    static inline_notes_al                                = ctRegex!(`【(?:[*+]\s+|\s*)(.+?)】`, "mg");
    static inline_notes_al_gen                            = ctRegex!(`【.+?】`, "m");
    static inline_al_delimiter_open_regular               = ctRegex!(`【\s`, "m");
    static inline_al_delimiter_open_symbol_star           = ctRegex!(`【[*]\s`, "m");
    static inline_al_delimiter_open_symbol_plus           = ctRegex!(`【[+]\s`, "m");
    static inline_al_delimiter_close_regular              = ctRegex!(`】`, "m");
    static inline_al_delimiter_open_and_close_regular     = ctRegex!(`【|】`, "m");
    static inline_notes_delimiter_al_regular              = ctRegex!(`【(.+?)】`, "mg");
    static inline_notes_delimiter_al_regular_number_note  = ctRegex!(`【(\d+)\s+(.+?)】`, "mg");
    static inline_al_delimiter_open_asterisk              = ctRegex!(`【\*`, "m");
    static inline_al_delimiter_open_plus                  = ctRegex!(`【\+`, "m");
    // NOTE(review): group names (text, note) to be confirmed against callers
    static inline_text_and_note_al                        = ctRegex!(`(?P<text>.+?)【(?:[*+ ]*)(?P<note>.+?)】`, "mg");
    static inline_text_and_note_al_                       = ctRegex!(`(.+?(?:【[*+]*\s+.+?】|$))`, "mg");
#+END_SRC

**** inline links

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ inline markup links +/
    static inline_link                                    = ctRegex!(`┥(.+?)┝┤(.+?)├`, "mg");
    static inline_a_url                                   = ctRegex!(`(┤)(\S+?)(├)`, "mg");
    static fn_suffix                                      = ctRegex!(`\.fnSuffix`, "mg");
    static inline_link_fn_suffix                          = ctRegex!(`¤(.+?)(\.fnSuffix)`, "mg");
    static inline_seg_link                                = ctRegex!(`(¤)(?:.+?)\.fnSuffix`, "mg");
    static mark_internal_site_lnk                         = ctRegex!(`¤`, "mg");
#+END_SRC

**** TODO inline markup font face mod :inline:font:face:

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ inline markup font face mod +/
    // NOTE(review): group names (markup, mod, text) to be confirmed against callers
    static inline_faces                                   = ctRegex!(`(?P<markup>(?P<mod>[*!_^,+#-])\{(?P<text>.+?)\}[*!_^,+#-])`, "mg");
    static inline_emphasis                                = ctRegex!(`\*\{(?P<text>.+?)\}\*`, "mg");
    static inline_bold                                    = ctRegex!(`!\{(?P<text>.+?)\}!`, "mg");
    static inline_underscore                              = ctRegex!(`_\{(?P<text>.+?)\}_`, "mg");
    static inline_italics                                 = ctRegex!(`/\{(?P<text>.+?)\}/`, "mg");
    static inline_superscript                             = ctRegex!(`\^\{(?P<text>.+?)\}\^`, "mg");
    static inline_subscript                               = ctRegex!(`,\{(?P<text>.+?)\},`, "mg");
    static inline_strike                                  = ctRegex!(`-\{(?P<text>.+?)\}-`, "mg");
    static inline_insert                                  = ctRegex!(`\+\{(?P<text>.+?)\}\+`, "mg");
    static inline_mono                                    = ctRegex!(`#\{(?P<text>.+?)\}#`, "mg");
    static inline_cite                                    = ctRegex!(`"\{(?P<text>.+?)\}"`, "mg");
    /+ whole-line font face markers, e.g. a line starting "!_ " +/
    static inline_faces_line                              = ctRegex!(`^[*!/_]_ (?P<text>.+?)((?: [\\]{2}|[~]#){0,2}$)`);
    static inline_emphasis_line                           = ctRegex!(`^\*_ (?P<text>.+?)((?: [\\]{2}|[~]#){0,2}$)`);
    static inline_bold_line                               = ctRegex!(`^!_ (?P<text>.+?)((?: [\\]{2}|[~]#){0,2}$)`);
    static inline_italics_line                            = ctRegex!(`^/_ (?P<text>.+?)((?: [\\]{2}|[~]#){0,2}$)`);
    static inline_underscore_line                         = ctRegex!(`^__ (?P<text>.+?)((?: [\\]{2}|[~]#){0,2}$)`);
#+END_SRC

**** table related

#+name: prgmkup_rgx
#+BEGIN_SRC d
    /+ table delimiters +/
    static table_delimiter_col                            = ctRegex!("[ ]*[┊][ ]*", "mg"); //
    static table_delimiter_row                            = ctRegex!("[ ]*\n", "mg"); //
#+END_SRC

* +set colors for terminal+ (unused) :colors:terminal:

#+name: ao_ansi_colors
#+BEGIN_SRC d
    /+ ANSI escape sequences keyed by color / attribute name +/
    string[string] scr_txt_color = [
      "off"           : "\033[0m",
      "white"         : "\033[37m",
      "white_bold"    : "\033[1m",
      "marker"        : "\033[42m",
      "bold"          : "\033[1m",
      "underline"     : "\033[4m",
      "invert"        : "\033[7m",
      "darkgrey_hi"   : "\033[100m",
      "grey_hi"       : "\033[47m",
      "pink_hi"       : "\033[105m",
      "fuchsia_hi"    : "\033[45m",
      "red_hi"        : "\033[41m",
      "orange_hi"     : "\033[101m",
      "yellow_hi"     : "\033[103m",
      "brown_hi"      : "\033[43m",
      "lightgreen_hi" : "\033[102m",
      "green_hi"      : "\033[42m",
      "cyan_hi"       : "\033[106m",
      "blue_hi"       : "\033[104m",
      "navy_hi"       : "\033[44m",
      "grey"          : "\033[90m",
      "pink"          : "\033[95m",
      "fuchsia"       : "\033[35m",
      "ruby"          : "\033[31m",
      "red"           : "\033[91m",
      "orange"        : "\033[91m",
      "yellow"        : "\033[93m",
      "brown"         : "\033[33m",
      "green"         : "\033[92m",
      "darkgreen"     : "\033[32m",
      "cyan"          : "\033[36m",
      "blue"          : "\033[94m",
      "navy"          : "\033[34m",
      "black"         : "\033[30m"
    ];
    /+ a "*" marker wrapped in the named color, followed by reset and a space +/
    string[string] scr_txt_marker = [
      "white"         : "\033[37m*\033[0m ",
      "bold"          : "\033[1m*\033[0m ",
      "invert"        : "\033[7m*\033[0m ",
      "darkgrey_hi"   : "\033[100m*\033[0m ",
      "grey_hi"       : "\033[47m*\033[0m ",
      "pink_hi"       : "\033[105m*\033[0m ",
      "fuchsia_hi"    : "\033[45m*\033[0m ",
      "red_hi"        : "\033[41m*\033[0m ",
      "orange_hi"     : "\033[101m*\033[0m ",
      "yellow_hi"     : "\033[103m*\033[0m ",
      "brown_hi"      : "\033[43m*\033[0m ",
      "lightgreen_hi" : "\033[102m*\033[0m ",
      "green_hi"      : "\033[42m*\033[0m ",
      "cyan_hi"       : "\033[106m*\033[0m ",
      "blue_hi"       : "\033[104m*\033[0m ",
      "navy_hi"       : "\033[44m*\033[0m ",
      "grey"          : "\033[90m*\033[0m ",
      "pink"          : "\033[95m*\033[0m ",
      "fuchsia"       : "\033[35m*\033[0m ",
      "ruby"          : "\033[31m*\033[0m ",
      "red"           : "\033[91m*\033[0m ",
      "orange"        : "\033[91m*\033[0m ",
      "yellow"        : "\033[93m*\033[0m ",
      "brown"         : "\033[33m*\033[0m ",
      "green"         : "\033[92m*\033[0m ",
      "darkgreen"     : "\033[32m*\033[0m ",
      "cyan"          : "\033[36m*\033[0m ",
      "blue"          : "\033[94m*\033[0m ",
      "navy"          : "\033[34m*\033[0m ",
      "black"         : "\033[30m*\033[0m "
    ];
#+END_SRC