diff options
| author | Ralph Amissah <ralph@amissah.com> | 2017-10-17 13:36:41 -0400 | 
|---|---|---|
| committer | Ralph Amissah <ralph@amissah.com> | 2019-04-10 15:14:14 -0400 | 
| commit | 2a359a57ce021ba6ddf7232b3f3d79726d4738ba (patch) | |
| tree | b9e9c11ecf4bb0cc3dab7ea94454f868d69792bf /src/sdp | |
| parent | meta_abstraction, a renaming, minor (diff) | |
sqlite document db discrete & collection, started
- discrete document , drop & recreate document
  --sqlite-disctrete
- document collection
  - create tables
    --sqlite-create
  - populate db with specified document
    --sqlite-update
Diffstat (limited to 'src/sdp')
| -rw-r--r-- | src/sdp/meta/conf_make_meta_sdlang.d | 14 | ||||
| -rw-r--r-- | src/sdp/meta/defaults.d | 204 | ||||
| -rw-r--r-- | src/sdp/meta/metadoc_from_src.d | 27 | ||||
| -rw-r--r-- | src/sdp/output/epub3.d | 1 | ||||
| -rw-r--r-- | src/sdp/output/hub.d | 8 | ||||
| -rw-r--r-- | src/sdp/output/paths_output.d | 26 | ||||
| -rw-r--r-- | src/sdp/output/sqlite.d | 372 | ||||
| -rw-r--r-- | src/sdp/output/sqlite_discrete.d | 1085 | ||||
| -rwxr-xr-x | src/sdp/sdp.d | 6 | 
9 files changed, 1442 insertions, 301 deletions
| diff --git a/src/sdp/meta/conf_make_meta_sdlang.d b/src/sdp/meta/conf_make_meta_sdlang.d index 2bded69..478cea4 100644 --- a/src/sdp/meta/conf_make_meta_sdlang.d +++ b/src/sdp/meta/conf_make_meta_sdlang.d @@ -161,6 +161,7 @@ static template SiSUextractSDLang() {        }        if ("original" in header_sdlang.maybe.tags) {          _conf_composite.meta.original_language       = extractSDLangTabOrAttrib(header_sdlang, "original", "language"); +        _conf_composite.meta.original_language_char  = extractSDLangTabOrAttrib(header_sdlang, "original", "language_char");          _conf_composite.meta.original_source         = extractSDLangTabOrAttrib(header_sdlang, "original", "source");          _conf_composite.meta.original_title          = extractSDLangTabOrAttrib(header_sdlang, "original", "title");        } @@ -168,10 +169,15 @@ static template SiSUextractSDLang() {          // _conf_composite.meta.publisher               = extractSDLangTabOrAttrib(header_sdlang, "publisher", "");        }        if ("rights" in header_sdlang.maybe.tags) { -        _conf_composite.meta.rights_copyright        = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright"); -        _conf_composite.meta.rights_cover            = extractSDLangTabOrAttrib(header_sdlang, "rights", "cover"); -        _conf_composite.meta.rights_illustrations    = extractSDLangTabOrAttrib(header_sdlang, "rights", "illustrations"); -        _conf_composite.meta.rights_license          = extractSDLangTabOrAttrib(header_sdlang, "rights", "license"); +        _conf_composite.meta.rights_copyright               = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright"); +        _conf_composite.meta.rights_copyright_text          = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_text"); +        _conf_composite.meta.rights_copyright_audio         = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_audio"); +        _conf_composite.meta.rights_copyright_cover         = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_cover"); +        _conf_composite.meta.rights_copyright_illustrations = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_illustrations"); +        _conf_composite.meta.rights_copyright_photographs   = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_photographs"); +        _conf_composite.meta.rights_copyright_translation   = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_translation"); +        _conf_composite.meta.rights_copyright_video         = extractSDLangTabOrAttrib(header_sdlang, "rights", "copyright_video"); +        _conf_composite.meta.rights_license                 = extractSDLangTabOrAttrib(header_sdlang, "rights", "license");        }        if (_conf_composite.meta.creator_author.empty) {          if ("creator" in header_sdlang.maybe.tags) { diff --git a/src/sdp/meta/defaults.d b/src/sdp/meta/defaults.d index ede1523..e598aa8 100644 --- a/src/sdp/meta/defaults.d +++ b/src/sdp/meta/defaults.d @@ -23,109 +23,119 @@ template SiSUregisters() {      std.utf,      std.conv : to;    struct ConfCompositeMake { -    string bold                    = ""; -    string breaks                  = ""; -    string cover_image             = ""; -    string css                     = ""; -    string emphasis                = ""; -    string footer                  = ""; -    string headings                = ""; -    string home_button_image       = ""; -    string home_button_text        = ""; -    string italics                 = ""; -    string num_top                 = ""; -    string num_depth               = ""; -    string substitute              = ""; -    string texpdf_font             = ""; +    string bold                           = ""; +    string breaks                         = ""; +    string cover_image                    = ""; +    string css                            = ""; +    string emphasis                       = ""; +    string footer                         = ""; +    string headings                       = ""; +    string home_button_image              = ""; +    string home_button_text               = ""; +    string italics                        = ""; +    string num_top                        = ""; +    string num_depth                      = ""; +    string substitute                     = ""; +    string texpdf_font                    = "";    }    struct ConfCompositeMakeStr { -    string bold                    = ""; -    string breaks                  = ""; -    string cover_image             = ""; -    string css                     = ""; -    string emphasis                = ""; -    string footer                  = ""; -    string headings                = ""; -    string home_button_image       = ""; -    string home_button_text        = ""; -    string italics                 = ""; -    string num_top                 = ""; -    string num_depth               = ""; -    string substitute              = ""; -    string texpdf_font             = ""; +    string bold                           = ""; +    string breaks                         = ""; +    string cover_image                    = ""; +    string css                            = ""; +    string emphasis                       = ""; +    string footer                         = ""; +    string headings                       = ""; +    string home_button_image              = ""; +    string home_button_text               = ""; +    string italics                        = ""; +    string num_top                        = ""; +    string num_depth                      = ""; +    string substitute                     = ""; +    string texpdf_font                    = "";    }    struct ConfCompositeSiteLocal { -    string webserv_url_root        = ""; -    string webserv_path            = ""; -    string webserv_images          = ""; -    string webserv_cgi             = ""; -    string webserv_cgi_host        = ""; -    string webserv_cgi_host_path   = ""; -    string webserv_cgi_port        = ""; -    string webserv_cgi_user        = ""; -    string webserv_cgi_file_links  = ""; -    string processing_path         = ""; -    string processing_dir          = ""; -    string processing_concord_max  = ""; -    string flag_act0               = ""; -    string flag_act1               = ""; -    string flag_act2               = ""; -    string flag_act3               = ""; -    string flag_act4               = ""; -    string flag_act5               = ""; -    string flag_act6               = ""; -    string flag_act7               = ""; -    string flag_act8               = ""; -    string flag_act9               = ""; -    string default_papersize       = ""; -    string default_text_wrap       = ""; -    string default_emphasis        = ""; -    string default_language        = ""; -    string default_digest          = ""; -    string permission_share_source = ""; -    string search_flag             = ""; -    string search_action           = ""; -    string search_db               = ""; -    string search_title            = ""; +    string webserv_url_root               = ""; +    string webserv_path                   = ""; +    string webserv_images                 = ""; +    string webserv_cgi                    = ""; +    string webserv_cgi_host               = ""; +    string webserv_cgi_host_path          = ""; +    string webserv_cgi_port               = ""; +    string webserv_cgi_user               = ""; +    string webserv_cgi_file_links         = ""; +    string processing_path                = ""; +    string processing_dir                 = ""; +    string processing_concord_max         = ""; +    string flag_act0                      = ""; +    string flag_act1                      = ""; +    string flag_act2                      = ""; +    string flag_act3                      = ""; +    string flag_act4                      = ""; +    string flag_act5                      = ""; +    string flag_act6                      = ""; +    string flag_act7                      = ""; +    string flag_act8                      = ""; +    string flag_act9                      = ""; +    string default_papersize              = ""; +    string default_text_wrap              = ""; +    string default_emphasis               = ""; +    string default_language               = ""; +    string default_digest                 = ""; +    string permission_share_source        = ""; +    string search_flag                    = ""; +    string search_action                  = ""; +    string search_db                      = ""; +    string search_title                   = "";    }    struct MetaComposite { -    string classify_dewey          = ""; -    string classify_keywords       = ""; -    string classify_loc            = ""; -    string classify_subject        = ""; -    string classify_topic_register = ""; -    string creator_author          = ""; -    string creator_author_email    = ""; -    string creator_illustrator     = ""; -    string creator_translator      = ""; -    string date_added_to_site      = ""; -    string date_available          = ""; -    string date_created            = ""; -    string date_issued             = ""; -    string date_modified           = ""; -    string date_published          = ""; -    string date_valid              = ""; -    string identifier_isbn         = ""; -    string identifier_oclc         = ""; -    string identifier_pg           = ""; -    string links                   = ""; -    string notes_abstract          = ""; -    string notes_description       = ""; -    string original_language       = ""; -    string original_source         = ""; -    string original_title          = ""; -    string publisher               = ""; -    string rights_copyright        = ""; -    string rights_cover            = ""; -    string rights_illustrations    = ""; -    string rights_license          = ""; -    string title_edition           = ""; -    string title_full              = ""; -    string title_language          = ""; -    string title_main              = ""; -    string title_note              = ""; -    string title_sub               = ""; -    string title_subtitle          = ""; +    string classify_dewey                 = ""; +    string classify_keywords              = ""; +    string classify_loc                   = ""; +    string classify_subject               = ""; +    string classify_topic_register        = ""; +    string creator_author                 = ""; +    string creator_author_email           = ""; +    string creator_illustrator            = ""; +    string creator_translator             = ""; +    string date_added_to_site             = ""; +    string date_available                 = ""; +    string date_created                   = ""; +    string date_issued                    = ""; +    string date_modified                  = ""; +    string date_published                 = ""; +    string date_valid                     = ""; +    string identifier_isbn                = ""; +    string identifier_oclc                = ""; +    string identifier_pg                  = ""; +    string language_document              = ""; +    string language_document_char         = ""; +    string links                          = ""; +    string notes_abstract                 = ""; +    string notes_description              = ""; +    string original_language              = ""; +    string original_language_char         = ""; +    string original_publisher             = ""; +    string original_source                = ""; +    string original_title                 = ""; +    string publisher                      = ""; +    string rights_copyright               = ""; +    string rights_copyright_audio         = ""; +    string rights_copyright_cover         = ""; +    string rights_copyright_illustrations = ""; +    string rights_copyright_photographs   = ""; +    string rights_copyright_text          = ""; +    string rights_copyright_translation   = ""; +    string rights_copyright_video         = ""; +    string rights_license                 = ""; +    string title_edition                  = ""; +    string title_full                     = ""; +    string title_language                 = ""; +    string title_main                     = ""; +    string title_note                     = ""; +    string title_short                    = ""; +    string title_sub                      = ""; +    string title_subtitle                 = "";    }    struct ConfComposite {      MetaComposite          meta; diff --git a/src/sdp/meta/metadoc_from_src.d b/src/sdp/meta/metadoc_from_src.d index b4bee7a..80de1f2 100644 --- a/src/sdp/meta/metadoc_from_src.d +++ b/src/sdp/meta/metadoc_from_src.d @@ -1375,7 +1375,8 @@ template SiSUdocAbstraction() {          || (opt_action["html-scroll"])          || (opt_action["html-seg"])          || (opt_action["epub"]) -        || (opt_action["sqlite"]) +        || (opt_action["sqlite-discrete"]) +        || (opt_action["sqlite-update"])          || (opt_action["postgresql"])) {            obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);            obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1401,7 +1402,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1458,7 +1460,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1499,7 +1502,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1533,7 +1537,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1571,7 +1576,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1614,7 +1620,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1652,7 +1659,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); @@ -1691,7 +1699,8 @@ template SiSUdocAbstraction() {            || (opt_action["html-scroll"])            || (opt_action["html-seg"])            || (opt_action["epub"]) -          || (opt_action["sqlite"]) +          || (opt_action["sqlite-discrete"]) +          || (opt_action["sqlite-update"])            || (opt_action["postgresql"])) {              obj = obj_dom_structure_set_markup_tags(obj, dom_markedup, obj.heading_lev_markup);              obj = obj_dom_set_collapsed_tags(obj, dom_collapsed, obj.heading_lev_collapsed); diff --git a/src/sdp/output/epub3.d b/src/sdp/output/epub3.d index 7851c09..b6987ae 100644 --- a/src/sdp/output/epub3.d +++ b/src/sdp/output/epub3.d @@ -508,6 +508,7 @@ template outputEPub3() {            }          }          if (obj.is_a == "heading") { +          assert(obj.text.length > 0);            if (obj.heading_lev_markup <= 4) {              oepbs_content_parts["manifest_documents"] ~=                format(q"¶      <item id="%s.xhtml" href="%s.xhtml" media-type="application/xhtml+xml" /> diff --git a/src/sdp/output/hub.d b/src/sdp/output/hub.d index d25905f..4f5a363 100644 --- a/src/sdp/output/hub.d +++ b/src/sdp/output/hub.d @@ -8,6 +8,7 @@ template outputHub() {      sdp.output.epub3,      sdp.output.html,      sdp.output.sqlite, +    sdp.output.sqlite_discrete,      sdp.output.xmls,      sdp.output.source_sisupod,      sdp.output.create_zip_file, @@ -73,7 +74,11 @@ template outputHub() {        /+ mixin outputODT; +/        writeln("odt processing");      } -    if (doc_matters.opt_action["sqlite"]) { +    if (doc_matters.opt_action["sqlite-discrete"]) { +      if ((doc_matters.opt_action["verbose"])) { writeln("sqlite processing... "); } +      SQLiteDiscreteBuildTablesAndPopulate!()(doc_abstraction, doc_matters); +    } +    if (doc_matters.opt_action["sqlite-update"]) {        if ((doc_matters.opt_action["verbose"])) { writeln("sqlite processing... "); }        SQLiteBuildTablesAndPopulate!()(doc_abstraction, doc_matters);      } @@ -88,6 +93,7 @@ template outputHubOp() {      sdp.output.epub3,      sdp.output.html,      sdp.output.sqlite, +    sdp.output.sqlite_discrete,      sdp.output.xmls,      sdp.output.source_sisupod,      sdp.output.create_zip_file, diff --git a/src/sdp/output/paths_output.d b/src/sdp/output/paths_output.d index ae4d4ac..d66ada8 100644 --- a/src/sdp/output/paths_output.d +++ b/src/sdp/output/paths_output.d @@ -295,6 +295,32 @@ template SiSUpathsEPUB() {      return _PathsStruct();    }  } +template SiSUpathsSQLiteDiscrete() { +  mixin SiSUrgxInit; +  static auto rgx = Rgx(); +  auto SiSUpathsSQLiteDiscrete(Ps,Lng)( +    Ps  src_pth_info, +    Lng lng, +  ) { +    auto out_pth = SiSUoutPaths!()(src_pth_info, lng); +    string base_dir = "sqlite"; +    struct _PathsStruct { +      string base_filename(string fn_src) { +        return fn_src.baseName.stripExtension; +      } +      string base() { +        return (out_pth.output_base).chainPath(base_dir).array; +      } +      string seg(string fn_src) { +        return base.chainPath(base_filename(fn_src)).array; +      } +      string sqlite_file(string fn_src) { +        return base.chainPath(base_filename(fn_src) ~ ".sqlite").array; +      } +    } +    return _PathsStruct(); +  } +}  template SiSUpathsSQLite() {    mixin SiSUrgxInit;    static auto rgx = Rgx(); diff --git a/src/sdp/output/sqlite.d b/src/sdp/output/sqlite.d index e7ef6bf..69c7d51 100644 --- a/src/sdp/output/sqlite.d +++ b/src/sdp/output/sqlite.d @@ -3,7 +3,6 @@ import sdp.output;  import    std.file,    std.conv : to; -import sdp.output.sqlite;  template SQLiteBuildTablesAndPopulate() {    void SQLiteBuildTablesAndPopulate(D,I)(      auto ref const D    doc_abstraction, @@ -11,7 +10,6 @@ template SQLiteBuildTablesAndPopulate() {    ) {      import d2sqlite3;      import std.typecons : Nullable; -    import sdp.output.sqlite;      mixin SiSUoutputRgxInit;      static auto rgx = Rgx();      template SQLiteFormatAndLoadObject() { @@ -459,128 +457,132 @@ template SQLiteBuildTablesAndPopulate() {          auto ref              I    doc_matters,        ) {          auto pth_sqlite = SiSUpathsSQLite!()(doc_matters.src_path_info, doc_matters.language); -        auto db = Database(pth_sqlite.sqlite_file(doc_matters.source_filename)); +        auto db = Database(pth_sqlite.sqlite_file(doc_matters.environment["pwd"].baseName));          // auto db = Database(":memory:"); // open database in memory -        db.run(" -        DROP TABLE IF EXISTS metadata_and_text; -        DROP TABLE IF EXISTS doc_objects; -        DROP TABLE IF EXISTS urls; -        CREATE TABLE metadata_and_text ( -          tid                              BIGINT            PRIMARY KEY, -          title                            VARCHAR(800)  NOT NULL, -          title_main                       VARCHAR(400)      NULL, /*NOT*/ -          title_sub                        VARCHAR(400)      NULL, -          title_short                      VARCHAR(400)      NULL, -          title_edition                    VARCHAR(10)       NULL, -          title_note                       VARCHAR(2500)     NULL, -          title_language                   VARCHAR(100)      NULL, -          title_language_char              VARCHAR(6)        NULL, -          creator_author                   VARCHAR(600)      NULL, -          creator_author_hon               VARCHAR(100)      NULL, -          creator_author_nationality       VARCHAR(100)      NULL, -          creator_editor                   VARCHAR(600)      NULL, -          creator_contributor              VARCHAR(600)      NULL, -          creator_illustrator              VARCHAR(600)      NULL, -          creator_photographer             VARCHAR(600)      NULL, -          creator_translator               VARCHAR(600)      NULL, -          creator_prepared_by              VARCHAR(600)      NULL, -          creator_digitized_by             VARCHAR(600)      NULL, -          creator_audio                    VARCHAR(600)      NULL, -          creator_video                    VARCHAR(600)      NULL, -          language_document                VARCHAR(100)      NULL, -          language_document_char           VARCHAR(6)        NULL, /*NOT*/ -          language_original                VARCHAR(100)      NULL, -          language_original_char           VARCHAR(6)        NULL, -          date_added_to_site               VARCHAR(10)       NULL, -          date_available                   VARCHAR(10)       NULL, -          date_created                     VARCHAR(10)       NULL, -          date_issued                      VARCHAR(10)       NULL, -          date_modified                    VARCHAR(10)       NULL, -          date_published                   VARCHAR(10)       NULL, -          date_valid                       VARCHAR(10)       NULL, -          date_translated                  VARCHAR(10)       NULL, -          date_original_publication        VARCHAR(10)       NULL, -          date_generated                   VARCHAR(10)       NULL, -          publisher                        VARCHAR(600)      NULL, -          original_publisher               VARCHAR(600)      NULL, -          original_language                VARCHAR(100)      NULL, -          original_language_char           VARCHAR(6)        NULL, -          original_source                  VARCHAR(600)      NULL, -          original_institution             VARCHAR(600)      NULL, -          original_nationality             VARCHAR(100)      NULL, -          rights                           VARCHAR(2500)     NULL, -          rights_copyright_text            VARCHAR(2500)     NULL, -          rights_copyright_translation     VARCHAR(2500)     NULL, -          rights_copyright_illustrations   VARCHAR(2500)     NULL, -          rights_copyright_photographs     VARCHAR(2500)     NULL, -          rights_copyright_preparation     VARCHAR(2500)     NULL, -          rights_copyright_digitization    VARCHAR(2500)     NULL, -          rights_copyright_audio           VARCHAR(2500)     NULL, -          rights_copyright_video           VARCHAR(2500)     NULL, -          rights_license                   VARCHAR(2500)     NULL, -          identifier_oclc                  VARCHAR(30)       NULL, -          identifier_isbn                  VARCHAR(16)       NULL, -          classify_topic_register          VARCHAR(2500)     NULL, -          classify_subject                 VARCHAR(600)      NULL, -          classify_loc                     VARCHAR(30)       NULL, -          classify_dewey                   VARCHAR(30)       NULL, -          classify_keywords                VARCHAR(600)      NULL, -          notes_abstract                   TEXT              NULL, -          notes_description                TEXT              NULL, -          notes_comment                    TEXT              NULL, -          notes_coverage                   VARCHAR(200)      NULL, -          notes_relation                   VARCHAR(200)      NULL, -          notes_history                    VARCHAR(600)      NULL, -          notes_type                       VARCHAR(600)      NULL, -          notes_format                     VARCHAR(600)      NULL, -          notes_prefix                     TEXT              NULL, -          notes_prefix_a                   TEXT              NULL, -          notes_prefix_b                   TEXT              NULL, -          notes_suffix                     TEXT              NULL, -          src_filename                     VARCHAR(256)      NULL, -          src_fingerprint                  VARCHAR(256)      NULL, -          src_filesize                     VARCHAR(10)       NULL, -          src_wordcount                    VARCHAR(10)       NULL, -          src_text                         TEXT              NULL, -          fulltext                         TEXT              NULL, -          links                            TEXT              NULL -        ); -         -        CREATE TABLE doc_objects ( -          lid                              BIGINT PRIMARY KEY, -          metadata_tid                     BIGINT REFERENCES metadata_and_text, -          ocn                              SMALLINT, -          ocnd                             VARCHAR(6), -          ocns                             VARCHAR(6), -          clean                            TEXT NULL, -          body                             TEXT NULL, -          book_idx                         TEXT NULL, -          seg                              VARCHAR(256) NULL, -          lev_an                           VARCHAR(1), -          lev                              SMALLINT NULL, -          lev0                             SMALLINT, -          lev1                             SMALLINT, -          lev2                             SMALLINT, -          lev3                             SMALLINT, -          lev4                             SMALLINT, -          lev5                             SMALLINT, -          lev6                             SMALLINT, -          lev7                             SMALLINT, -          en_a                             SMALLINT NULL, -          en_z                             SMALLINT NULL, -          en_a_asterisk                    SMALLINT NULL, -          en_z_asterisk                    SMALLINT NULL, -          en_a_plus                        SMALLINT NULL, -          en_z_plus                        SMALLINT NULL, -          t_of                             VARCHAR(16), -          t_is                             VARCHAR(16), -          node                             VARCHAR(16) NULL, -          parent                           VARCHAR(16) NULL, -          digest_clean                     CHAR(256), -          digest_all                       CHAR(256), -          types                            CHAR(1) NULL -        ) -        "); +        if (doc_matters.opt_action["sqlite-create"]) { +          if ((doc_matters.opt_action["verbose"])) { writeln("sqlite create tables... "); } +          db.run(" +          DROP TABLE IF EXISTS metadata_and_text; +          DROP TABLE IF EXISTS doc_objects; +          DROP TABLE IF EXISTS urls; +          CREATE TABLE metadata_and_text ( +            tid                              BIGINT            PRIMARY KEY, +            title                            VARCHAR(800)  NOT NULL, +            title_main                       VARCHAR(400)      NULL, /*NOT*/ +            title_sub                        VARCHAR(400)      NULL, +            title_short                      VARCHAR(400)      NULL, +            title_edition                    VARCHAR(10)       NULL, +            title_note                       VARCHAR(2500)     NULL, +            title_language                   VARCHAR(100)      NULL, +            title_language_char              VARCHAR(6)        NULL, +            creator_author                   VARCHAR(600)      NULL, +            creator_author_email             VARCHAR(100)      NULL, +            creator_author_hon               VARCHAR(100)      NULL, +            creator_author_nationality       VARCHAR(100)      NULL, +            creator_editor                   VARCHAR(600)      NULL, +            creator_contributor              VARCHAR(600)      NULL, +            creator_illustrator              VARCHAR(600)      NULL, +            creator_photographer             VARCHAR(600)      NULL, +            creator_translator               VARCHAR(600)      NULL, +            creator_prepared_by              VARCHAR(600)      NULL, +            creator_digitized_by             VARCHAR(600)      NULL, +            creator_audio                    VARCHAR(600)      NULL, +            creator_video                    VARCHAR(600)      NULL, +            language_document                VARCHAR(100)      NULL, +            language_document_char           VARCHAR(6)        NULL, /*NOT*/ +            language_original                VARCHAR(100)      NULL, +            language_original_char           VARCHAR(6)        NULL, +            date_added_to_site               VARCHAR(10)       NULL, +            date_available                   VARCHAR(10)       NULL, +            date_created                     VARCHAR(10)       NULL, +            date_issued                      VARCHAR(10)       NULL, +            date_modified                    VARCHAR(10)       NULL, +            date_published                   VARCHAR(10)       NULL, +            date_valid                       VARCHAR(10)       NULL, +            date_translated                  VARCHAR(10)       NULL, +            date_original_publication        VARCHAR(10)       NULL, +            date_generated                   VARCHAR(10)       NULL, +            publisher                        VARCHAR(600)      NULL, +            original_publisher               VARCHAR(600)      NULL, +            original_language                VARCHAR(100)      NULL, +            original_language_char           VARCHAR(6)        NULL, +            original_source                  VARCHAR(600)      NULL, +            original_institution             VARCHAR(600)      NULL, +            original_nationality             VARCHAR(100)      NULL, +            original_title                   VARCHAR(800)      NULL, +            rights_copyright                 VARCHAR(2500)     NULL, +            rights_copyright_audio           VARCHAR(2500)     NULL, +            rights_copyright_cover           VARCHAR(2500)     NULL, +            rights_copyright_illustrations   VARCHAR(2500)     NULL, +            rights_copyright_photographs     VARCHAR(2500)     NULL, +            rights_copyright_text            VARCHAR(2500)     NULL, +            rights_copyright_translation     VARCHAR(2500)     NULL, +            rights_copyright_video           VARCHAR(2500)     NULL, +            rights_license                   VARCHAR(2500)     NULL, +            identifier_oclc                  VARCHAR(30)       NULL, +            identifier_isbn                  VARCHAR(16)       NULL, +            classify_topic_register          VARCHAR(2500)     NULL, +            classify_subject                 VARCHAR(600)      NULL, +            classify_loc                     VARCHAR(30)       NULL, +            classify_dewey                   VARCHAR(30)       NULL, +            classify_keywords                VARCHAR(600)      NULL, +            notes_abstract                   TEXT              NULL, +            notes_description                TEXT              NULL, +            notes_comment                    TEXT              NULL, +            notes_coverage                   VARCHAR(200)      NULL, +            notes_relation                   VARCHAR(200)      NULL, +            notes_history                    VARCHAR(600)      NULL, +            notes_type                       VARCHAR(600)      NULL, +            notes_format                     VARCHAR(600)      NULL, +            notes_prefix                     TEXT              NULL, +            notes_prefix_a                   TEXT              NULL, +            notes_prefix_b                   TEXT              NULL, +            notes_suffix                     TEXT              NULL, +            src_filename                     VARCHAR(256)      NULL, +            src_fingerprint                  VARCHAR(256)      NULL, +            src_filesize                     VARCHAR(10)       NULL, +            src_wordcount                    VARCHAR(10)       NULL, +            src_text                         TEXT              NULL, +            fulltext                         TEXT              NULL, +            links                            TEXT              NULL +          ); +          /* */ +          CREATE TABLE doc_objects ( +            lid                              BIGINT PRIMARY KEY, +            metadata_tid                     BIGINT REFERENCES metadata_and_text, +            ocn                              SMALLINT, +            ocnd                             VARCHAR(6), +            ocns                             VARCHAR(6), +            clean                            TEXT NULL, +            body                             TEXT NULL, +            book_idx                         TEXT NULL, +            seg                              VARCHAR(256) NULL, +            lev_an                           VARCHAR(1), +            lev                              SMALLINT NULL, +            lev0                             SMALLINT, +            lev1                             SMALLINT, +            lev2                             SMALLINT, +            lev3                             SMALLINT, +            lev4                             SMALLINT, +            lev5                             SMALLINT, +            lev6                             SMALLINT, +            lev7                             SMALLINT, +            en_a                             SMALLINT NULL, +            en_z                             SMALLINT NULL, +            en_a_asterisk                    SMALLINT NULL, +            en_z_asterisk                    SMALLINT NULL, +            en_a_plus                        SMALLINT NULL, +            en_z_plus                        SMALLINT NULL, +            t_of                             VARCHAR(16), +            t_is                             VARCHAR(16), +            node                             VARCHAR(16) NULL, +            parent                           VARCHAR(16) NULL, +            digest_clean                     CHAR(256), +            digest_all                       CHAR(256), +            types                            CHAR(1) NULL +          ) +          "); +        }          Statement insert_metadata = db.prepare("            INSERT INTO metadata_and_text (              tid, @@ -593,6 +595,7 @@ template SQLiteBuildTablesAndPopulate() {              title_language,              title_language_char,              creator_author, +            creator_author_email,              creator_author_hon,              creator_author_nationality,              creator_editor, @@ -625,14 +628,14 @@ template SQLiteBuildTablesAndPopulate() {              original_source,              original_institution,              original_nationality, -            rights, -            rights_copyright_text, -            rights_copyright_translation, +            original_title, +            rights_copyright, +            rights_copyright_audio, +            rights_copyright_cover,              rights_copyright_illustrations,              rights_copyright_photographs, -            rights_copyright_preparation, -            rights_copyright_digitization, -            rights_copyright_audio, +            rights_copyright_text, +            rights_copyright_translation,              rights_copyright_video,              rights_license,              identifier_oclc, @@ -673,6 +676,7 @@ template SQLiteBuildTablesAndPopulate() {              :title_language,              :title_language_char,              :creator_author, +            :creator_author_email,              :creator_author_hon,              :creator_author_nationality,              :creator_editor, @@ -705,14 +709,14 @@ template SQLiteBuildTablesAndPopulate() {              :original_source,              :original_institution,              :original_nationality, -            :rights, -            :rights_copyright_text, -            :rights_copyright_translation, +            :original_title, +            :rights_copyright, +            :rights_copyright_audio, +            :rights_copyright_cover,              :rights_copyright_illustrations,              :rights_copyright_photographs, -            :rights_copyright_preparation, -            :rights_copyright_digitization, -            :rights_copyright_audio, +            :rights_copyright_text, +            :rights_copyright_translation,              :rights_copyright_video,              :rights_license,              :identifier_oclc, @@ -743,74 +747,66 @@ template SQLiteBuildTablesAndPopulate() {              :links            )          "); +        // insert_metadata.bind(":tid",                               ); // unique identifier you could try use sha of title author & language? or auto increment??          insert_metadata.bind(":title",                             doc_matters.conf_make_meta.meta.title_full); -        // insert_metadata.bind(":title_main",                     doc_matters.conf_make_meta.meta.title_main); -        // insert_metadata.bind(":title_sub",                      doc_matters.conf_make_meta.meta.title_subtitle); -        // insert_metadata.bind(":title_short",                    doc_matters.conf_make_meta.meta.title_short); // -        // insert_metadata.bind(":title_edition",                  doc_matters.conf_make_meta.meta.title_edition); -        // insert_metadata.bind(":title_note",                     doc_matters.conf_make_meta.meta.title_note); -        // insert_metadata.bind(":title_language",                 doc_matters.conf_make_meta.meta.title_language); +        insert_metadata.bind(":title_main",                        doc_matters.conf_make_meta.meta.title_main); +        insert_metadata.bind(":title_sub",                         doc_matters.conf_make_meta.meta.title_subtitle); +        insert_metadata.bind(":title_short",                       doc_matters.conf_make_meta.meta.title_short); // +        insert_metadata.bind(":title_edition",                     doc_matters.conf_make_meta.meta.title_edition); +        insert_metadata.bind(":title_language",                    doc_matters.conf_make_meta.meta.title_language);          // insert_metadata.bind(":title_language_char",            doc_matters.conf_make_meta.meta.title_language_char); +        insert_metadata.bind(":classify_dewey",                    doc_matters.conf_make_meta.meta.classify_dewey); +        insert_metadata.bind(":classify_keywords",                 doc_matters.conf_make_meta.meta.classify_keywords); +        insert_metadata.bind(":classify_loc",                      doc_matters.conf_make_meta.meta.classify_loc); +        insert_metadata.bind(":classify_subject",                  doc_matters.conf_make_meta.meta.classify_subject); +        insert_metadata.bind(":classify_topic_register",           doc_matters.conf_make_meta.meta.classify_topic_register);          insert_metadata.bind(":creator_author",                    doc_matters.conf_make_meta.meta.creator_author); -        // insert_metadata.bind(":creator_author_hon",             doc_matters.conf_make_meta.meta.creator_author_hon); -        // insert_metadata.bind(":creator_author_nationality",     doc_matters.conf_make_meta.meta.creator_author_nationality); +        insert_metadata.bind(":creator_author_email",              doc_matters.conf_make_meta.meta.creator_author_email);          // insert_metadata.bind(":creator_editor",                 doc_matters.conf_make_meta.meta.creator_editor);          // insert_metadata.bind(":creator_contributor",            doc_matters.conf_make_meta.meta.creator_contributor); -        // insert_metadata.bind(":creator_illustrator",            doc_matters.conf_make_meta.meta.creator_illustrator); +        insert_metadata.bind(":creator_illustrator",               doc_matters.conf_make_meta.meta.creator_illustrator);          // insert_metadata.bind(":creator_photographer",           doc_matters.conf_make_meta.meta.creator_photographer); -        // insert_metadata.bind(":creator_translator",             doc_matters.conf_make_meta.meta.creator_translator); -        // insert_metadata.bind(":creator_prepared_by",            doc_matters.conf_make_meta.meta.creator_prepared_by); -        // insert_metadata.bind(":creator_digitized_by",           doc_matters.conf_make_meta.meta.creator_digitized_by); +        insert_metadata.bind(":creator_translator",                doc_matters.conf_make_meta.meta.creator_translator);          // insert_metadata.bind(":creator_audio",                  doc_matters.conf_make_meta.meta.creator_audio);          // insert_metadata.bind(":creator_video",                  doc_matters.conf_make_meta.meta.creator_video); -        // insert_metadata.bind(":language_document",              doc_matters.conf_make_meta.meta.language_document); -        // insert_metadata.bind(":language_document_char",         doc_matters.conf_make_meta.meta.language_document_char); -        // insert_metadata.bind(":language_original",              doc_matters.conf_make_meta.meta.language_original); -        // insert_metadata.bind(":language_original_char",         doc_matters.conf_make_meta.meta.language_original_char); -        // insert_metadata.bind(":date_added_to_site",             doc_matters.conf_make_meta.meta.date_added_to_site); -        // insert_metadata.bind(":date_available",                 doc_matters.conf_make_meta.meta.date_available); -        // insert_metadata.bind(":date_created",                   doc_matters.conf_make_meta.meta.date_created); -        // insert_metadata.bind(":date_issued",                    doc_matters.conf_make_meta.meta.date_issued); -        // insert_metadata.bind(":date_modified",                  doc_matters.conf_make_meta.meta.date_modified); -        // insert_metadata.bind(":date_published",                 doc_matters.conf_make_meta.meta.date_published); -        // insert_metadata.bind(":date_valid",                     doc_matters.conf_make_meta.meta.date_valid); +        insert_metadata.bind(":date_added_to_site",                doc_matters.conf_make_meta.meta.date_added_to_site); +        insert_metadata.bind(":date_available",                    doc_matters.conf_make_meta.meta.date_available); +        insert_metadata.bind(":date_created",                      doc_matters.conf_make_meta.meta.date_created); +        insert_metadata.bind(":date_issued",                       doc_matters.conf_make_meta.meta.date_issued); +        insert_metadata.bind(":date_modified",                     doc_matters.conf_make_meta.meta.date_modified); +        insert_metadata.bind(":date_published",                    doc_matters.conf_make_meta.meta.date_published); +        insert_metadata.bind(":date_valid",                        doc_matters.conf_make_meta.meta.date_valid);          // insert_metadata.bind(":date_translated",                doc_matters.conf_make_meta.meta.date_translated);          // insert_metadata.bind(":date_original_publication",      doc_matters.conf_make_meta.meta.date_original_publication);          // insert_metadata.bind(":date_generated",                 doc_matters.conf_make_meta.meta.date_generated); -        // insert_metadata.bind(":publisher",                      doc_matters.conf_make_meta.meta.publisher)); -        // insert_metadata.bind(":original_publisher",             doc_matters.conf_make_meta.meta.original_publisher); -        // insert_metadata.bind(":original_language",              doc_matters.conf_make_meta.meta.original_language); -        // insert_metadata.bind(":original_language_char",         doc_matters.conf_make_meta.meta.original_language_char); -        // insert_metadata.bind(":original_source",                doc_matters.conf_make_meta.meta.original_source); -        // insert_metadata.bind(":original_institution",           doc_matters.conf_make_meta.meta.original_institution); -        // insert_metadata.bind(":original_nationality",           doc_matters.conf_make_meta.meta.original_nationality); +        insert_metadata.bind(":identifier_isbn",                   doc_matters.conf_make_meta.meta.identifier_isbn); +        insert_metadata.bind(":identifier_oclc",                   doc_matters.conf_make_meta.meta.identifier_oclc); +        insert_metadata.bind(":language_document",                 doc_matters.conf_make_meta.meta.language_document); +        insert_metadata.bind(":language_document_char",            doc_matters.conf_make_meta.meta.language_document_char); +        // insert_metadata.bind(":language_original",              doc_matters.conf_make_meta.meta.language_original); +        // insert_metadata.bind(":language_original_char",         doc_matters.conf_make_meta.meta.language_original_char); +        insert_metadata.bind(":notes_abstract",                    doc_matters.conf_make_meta.meta.notes_abstract); +        insert_metadata.bind(":notes_description",                 doc_matters.conf_make_meta.meta.notes_description); +        insert_metadata.bind(":original_publisher",                doc_matters.conf_make_meta.meta.original_publisher); +        insert_metadata.bind(":original_language",                 doc_matters.conf_make_meta.meta.original_language); +        insert_metadata.bind(":original_language_char",            doc_matters.conf_make_meta.meta.original_language_char); +        insert_metadata.bind(":original_source",                   doc_matters.conf_make_meta.meta.original_source); +        insert_metadata.bind(":original_title",                    doc_matters.conf_make_meta.meta.original_title); +        insert_metadata.bind(":publisher",                         doc_matters.conf_make_meta.meta.publisher);          // insert_metadata.bind(":rights",                         doc_matters.conf_make_meta.meta.rights); -        // insert_metadata.bind(":rights_copyright_text",          doc_matters.conf_make_meta.meta.rights_copyright_text); -        // insert_metadata.bind(":rights_copyright_translation",   doc_matters.conf_make_meta.meta.rights_copyright_translation); -        // insert_metadata.bind(":rights_copyright_illustrations", doc_matters.conf_make_meta.meta.rights_illustrations); -        // insert_metadata.bind(":rights_copyright_photographs",   doc_matters.conf_make_meta.meta.rights_photographs); +        insert_metadata.bind(":rights_copyright",                  doc_matters.conf_make_meta.meta.rights_copyright); +        insert_metadata.bind(":rights_copyright_audio",            doc_matters.conf_make_meta.meta.rights_copyright_audio); +        insert_metadata.bind(":rights_copyright_cover",            doc_matters.conf_make_meta.meta.rights_copyright_cover); +        insert_metadata.bind(":rights_copyright_illustrations",    doc_matters.conf_make_meta.meta.rights_copyright_illustrations); +        insert_metadata.bind(":rights_copyright_photographs",      doc_matters.conf_make_meta.meta.rights_copyright_photographs);          // insert_metadata.bind(":rights_copyright_preparation",   doc_matters.conf_make_meta.meta.rights_preparation); +        insert_metadata.bind(":rights_copyright_text",      doc_matters.conf_make_meta.meta.rights_copyright_text); +        insert_metadata.bind(":rights_copyright_translation",      doc_matters.conf_make_meta.meta.rights_copyright_translation); +        insert_metadata.bind(":rights_copyright_video",            doc_matters.conf_make_meta.meta.rights_copyright_video);          // insert_metadata.bind(":rights_copyright_digitization",  doc_matters.conf_make_meta.meta.rights_digitization);          // insert_metadata.bind(":rights_copyright_audio",         doc_matters.conf_make_meta.meta.rights_audio);          // insert_metadata.bind(":rights_copyright_video",         doc_matters.conf_make_meta.meta.rights_video); -        // insert_metadata.bind(":rights_license",                 doc_matters.conf_make_meta.meta.rights_license); -        // insert_metadata.bind(":identifier_oclc",                doc_matters.conf_make_meta.meta.identifier_oclc); -        // insert_metadata.bind(":identifier_isbn",                doc_matters.conf_make_meta.meta.identifier_isbn); -        // insert_metadata.bind(":classify_topic_register",        doc_matters.conf_make_meta.meta.classify_topic_register); -        // insert_metadata.bind(":classify_subject",               doc_matters.conf_make_meta.meta.classify_subject); -        // insert_metadata.bind(":classify_loc",                   doc_matters.conf_make_meta.meta.classify_loc); -        // insert_metadata.bind(":notes_abstract",                 doc_matters.conf_make_meta.meta.notes_abstract); -        // insert_metadata.bind(":notes_description",              doc_matters.conf_make_meta.meta.notes_description); -        // insert_metadata.bind(":notes_comment",                  doc_matters.conf_make_meta.meta.notes_comment); -        // insert_metadata.bind(":notes_coverage",                 doc_matters.conf_make_meta.meta.notes_coverage); -        // insert_metadata.bind(":notes_relation",                 doc_matters.conf_make_meta.meta.notes_relation); -        // insert_metadata.bind(":notes_history",                  doc_matters.conf_make_meta.meta.notes_history); -        // insert_metadata.bind(":notes_type",                     doc_matters.conf_make_meta.meta.notes_type); -        // insert_metadata.bind(":notes_format",                   doc_matters.conf_make_meta.meta.notes_format); -        // insert_metadata.bind(":notes_prefix",                   doc_matters.conf_make_meta.meta.notes_prefix); -        // insert_metadata.bind(":notes_prefix_a",                 doc_matters.conf_make_meta.meta.notes_prefix_a); -        // insert_metadata.bind(":notes_prefix_b",                 doc_matters.conf_make_meta.meta.notes_prefix_b); -        // insert_metadata.bind(":notes_suffix",                   doc_matters.conf_make_meta.meta.notes_suffix); +        insert_metadata.bind(":rights_license",                    doc_matters.conf_make_meta.meta.rights_license);          // insert_metadata.bind(":src_filename",                   doc_matters.conf_make_meta.meta.src_filename);          // insert_metadata.bind(":src_fingerprint",                doc_matters.conf_make_meta.meta.src_fingerprint);          // insert_metadata.bind(":src_filesize",                   doc_matters.conf_make_meta.meta.src_filesize); @@ -822,7 +818,7 @@ template SQLiteBuildTablesAndPopulate() {          /+ watch +/          writeln("sql statement executed");          assert(db.totalChanges == 1); -         +        //          Statement insert_doc_objects = db.prepare("            INSERT INTO doc_objects (              lid, diff --git a/src/sdp/output/sqlite_discrete.d b/src/sdp/output/sqlite_discrete.d new file mode 100644 index 0000000..c8238f4 --- /dev/null +++ b/src/sdp/output/sqlite_discrete.d @@ -0,0 +1,1085 @@ +module sdp.output.sqlite_discrete; +import sdp.output; +import +  std.file, +  std.conv : to; +template SQLiteDiscreteBuildTablesAndPopulate() { +  void SQLiteDiscreteBuildTablesAndPopulate(D,I)( +    auto ref const D    doc_abstraction, +    auto ref I          doc_matters, +  ) { +    import d2sqlite3; +    import std.typecons : Nullable; +    mixin SiSUoutputRgxInit; +    static auto rgx = Rgx(); +    template SQLiteFormatAndLoadObject() { +      auto SQLiteFormatAndLoadObject(I)( +        auto ref              I    doc_matters, +      ) { +        mixin SiSUoutputRgxInit; +        struct sqlite_format_and_load_objects { +          auto generic_munge_sanitize_text_for_search( +            string _txt, +          ) { +            string _notes; +            string _urls; +            _txt = _txt.replaceAll(rgx.inline_fontface_clean, ""); +            if (_txt.matchFirst(rgx.inline_notes_al_gen)) { +              foreach (m; _txt.matchAll(rgx.inline_notes_al_gen_text)) { +                _notes ~= "\n" ~ m["text"]; +              } +              _txt = _txt.replaceAll(rgx.inline_notes_al_gen, ""); +            } +            if (_txt.matchFirst(rgx.inline_link)) { +              foreach (m; _txt.matchAll(rgx.inline_link)) { +                if (m["link"].match(rgx.url)) { +                  _urls ~= "\n" ~ m["link"]; +                } +              } +              _txt = _txt.replaceAll(rgx.inline_link_clean, ""); +            } +            if (_notes.length > 0) { +              _txt ~= _notes; +            } +            if (_urls.length > 0) { +              _txt ~= _urls; +            } +            if (doc_matters.opt_action["debug"]) { +              writeln(_txt, "\n"); +            } +            debug(sql_text_clean) { +              writeln(_txt); +            } +            return _txt; +          } +          auto munge_html(O)( +            auto return ref const O    obj, +          ) { +            string _html_special_characters(string _txt){ +              _txt = (_txt) +                .replaceAll(rgx.xhtml_ampersand,    "&") +                .replaceAll(rgx.xhtml_quotation,    """) +                .replaceAll(rgx.xhtml_less_than,    "<") +                .replaceAll(rgx.xhtml_greater_than, ">") +                .replaceAll(rgx.nbsp_char,          " ") +                .replaceAll(rgx.xhtml_line_break,   "<br />"); +              return _txt; +            } +            string _html_font_face(string _txt){ +              _txt = (_txt) +                .replaceAll(rgx.inline_emphasis,    ("<em>$1</em>")) +                .replaceAll(rgx.inline_bold,        ("<b>$1</b>")) +                .replaceAll(rgx.inline_underscore,  ("<u>$1</u>")) +                .replaceAll(rgx.inline_italics,     ("<i>$1</i>")) +                .replaceAll(rgx.inline_superscript, ("<sup>$1</sup>")) +                .replaceAll(rgx.inline_subscript,   ("<sub>$1</sub>")) +                .replaceAll(rgx.inline_strike,      ("<del>$1</del>")) +                .replaceAll(rgx.inline_insert,      ("<ins>$1</ins>")) +                .replaceAll(rgx.inline_mono,        ("<tt>$1</tt>")) +                .replaceAll(rgx.inline_cite,        ("<cite>$1</cite>")); +              return _txt; +            } +            string _notes; +            string _urls; +            string _txt = _html_font_face(_html_special_characters(obj.text)); +            if (_txt.matchFirst(rgx.inline_notes_al_gen)) { +              foreach (m; _txt.matchAll(rgx.inline_notes_al_gen_text)) { +                _notes ~= "\n" ~ m["text"]; +              } +              _txt = _txt.replaceAll(rgx.inline_notes_al_gen_ref, "<sup>$1</sup> "); +            } +            if (_txt.matchFirst(rgx.inline_link)) { +              foreach (m; _txt.matchAll(rgx.inline_link)) { +              } +              _txt = _txt.replaceAll(rgx.inline_link_clean, ""); +            } +            if (_notes.length > 0) { +              _txt ~= _notes; +            } +            if (doc_matters.opt_action["debug"]) { +              writeln(_txt, "\n"); +            } +            return _txt; +          } +          string html_special_characters(string _txt){ +            _txt = (_txt) +              .replaceAll(rgx.xhtml_ampersand,    "&") +              .replaceAll(rgx.xhtml_quotation,    """) +              .replaceAll(rgx.xhtml_less_than,    "<") +              .replaceAll(rgx.xhtml_greater_than, ">") +              .replaceAll(rgx.nbsp_char,          " ") +              .replaceAll(rgx.xhtml_line_break,   "<br />"); +            return _txt; +          } +          string html_special_characters_code(string _txt){ +            _txt = (_txt) +              .replaceAll(rgx.xhtml_ampersand,    "&") +              .replaceAll(rgx.xhtml_quotation,    """) +              .replaceAll(rgx.xhtml_less_than,    "<") +              .replaceAll(rgx.xhtml_greater_than, ">") +              .replaceAll(rgx.nbsp_char,          " "); +            return _txt; +          } +          string html_font_face(string _txt){ +            _txt = (_txt) +              .replaceAll(rgx.inline_emphasis,    ("<em>$1</em>")) +              .replaceAll(rgx.inline_bold,        ("<b>$1</b>")) +              .replaceAll(rgx.inline_underscore,  ("<u>$1</u>")) +              .replaceAll(rgx.inline_italics,     ("<i>$1</i>")) +              .replaceAll(rgx.inline_superscript, ("<sup>$1</sup>")) +              .replaceAll(rgx.inline_subscript,   ("<sub>$1</sub>")) +              .replaceAll(rgx.inline_strike,      ("<del>$1</del>")) +              .replaceAll(rgx.inline_insert,      ("<ins>$1</ins>")) +              .replaceAll(rgx.inline_mono,        ("<tt>$1</tt>")) +              .replaceAll(rgx.inline_cite,        ("<cite>$1</cite>")); +            return _txt; +          } +          auto html_heading(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            string o = format(q"¶<p class="%s"><b> +                %s +              </b></p>¶", +                obj.is_a, +                _txt, +              ); +            return o; +          } +          auto html_para(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            _txt = (obj.bullet) ? ("●  " ~ _txt) : _txt; +            string o = format(q"¶<p class="%s" indent="h%si%s"> +              %s +            </p>¶", +                obj.is_a, +                obj.indent_hang, +                obj.indent_base, +                _txt +              ); +            return o; +          } +          auto html_quote(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            string o = format(q"¶<p class="%s"> +              %s +            </p>¶", +                obj.is_a, +                _txt +              ); +            return o; +          } +          auto html_group(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            string o = format(q"¶<p class="%s"> +              %s +            </p>¶", +                obj.is_a, +                _txt +              ); +            return o; +          } +          auto html_block(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            string o = format(q"¶ +            <p class="%s">%s</p>¶", +                obj.is_a, +                _txt.stripRight +              ); +            return o; +          } +          auto html_verse(O)( +            auto return ref const O    obj, +          ) { +            string _txt = munge_html(obj); +            string o = format(q"¶<p class="%s">%s</p>¶", +                obj.is_a, +                _txt +              ); +            return o; +          } +          auto html_code(O)( +            auto return ref const O    obj, +          ) { +            string _txt = html_special_characters_code(obj.text); +            string o = format(q"¶<p class="%s">%s</p>¶", +                obj.is_a, +                _txt +              ); +            return o; +          } +          auto html_table(O)( +            auto return ref const O     obj, +          ) { +            auto _tablarize(O)( +              auto return ref const O    obj, +              string                     _txt, +            ) { +              string[] _table_rows = (_txt).split(rgx.table_delimiter_row); +              string[] _table_cols; +              string _table; +              string _tablenote; +              foreach(row_idx, row; _table_rows) { +                _table_cols = row.split(rgx.table_delimiter_col); +                  _table ~= "<tr>"; +                  foreach(col_idx, cell; _table_cols) { +                    if ((_table_cols.length == 1) +                    && (_table_rows.length <= row_idx+2)) { // check row_idx+2 (rather than == ++row_idx) +                      _tablenote ~= cell; +                    } else { +                      string _col_is = (row_idx == 0 && obj.table_heading) ? "th" : "td"; +                      string _align = ("style=\"text-align:" +                      ~ ((obj.table_column_aligns[col_idx] == "l") +                      ? "left\"" : "right\"")); +                      _table ~= "<" ~ _col_is ~ " width=\"" ~ obj.table_column_widths[col_idx].to!string ~ "%\" " ~ _align ~ ">"; +                      _table ~= cell; +                      _table ~= "</" ~ _col_is ~ ">"; +                    } +                  } +                  _table ~= "</tr>"; +                } +              auto t = tuple( +                _table, +                _tablenote, +              ); +              return t; +            } +            string _txt = munge_html(obj); +            auto t = _tablarize(obj, _txt); +            _txt = t[0]; +            string _note = t[1]; +            string o = format(q"¶<p class="%s"> +              <table summary="normal text css" width="95%%" border="0" bgcolor="white" cellpadding="2" align="center"> +                %s +              </table> +              %s +            </p>¶", +              obj.is_a, +              _txt, +              _note +            ); +            return o; +          } +          auto sqlite_load_string(O,Dm)( +            auto return ref const O     obj, +            auto return ref       Dm    doc_matters, +          ) { +            string o; +            return o; +          } +          auto postgresql_load_string(O,Dm)( +            auto return ref const O     obj, +            auto return ref       Dm    doc_matters, +          ) { +            string o; +            return o; +          } +          string sqlite_statement(O)( +            auto return ref const O    obj, +            string                     _txt, +            string                     _html, +          ) { +            void _sql_exe(O)( +              string                   _sql, +            ) { +              writeln(_html); +              writeln(_sql); +            } +            string _sql; +            return _sql; +          } +          auto heading(O)( +            auto return ref const O      obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_heading(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto para(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_para(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto quote(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_quote(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto group(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_group(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto block(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_block(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto verse(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_verse(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto code(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_code(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +          auto table(O)( +            auto return ref const O     obj, +          ) { +            string[string] obj_txt = [ +              "text": generic_munge_sanitize_text_for_search(obj.text), +              "html": html_table(obj) +            ]; +            if (doc_matters.opt_action["debug"]) { +              debug(sql_txt) { +                writeln(obj_txt["text"]); +              } +              debug(sql_html) { +                writeln(obj_txt["html"]); +              } +            } else { +              // load sql +            } +            return obj_txt; +          } +        } +        return sqlite_format_and_load_objects(); +      } +    } +    template SQLiteInstruct() { +      Statement SQLiteInstruct(I)( +        auto ref              I    doc_matters, +      ) { +        auto pth_sqlite = SiSUpathsSQLiteDiscrete!()(doc_matters.src_path_info, doc_matters.language); +        auto db = Database(pth_sqlite.sqlite_file(doc_matters.source_filename)); +        // auto db = Database(":memory:"); // open database in memory +        db.run(" +        DROP TABLE IF EXISTS metadata_and_text; +        DROP TABLE IF EXISTS doc_objects; +        DROP TABLE IF EXISTS urls; +          CREATE TABLE metadata_and_text ( +            tid                              BIGINT            PRIMARY KEY, +            title                            VARCHAR(800)  NOT NULL, +            title_main                       VARCHAR(400)      NULL, /*NOT*/ +            title_sub                        VARCHAR(400)      NULL, +            title_short                      VARCHAR(400)      NULL, +            title_edition                    VARCHAR(10)       NULL, +            title_note                       VARCHAR(2500)     NULL, +            title_language                   VARCHAR(100)      NULL, +            title_language_char              VARCHAR(6)        NULL, +            creator_author                   VARCHAR(600)      NULL, +            creator_author_email             VARCHAR(100)      NULL, +            creator_author_hon               VARCHAR(100)      NULL, +            creator_author_nationality       VARCHAR(100)      NULL, +            creator_editor                   VARCHAR(600)      NULL, +            creator_contributor              VARCHAR(600)      NULL, +            creator_illustrator              VARCHAR(600)      NULL, +            creator_photographer             VARCHAR(600)      NULL, +            creator_translator               VARCHAR(600)      NULL, +            creator_prepared_by              VARCHAR(600)      NULL, +            creator_digitized_by             VARCHAR(600)      NULL, +            creator_audio                    VARCHAR(600)      NULL, +            creator_video                    VARCHAR(600)      NULL, +            language_document                VARCHAR(100)      NULL, +            language_document_char           VARCHAR(6)        NULL, /*NOT*/ +            language_original                VARCHAR(100)      NULL, +            language_original_char           VARCHAR(6)        NULL, +            date_added_to_site               VARCHAR(10)       NULL, +            date_available                   VARCHAR(10)       NULL, +            date_created                     VARCHAR(10)       NULL, +            date_issued                      VARCHAR(10)       NULL, +            date_modified                    VARCHAR(10)       NULL, +            date_published                   VARCHAR(10)       NULL, +            date_valid                       VARCHAR(10)       NULL, +            date_translated                  VARCHAR(10)       NULL, +            date_original_publication        VARCHAR(10)       NULL, +            date_generated                   VARCHAR(10)       NULL, +            publisher                        VARCHAR(600)      NULL, +            original_publisher               VARCHAR(600)      NULL, +            original_language                VARCHAR(100)      NULL, +            original_language_char           VARCHAR(6)        NULL, +            original_source                  VARCHAR(600)      NULL, +            original_institution             VARCHAR(600)      NULL, +            original_nationality             VARCHAR(100)      NULL, +            original_title                   VARCHAR(800)      NULL, +            rights_copyright                 VARCHAR(2500)     NULL, +            rights_copyright_audio           VARCHAR(2500)     NULL, +            rights_copyright_cover           VARCHAR(2500)     NULL, +            rights_copyright_illustrations   VARCHAR(2500)     NULL, +            rights_copyright_photographs     VARCHAR(2500)     NULL, +            rights_copyright_text            VARCHAR(2500)     NULL, +            rights_copyright_translation     VARCHAR(2500)     NULL, +            rights_copyright_video           VARCHAR(2500)     NULL, +            rights_license                   VARCHAR(2500)     NULL, +            identifier_oclc                  VARCHAR(30)       NULL, +            identifier_isbn                  VARCHAR(16)       NULL, +            classify_topic_register          VARCHAR(2500)     NULL, +            classify_subject                 VARCHAR(600)      NULL, +            classify_loc                     VARCHAR(30)       NULL, +            classify_dewey                   VARCHAR(30)       NULL, +            classify_keywords                VARCHAR(600)      NULL, +            notes_abstract                   TEXT              NULL, +            notes_description                TEXT              NULL, +            notes_comment                    TEXT              NULL, +            notes_coverage                   VARCHAR(200)      NULL, +            notes_relation                   VARCHAR(200)      NULL, +            notes_history                    VARCHAR(600)      NULL, +            notes_type                       VARCHAR(600)      NULL, +            notes_format                     VARCHAR(600)      NULL, +            notes_prefix                     TEXT              NULL, +            notes_prefix_a                   TEXT              NULL, +            notes_prefix_b                   TEXT              NULL, +            notes_suffix                     TEXT              NULL, +            src_filename                     VARCHAR(256)      NULL, +            src_fingerprint                  VARCHAR(256)      NULL, +            src_filesize                     VARCHAR(10)       NULL, +            src_wordcount                    VARCHAR(10)       NULL, +            src_text                         TEXT              NULL, +            fulltext                         TEXT              NULL, +            links                            TEXT              NULL +          ); +          /* */ +          CREATE TABLE doc_objects ( +            lid                              BIGINT PRIMARY KEY, +            metadata_tid                     BIGINT REFERENCES metadata_and_text, +            ocn                              SMALLINT, +            ocnd                             VARCHAR(6), +            ocns                             VARCHAR(6), +            clean                            TEXT NULL, +            body                             TEXT NULL, +            book_idx                         TEXT NULL, +            seg                              VARCHAR(256) NULL, +            lev_an                           VARCHAR(1), +            lev                              SMALLINT NULL, +            lev0                             SMALLINT, +            lev1                             SMALLINT, +            lev2                             SMALLINT, +            lev3                             SMALLINT, +            lev4                             SMALLINT, +            lev5                             SMALLINT, +            lev6                             SMALLINT, +            lev7                             SMALLINT, +            en_a                             SMALLINT NULL, +            en_z                             SMALLINT NULL, +            en_a_asterisk                    SMALLINT NULL, +            en_z_asterisk                    SMALLINT NULL, +            en_a_plus                        SMALLINT NULL, +            en_z_plus                        SMALLINT NULL, +            t_of                             VARCHAR(16), +            t_is                             VARCHAR(16), +            node                             VARCHAR(16) NULL, +            parent                           VARCHAR(16) NULL, +            digest_clean                     CHAR(256), +            digest_all                       CHAR(256), +            types                            CHAR(1) NULL +          ) +        "); +        Statement insert_metadata = db.prepare(" +          INSERT INTO metadata_and_text ( +            tid, +            title, +            title_main, +            title_sub, +            title_short, +            title_edition, +            title_note, +            title_language, +            title_language_char, +            creator_author, +            creator_author_email, +            creator_author_hon, +            creator_author_nationality, +            creator_editor, +            creator_contributor, +            creator_illustrator, +            creator_photographer, +            creator_translator, +            creator_prepared_by, +            creator_digitized_by, +            creator_audio, +            creator_video, +            language_document, +            language_document_char, +            language_original, +            language_original_char, +            date_added_to_site, +            date_available, +            date_created, +            date_issued, +            date_modified, +            date_published, +            date_valid, +            date_translated, +            date_original_publication, +            date_generated, +            publisher, +            original_publisher, +            original_language, +            original_language_char, +            original_source, +            original_institution, +            original_nationality, +            original_title, +            rights_copyright, +            rights_copyright_audio, +            rights_copyright_cover, +            rights_copyright_illustrations, +            rights_copyright_photographs, +            rights_copyright_text, +            rights_copyright_translation, +            rights_copyright_video, +            rights_license, +            identifier_oclc, +            identifier_isbn, +            classify_topic_register, +            classify_subject, +            classify_loc, +            classify_dewey, +            classify_keywords, +            notes_abstract, +            notes_description, +            notes_comment, +            notes_coverage, +            notes_relation, +            notes_history, +            notes_type, +            notes_format, +            notes_prefix, +            notes_prefix_a, +            notes_prefix_b, +            notes_suffix, +            src_filename, +            src_fingerprint, +            src_filesize, +            src_wordcount, +            src_text, +            fulltext, +            links +          ) +          VALUES ( +            :tid, +            :title, +            :title_main, +            :title_sub, +            :title_short, +            :title_edition, +            :title_note, +            :title_language, +            :title_language_char, +            :creator_author, +            :creator_author_email, +            :creator_author_hon, +            :creator_author_nationality, +            :creator_editor, +            :creator_contributor, +            :creator_illustrator, +            :creator_photographer, +            :creator_translator, +            :creator_prepared_by, +            :creator_digitized_by, +            :creator_audio, +            :creator_video, +            :language_document, +            :language_document_char, +            :language_original, +            :language_original_char, +            :date_added_to_site, +            :date_available, +            :date_created, +            :date_issued, +            :date_modified, +            :date_published, +            :date_valid, +            :date_translated, +            :date_original_publication, +            :date_generated, +            :publisher, +            :original_publisher, +            :original_language, +            :original_language_char, +            :original_source, +            :original_institution, +            :original_nationality, +            :original_title, +            :rights_copyright, +            :rights_copyright_audio, +            :rights_copyright_cover, +            :rights_copyright_illustrations, +            :rights_copyright_photographs, +            :rights_copyright_text, +            :rights_copyright_translation, +            :rights_copyright_video, +            :rights_license, +            :identifier_oclc, +            :identifier_isbn, +            :classify_topic_register, +            :classify_subject, +            :classify_loc, +            :classify_dewey, +            :classify_keywords, +            :notes_abstract, +            :notes_description, +            :notes_comment, +            :notes_coverage, +            :notes_relation, +            :notes_history, +            :notes_type, +            :notes_format, +            :notes_prefix, +            :notes_prefix_a, +            :notes_prefix_b, +            :notes_suffix, +            :src_filename, +            :src_fingerprint, +            :src_filesize, +            :src_wordcount, +            :src_text, +            :fulltext, +            :links +          ) +        "); +        // insert_metadata.bind(":tid",                               ); // unique identifier you could try use sha of title author & language? or auto increment?? +        insert_metadata.bind(":title",                             doc_matters.conf_make_meta.meta.title_full); +        insert_metadata.bind(":title_main",                        doc_matters.conf_make_meta.meta.title_main); +        insert_metadata.bind(":title_sub",                         doc_matters.conf_make_meta.meta.title_subtitle); +        insert_metadata.bind(":title_short",                       doc_matters.conf_make_meta.meta.title_short); // +        insert_metadata.bind(":title_edition",                     doc_matters.conf_make_meta.meta.title_edition); +        insert_metadata.bind(":title_language",                    doc_matters.conf_make_meta.meta.title_language); +        // insert_metadata.bind(":title_language_char",            doc_matters.conf_make_meta.meta.title_language_char); +        insert_metadata.bind(":classify_dewey",                    doc_matters.conf_make_meta.meta.classify_dewey); +        insert_metadata.bind(":classify_keywords",                 doc_matters.conf_make_meta.meta.classify_keywords); +        insert_metadata.bind(":classify_loc",                      doc_matters.conf_make_meta.meta.classify_loc); +        insert_metadata.bind(":classify_subject",                  doc_matters.conf_make_meta.meta.classify_subject); +        insert_metadata.bind(":classify_topic_register",           doc_matters.conf_make_meta.meta.classify_topic_register); +        insert_metadata.bind(":creator_author",                    doc_matters.conf_make_meta.meta.creator_author); +        insert_metadata.bind(":creator_author_email",              doc_matters.conf_make_meta.meta.creator_author_email); +        // insert_metadata.bind(":creator_editor",                 doc_matters.conf_make_meta.meta.creator_editor); +        // insert_metadata.bind(":creator_contributor",            doc_matters.conf_make_meta.meta.creator_contributor); +        insert_metadata.bind(":creator_illustrator",               doc_matters.conf_make_meta.meta.creator_illustrator); +        // insert_metadata.bind(":creator_photographer",           doc_matters.conf_make_meta.meta.creator_photographer); +        insert_metadata.bind(":creator_translator",                doc_matters.conf_make_meta.meta.creator_translator); +        // insert_metadata.bind(":creator_audio",                  doc_matters.conf_make_meta.meta.creator_audio); +        // insert_metadata.bind(":creator_video",                  doc_matters.conf_make_meta.meta.creator_video); +        insert_metadata.bind(":date_added_to_site",                doc_matters.conf_make_meta.meta.date_added_to_site); +        insert_metadata.bind(":date_available",                    doc_matters.conf_make_meta.meta.date_available); +        insert_metadata.bind(":date_created",                      doc_matters.conf_make_meta.meta.date_created); +        insert_metadata.bind(":date_issued",                       doc_matters.conf_make_meta.meta.date_issued); +        insert_metadata.bind(":date_modified",                     doc_matters.conf_make_meta.meta.date_modified); +        insert_metadata.bind(":date_published",                    doc_matters.conf_make_meta.meta.date_published); +        insert_metadata.bind(":date_valid",                        doc_matters.conf_make_meta.meta.date_valid); +        // insert_metadata.bind(":date_translated",                doc_matters.conf_make_meta.meta.date_translated); +        // insert_metadata.bind(":date_original_publication",      doc_matters.conf_make_meta.meta.date_original_publication); +        // insert_metadata.bind(":date_generated",                 doc_matters.conf_make_meta.meta.date_generated); +        insert_metadata.bind(":identifier_isbn",                   doc_matters.conf_make_meta.meta.identifier_isbn); +        insert_metadata.bind(":identifier_oclc",                   doc_matters.conf_make_meta.meta.identifier_oclc); +        insert_metadata.bind(":language_document",                 doc_matters.conf_make_meta.meta.language_document); +        insert_metadata.bind(":language_document_char",            doc_matters.conf_make_meta.meta.language_document_char); +        // insert_metadata.bind(":language_original",              doc_matters.conf_make_meta.meta.language_original); +        // insert_metadata.bind(":language_original_char",         doc_matters.conf_make_meta.meta.language_original_char); +        insert_metadata.bind(":notes_abstract",                    doc_matters.conf_make_meta.meta.notes_abstract); +        insert_metadata.bind(":notes_description",                 doc_matters.conf_make_meta.meta.notes_description); +        insert_metadata.bind(":original_publisher",                doc_matters.conf_make_meta.meta.original_publisher); +        insert_metadata.bind(":original_language",                 doc_matters.conf_make_meta.meta.original_language); +        insert_metadata.bind(":original_language_char",            doc_matters.conf_make_meta.meta.original_language_char); +        insert_metadata.bind(":original_source",                   doc_matters.conf_make_meta.meta.original_source); +        insert_metadata.bind(":original_title",                    doc_matters.conf_make_meta.meta.original_title); +        insert_metadata.bind(":publisher",                         doc_matters.conf_make_meta.meta.publisher); +        // insert_metadata.bind(":rights",                         doc_matters.conf_make_meta.meta.rights); +        insert_metadata.bind(":rights_copyright",                  doc_matters.conf_make_meta.meta.rights_copyright); +        insert_metadata.bind(":rights_copyright_audio",            doc_matters.conf_make_meta.meta.rights_copyright_audio); +        insert_metadata.bind(":rights_copyright_cover",            doc_matters.conf_make_meta.meta.rights_copyright_cover); +        insert_metadata.bind(":rights_copyright_illustrations",    doc_matters.conf_make_meta.meta.rights_copyright_illustrations); +        insert_metadata.bind(":rights_copyright_photographs",      doc_matters.conf_make_meta.meta.rights_copyright_photographs); +        // insert_metadata.bind(":rights_copyright_preparation",   doc_matters.conf_make_meta.meta.rights_preparation); +        insert_metadata.bind(":rights_copyright_text",      doc_matters.conf_make_meta.meta.rights_copyright_text); +        insert_metadata.bind(":rights_copyright_translation",      doc_matters.conf_make_meta.meta.rights_copyright_translation); +        insert_metadata.bind(":rights_copyright_video",            doc_matters.conf_make_meta.meta.rights_copyright_video); +        // insert_metadata.bind(":rights_copyright_digitization",  doc_matters.conf_make_meta.meta.rights_digitization); +        // insert_metadata.bind(":rights_copyright_audio",         doc_matters.conf_make_meta.meta.rights_audio); +        // insert_metadata.bind(":rights_copyright_video",         doc_matters.conf_make_meta.meta.rights_video); +        insert_metadata.bind(":rights_license",                    doc_matters.conf_make_meta.meta.rights_license); +        // insert_metadata.bind(":src_filename",                   doc_matters.conf_make_meta.meta.src_filename); +        // insert_metadata.bind(":src_fingerprint",                doc_matters.conf_make_meta.meta.src_fingerprint); +        // insert_metadata.bind(":src_filesize",                   doc_matters.conf_make_meta.meta.src_filesize); +        // insert_metadata.bind(":src_wordcount",                  doc_matters.conf_make_meta.meta.src_wordcount); +        // insert_metadata.bind(":src_text",                       doc_matters.conf_make_meta.meta.src_text); +        // insert_metadata.bind(":fulltext",                       doc_matters.conf_make_meta.meta.fulltext); +        // insert_metadata.bind(":links",                          doc_matters.conf_make_meta.meta.links); +        insert_metadata.execute(); insert_metadata.reset(); +        /+ watch +/ +        writeln("sql statement executed"); +        assert(db.totalChanges == 1); +        // +        Statement insert_doc_objects = db.prepare(" +          INSERT INTO doc_objects ( +            lid, +            metadata_tid, +            ocn, +            ocnd, +            ocns, +            clean, +            body, +            book_idx, +            seg, +            lev_an, +            lev, +            lev0, +            lev1, +            lev2, +            lev3, +            lev4, +            lev5, +            lev6, +            lev7, +            en_a, +            en_z, +            en_a_asterisk, +            en_z_asterisk, +            en_a_plus, +            en_z_plus, +            t_of, +            t_is, +            node, +            parent, +            digest_clean, +            digest_all, +            types +          ) +          VALUES ( +            :lid, +            :metadata_tid, +            :ocn, +            :ocnd, +            :ocns, +            :clean, +            :body, +            :book_idx, +            :seg, +            :lev_an, +            :lev, +            :lev0, +            :lev1, +            :lev2, +            :lev3, +            :lev4, +            :lev5, +            :lev6, +            :lev7, +            :en_a, +            :en_z, +            :en_a_asterisk, +            :en_z_asterisk, +            :en_a_plus, +            :en_z_plus, +            :t_of, +            :t_is, +            :node, +            :parent, +            :digest_clean, +            :digest_all, +            :types +          ) +        "); +        return insert_doc_objects; +      } +    } +    template SQLiteObjectsLoop() { +      void SQLiteObjectsLoop(P)( +        auto ref P          doc_parts, +      ) { +        Statement insert_doc_objects = SQLiteInstruct!()(doc_matters); +        auto format_and_sqlite_load = SQLiteFormatAndLoadObject!()(doc_matters); +        string[string] obj_txt; +        string doc_text; +        foreach (part; doc_parts) { +          foreach (obj; doc_abstraction[part]) { +            switch (obj.of_part) { +            case "frontmatter":              assert(part == "head"); +              switch (obj.is_of) { +              case "para": +                switch (obj.is_a) { +                case "heading": +                  obj_txt = format_and_sqlite_load.heading(obj); +                  break; +                default: +                  if ((doc_matters.opt_action["debug"])) { +                    writeln(__FILE__, ":", __LINE__, ": ", obj.is_a); +                  } +                  break; +                } +                break; +              default: +                if ((doc_matters.opt_action["debug"])) { +                  writeln(__FILE__, ":", __LINE__, ": ", obj.is_of); +                } +                break; +              } +              break; +            case "body": //                    assert(part == "body"); // TODO broken +              switch (obj.is_of) { +              case "para": +                switch (obj.is_a) { +                case "heading": +                  debug (asserts) { // TODO consider and fix or remove +                    if (part != "body") { +                      writeln(__LINE__, ": ", obj.text); +                    } +                  } +                  obj_txt = format_and_sqlite_load.heading(obj); +                  break; +                case "para": +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                default: +                  if ((doc_matters.opt_action["debug"])) { +                    writeln(__FILE__, ":", __LINE__, ": ", obj.is_a); +                  } +                  break; +                } +                break; +              case "block": +                switch (obj.is_a) { +                case "quote": +                  obj_txt = format_and_sqlite_load.quote(obj); +                  break; +                case "group": +                  obj_txt = format_and_sqlite_load.group(obj); +                  break; +                case "block": +                  obj_txt = format_and_sqlite_load.block(obj); +                  break; +                case "poem":                        // double check on keeping both poem & verse +                  break; +                case "verse": +                  obj_txt = format_and_sqlite_load.verse(obj); +                  break; +                case "code": +                  obj_txt = format_and_sqlite_load.code(obj); +                  break; +                case "table": +                  obj_txt = format_and_sqlite_load.table(obj); +                  break; +                default: +                  if ((doc_matters.opt_action["debug"])) { +                    writeln(__FILE__, ":", __LINE__, ": ", obj.is_a); +                  } +                  break; +                } +                break; +              default: +                if ((doc_matters.opt_action["debug"])) { +                  writeln(__FILE__, ":", __LINE__, ": ", obj.is_of); +                } +                break; +              } +              break; +            case "backmatter": +              assert(part == "endnotes" || "glossary" || "bibliography" || "bookindex_scroll" || "blurb" || "tail"); +              switch (obj.is_of) { +              case "para": +                switch (obj.is_a) { +                case "heading": +                  obj_txt = format_and_sqlite_load.heading(obj); +                  break; +                case "endnote":              assert(part == "endnotes"); +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                case "glossary":             assert(part == "glossary"); +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                case "bibliography":         assert(part == "bibliography"); +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                case "bookindex":            assert(part == "bookindex_scroll"); +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                case "blurb":                assert(part == "blurb"); +                  obj_txt = format_and_sqlite_load.para(obj); +                  break; +                default: +                  if ((doc_matters.opt_action["debug"])) { +                    writeln(__FILE__, ":", __LINE__, ": ", obj.is_a); +                  } +                  break; +                } +                break; +              default: +                if ((doc_matters.opt_action["debug"])) { +                  writeln(__FILE__, ":", __LINE__, ": ", obj.is_of); +                } +                break; +              } +              break; +            case "comment": +              break; +            default: +              if ((doc_matters.opt_action["debug"])) { +                writeln(__FILE__, ":", __LINE__, ": ", obj.of_part); // check where empty value could come from +                writeln(__FILE__, ":", __LINE__, ": ", obj.is_a); +                writeln(__FILE__, ":", __LINE__, ": ", obj.text); // check where empty value could come from +              } +              break; +            } +            if (obj.is_a == "heading") { +              writeln( +                "markup: ", obj.heading_lev_markup, +                "> ", obj.dom_markedup, +                "; collapsed: ", obj.heading_lev_collapsed, +                "> ", obj.dom_collapsed, +                "; ocn: ", obj.ocn, +                " node: ", obj.node, +                "; parent: ", obj.parent_lev_markup, +                "; ocn: ", obj.parent_ocn, +                "; ", +              ); +            } +            insert_doc_objects.bind(":t_of",        obj.is_of); +            insert_doc_objects.bind(":t_is",        obj.is_a); +            insert_doc_objects.bind(":ocn",         obj.ocn); +            insert_doc_objects.bind(":clean",       obj_txt["text"]); // consider whether book index info should be made available within clear text for search +            insert_doc_objects.bind(":body",        obj_txt["html"]); +            // insert_doc_objects.bind(":book_idx",    ""); // not needed, but, consider whether should be made available within object for clear text search +            insert_doc_objects.bind(":lev",         obj.heading_lev_markup); +            // // insert_doc_objects.bind(":dom_markedup",    ""); // should make lev sequence below obsolete +            // // insert_doc_objects.bind(":dom_collapsed", ""); // should add info +            // insert_doc_objects.bind(":lev0",        ""); +            // insert_doc_objects.bind(":lev1",        ""); +            // insert_doc_objects.bind(":lev2",        ""); +            // insert_doc_objects.bind(":lev3",        ""); +            // insert_doc_objects.bind(":lev4",        ""); +            // insert_doc_objects.bind(":lev5",        ""); +            // insert_doc_objects.bind(":lev6",        ""); +            // insert_doc_objects.bind(":lev7",        ""); +            // insert_doc_objects.bind(":node",        ""); +            // insert_doc_objects.bind(":type",        ""); +            // insert_doc_objects.bind(":parent_ocn",                ""); +            // insert_doc_objects.bind(":ancestors",                 ""); +            // insert_doc_objects.bind(":heading_lev_markup",        ""); +            // insert_doc_objects.bind(":heading_lev_collapsed",     ""); +            // insert_doc_objects.bind(":parent_lev_markup",        ""); +            // insert_doc_objects.bind(":heading_ancestors",         ""); +            // insert_doc_objects.bind(":node",                      ""); +            insert_doc_objects.execute(); insert_doc_objects.reset(); +          } +        } +      } +    } +    SQLiteObjectsLoop!()(doc_matters.keys_seq.sql); +  } +} +template SQLiteDiscreteTablesCreate() { +  void SQLiteDiscreteTablesCreate()() { +    writeln("table create"); +  } +} +template SQLiteDiscreteTablesDrop() { +  void SQLiteDiscreteTablesDrop()() { +    writeln("table drop"); +  } +} diff --git a/src/sdp/sdp.d b/src/sdp/sdp.d index c3b307c..00afb54 100755 --- a/src/sdp/sdp.d +++ b/src/sdp/sdp.d @@ -77,7 +77,8 @@ void main(string[] args) {      "qrcode"             : false,      "sisupod"            : false,      "source"             : false, -    "sqlite"             : false, +    "sqlite-discrete"    : false, +    "sqlite-update"      : false,      "sqlite-create"      : false,      "sqlite-drop"        : false,      "text"               : false, @@ -116,9 +117,10 @@ void main(string[] args) {      "qrcode",             "--qrcode with document metadata",                            &opts["qrcode"],      "sisupod",            "--sisupod sisupod source content bundled",                   &opts["sisupod"],      "source",             "--source markup source text content",                        &opts["source"], +    "sqlite-discrete",    "--sqlite process discrete sqlite output",                    &opts["sqlite-discrete"],      "sqlite-create",      "--sqlite-create create db, create tables",                   &opts["sqlite-create"],      "sqlite-drop",        "--sqlite-drop drop tables & db",                             &opts["sqlite-drop"], -    "sqlite",             "--sqlite process sqlite output",                             &opts["sqlite"], +    "sqlite-update",      "--sqlite process sqlite output",                             &opts["sqlite-update"],      "text",               "--text process text output",                                 &opts["text"],      "txt",                "--txt process text output",                                  &opts["text"],      "verbose|v",          "--verbose output to terminal",                               &opts["verbose"], | 
