module dom_persist;

import std.file;
import std.array; //https://dlang.org/phobos/std_array.html
import std.conv;
import std.stdio;
import std.format;
import std.exception : enforce;
import std.traits;

import d2sqlite3; // https://d2sqlite3.dpldocs.info/v1.0.0/d2sqlite3.database.Database.this.html

version(unittest){
    //stuff only compiled for unittests
    string sqlite_filename = "dom_persist_test.db";
}

unittest {
    writeln( "Testing tree creation (old code)" );

    db_drop( sqlite_filename );
    assert( !db_exists( sqlite_filename ) );

    Database db = db_create( sqlite_filename, 1 );
    assert( db_exists( sqlite_filename ) );
    assert(db.tableColumnMetadata("params", "ID") == TableColumnMetadata("INTEGER", "BINARY", false, true, true));

    Tree_Db.db_create_schema( db );
    assert(db.tableColumnMetadata("doctree", "ID") == TableColumnMetadata("INTEGER", "BINARY", false, true, true));

    Tree_Db_Base tdb = new Tree_Db_Base( db );
    long tree_id = tdb.create_tree("mytree");

    long nid = tdb.appendChild( tree_id, tree_id, TreeNodeType.docType, "html" );
    long html_nid = tdb.appendChild( tree_id, tree_id, TreeNodeType.element, "html" );
    long head_id = tdb.appendChild( tree_id, html_nid, TreeNodeType.element, "head" );
    tdb.appendChild( tree_id, head_id, TreeNodeType.comment, "This is my comment" );
    long body_id = tdb.appendChild( tree_id, html_nid, TreeNodeType.element, "body" );
    tdb.appendChild( tree_id, body_id, TreeNodeType.text, "This is some text" );
    tdb.appendChild( tree_id, body_id, TreeNodeType.text, " with more text" );
    tdb.appendChildElement( tree_id, body_id, "input" );

    string html_out = tdb.getTreeAsText( tree_id );
    //writeln( html_out );
    assert( html_out == "<DOCTYPE html><html><head><!--This is my comment--></head><body>This is some text with more text<input/></body></html>");

    db.close();
}

unittest{
    auto db = Database( sqlite_filename );

    Tree_Db tree = Tree_Db.createTree( db, "mytree-new" );
    TreeNode* tree_node = tree.getTreeNode();
    NodeData nd = tree_node.node_data;
    assert( nd.pid == 0);
    assert( nd.e_data == "mytree-new");

    // flush the empty tree
    tree.flush();
}

unittest{
    writeln( "Testing DocOrderIterator" );

    auto db = Database( sqlite_filename );
    TreeNameID[] tree_list = Tree_Db.getTreeList( db );
    Tree_Db tree = Tree_Db.loadTree( db, tree_list[0].tree_id );
    TreeNode* tree_node = tree.getTreeNode();

    DocOrderIterator it = new DocOrderIterator( tree_node );
    int i=0;
    TreeNode* nxt;
    while( (nxt=it.nextNode) !is null ){
        switch(i){
        case 0:
            assert( (*nxt).node_data.type == TreeNodeType.tree );
            break;
        case 1:
            assert( (*nxt).node_data.type == TreeNodeType.docType );
            break;
        case 2,3,5,8:
            assert( (*nxt).node_data.type == TreeNodeType.element );
            break;
        case 4:
            assert( (*nxt).node_data.type == TreeNodeType.comment );
            break;
        case 6,7:
            assert( (*nxt).node_data.type == TreeNodeType.text );
            break;
        default:
            break;
        }
        i+=1;
    }
}

/**
 * Returns true when a file with the given name exists.
 */
bool db_exists( string sqlite_filename ){
    return sqlite_filename.exists;
}

/**
 * Deletes the database file if it exists; does nothing otherwise.
 */
void db_drop( string sqlite_filename ){
    if( sqlite_filename.exists ){
        sqlite_filename.remove();
    }
}

/**
 * Opens (creating if necessary) the database file, creates the "Params" table and
 * records db_ver under the name 'DB_VERSION'.
 *
 * Returns the open database handle.
 */
Database db_create( string sqlite_filename, int db_ver ){
    auto db = Database( sqlite_filename );
    db.run("CREATE TABLE \"Params\"(\"ID\" INTEGER, \"Name\" TEXT NOT NULL UNIQUE, \"Val\" TEXT, PRIMARY KEY(\"ID\" AUTOINCREMENT))");
    // The value is bound rather than spliced into the statement text.
    db.execute( "insert into params(Name, Val) values('DB_VERSION', ?)", to!string(db_ver) );
    return db;
}

enum TreeNodeType {
    nulltype=-2, // indicates a type read from the database which is not one of the recognised types
    tree=-1,
    docType,
    element,
    text,
    comment
}

/**
 * Maps an integer (as stored in the t_id column) to the matching TreeNodeType member,
 * or TreeNodeType.nulltype when the value matches no member.
 */
TreeNodeType getTreeNodeType( int tip ){
    foreach( tnt; EnumMembers!TreeNodeType ){
        if( tnt==tip ) return tnt;
    }
    return TreeNodeType.nulltype;
}

/**
 * This class provides direct database access to all trees in the database table. Every call
 * reads from or writes to the database immediately. See class Tree_Db for a RAM-cached view
 * of a single tree.
 *
 * Note: only the address of the Database passed to the constructor is stored, so that
 * variable must outlive this object.
 */
class Tree_Db_Base {

    protected:

    Database* db;

    // Number of nodes appended through this class in the current process. It is no longer
    // used for ordering (see appendChild) but is kept for any code that reads it.
    static long node_count = 0;

    public:

    this( ref Database db ){
        this.db = &db;
    }

    /**
     * Create a new tree in the tree table and return the ID of the tree node. Note that the tree node is
     * the parent of the root node, doctype and maybe other node data.
     *
     * The tree node is stored with a parent id of '0' (zero) since it has no parent.
     */
    long create_tree( string tree_name ){
        return appendChild( 0, 0, TreeNodeType.tree, tree_name);
    }

    /**
     * Read the DOM from this database for the given tree ID (tid) and return as
     * an html (or xml) string.
     *
     * Note that the tree node (TreeNodeType.tree) itself does not have a string representation;
     * only its descendants are rendered.
     */
    string getTreeAsText( long tid ){
        return getTreeAsText_r( tid );
    }

    /**
     * Recursively render all descendants of the node with the given ID.
     */
    string getTreeAsText_r( long tid ){
        string strRtn = "";
        foreach( child; getChildren( tid ) ){
            strRtn ~= get_openTag_commence( child.type, child.e_data );
            // --> add attributes if required
            strRtn ~= get_openTag_end( child.type, child.e_data );
            strRtn ~= getTreeAsText_r( child.ID );
            strRtn ~= get_closeTag( child.type, child.e_data );
        }
        return strRtn;
    }

    /**
     * Return the child nodes of the given parent_id, ordered by their c_order column
     * (ties broken by ID).
     */
    NodeData[] getChildren( long parent_id ){
        NodeData[] child_nodes;
        auto results = db.execute( "select ID, e_data, p_id, t_id from doctree where p_id=? order by c_order, ID", parent_id );
        foreach (row; results){
            child_nodes ~= NodeData( row.peek!long(0), row.peek!string(1), row.peek!long(2), getTreeNodeType( row.peek!int(3) ) );
        }
        return child_nodes;
    }

    /**
     * Return the node with the given ID.
     *
     * Throws: Exception if no such row exists.
     */
    NodeData getChild( long cid ){
        auto results = db.execute( "select ID, e_data, p_id, t_id from doctree where id=?", cid );
        foreach (row; results){
            return NodeData( row.peek!long(0), row.peek!string(1), row.peek!long(2), getTreeNodeType( row.peek!int(3) ) );
        }
        throw new Exception( format( "Child with ID(%d) not found", cid) );
    }

    /**
     * Append a new element to the given parent id (pid).
     *
     * Throws: Exception (via enforce) if elem_name is empty.
     */
    long appendChildElement( long tree_id, long pid, string elem_name ){
        enforce( elem_name.length>0 );
        return appendChild( tree_id, pid, TreeNodeType.element, elem_name );
    }

    /**
     * Append new text to the given parent id (pid).
     * Returns the ID of the text node if appended or -1 if text is empty.
     */
    long appendChildText( long tree_id, long pid, string text ){
        if( text.length==0 ) return -1;
        return appendChild( tree_id, pid, TreeNodeType.text, text );
    }

    /**
     * Append a new comment to the given parent id (pid).
     * Returns the ID of the comment node if appended or -1 if text is empty.
     */
    long appendChildComment( long tree_id, long pid, string text ){
        if( text.length==0 ) return -1;
        return appendChild( tree_id, pid, TreeNodeType.comment, text );
    }

    /**
     * Append a new node as the last child of the given parent pid.
     * node_data is stored in the e_data column; for docType nodes it is prefixed with "DOCTYPE ".
     *
     * The ID of the new node is returned.
     */
    long appendChild( long tree_id, long pid, TreeNodeType nt, string node_data = "" ){
        if( nt == TreeNodeType.docType ){
            //we might store the extra data as an attribute but this will suffice for the moment
            node_data = "DOCTYPE "~node_data;
        }

        // Place the node after its existing siblings. Deriving the position from the table
        // (rather than from an in-process counter) keeps the order correct across program runs.
        long next_order = db.execute( "select coalesce(max(c_order), -1) + 1 from doctree where p_id=?", pid ).oneValue!long;

        // Values are bound so that text containing quotes is stored verbatim.
        db.execute(
            "insert into doctree(e_data, p_id, t_id, tree_id, c_order ) values( ?, ?, ?, ?, ? )",
            node_data, pid, cast(int) nt, tree_id, next_order
        );
        node_count+=1;
        return db.lastInsertRowid;
    }

    /**
     * Close this object AND the underlying DB connection.
     */
    void close(){
        db.close();
        db=null;
    }

    // Placeholder: always returns -1.
    long getRootId(){
        return -1;
    }

}

// True for the element names that are rendered as a single self-closing tag.
private bool is_self_closing( string e_data ){
    return e_data == "input" || e_data == "br";
}

/**
 * Returns the first part of a node's opening text: the text itself for text nodes,
 * "<!--" plus the data for comments, and "<" plus the data for everything else.
 *
 * NOTE(review): docType nodes therefore render as "<DOCTYPE ...>" rather than "<!DOCTYPE ...>";
 * left as is because the existing tests depend on this output.
 */
string get_openTag_commence( TreeNodeType nt, string e_data ){
    switch( nt ){
    case TreeNodeType.text:
        return e_data;
    case TreeNodeType.comment:
        return "<!--"~e_data;
    default:
        return "<"~e_data;
    }
}

/**
 * Returns the text that terminates a node's opening tag: nothing for text and comments,
 * "/>" for self-closing elements and ">" otherwise.
 */
string get_openTag_end( TreeNodeType nt, string e_data ){
    switch( nt ){
    case TreeNodeType.comment:
    case TreeNodeType.text:
        return "";
    default:
        return is_self_closing( e_data ) ? "/>" : ">";
    }
}

/**
 * Returns the closing text of a node: nothing for docType, text and self-closing elements,
 * "-->" for comments and "</name>" otherwise.
 */
string get_closeTag( TreeNodeType nt, string e_data ){
    switch( nt ){
    case TreeNodeType.docType:
    case TreeNodeType.text:
        return "";
    case TreeNodeType.comment:
        return "-->";
    default:
        return is_self_closing( e_data ) ? "" : format("</%s>", e_data);
    }
}

/**
 * The persisted fields of one node. 'dirty' is true when e_data has been changed in RAM
 * and not yet written to the database.
 */
struct NodeData {
    long ID;
    string e_data;
    long pid;
    TreeNodeType type;
    bool dirty = false;

    this( long ID, string e_data, long pid, TreeNodeType type){
        this.ID = ID;
        this.e_data = e_data;
        this.pid = pid;
        this.type = type;
    }
}

struct TreeNameID {
    long tree_id;
    string name;
}

/**
 * A node of a RAM-cached tree owned by a Tree_Db instance.
 */
struct TreeNode {

    private:

    Tree_Db owner_tree;

    public:

    NodeData node_data;
    TreeNode*[] child_nodes;
    bool dirty; // true indicates a change in child_nodes

    this( Tree_Db owner_tree, NodeData node_data){
        this.owner_tree = owner_tree;
        this.node_data = node_data;
    }

    /**
     * Returns the parent node of this node or null if no parent exists (i.e. tree-root)
     */
    TreeNode* parentNode(){
        if(node_data.pid==0) return null;
        return owner_tree.getTreeNodeById( node_data.pid );
    }

    /**
     * Returns the next sibling of this node or null if none exists.
     *
     * Throws: Exception if this node is not found among its parent's children.
     */
    TreeNode* nextSibling(){
        if(node_data.pid==0) return null;

        TreeNode* p_node = owner_tree.getTreeNodeById( node_data.pid );
        foreach( i, c_node; p_node.child_nodes){
            if( c_node is &this ){
                return (i+1 < p_node.child_nodes.length) ? p_node.child_nodes[i+1] : null;
            }
        }
        throw new Exception("Damaged tree, possibly incorrect parent id for a child.");
    }

    bool hasChildNodes(){
        return child_nodes.length>0;
    }

    TreeNode* firstChild(){
        if( child_nodes.length==0 ) return null;
        return child_nodes[0];
    }

    /**
     * Set the data for this node.
     *
     * The data is interpreted using the type of node. For example, the text content of a text node is
     * the data whereas for element types, the data is used to hold the element name.
     */
    void setData( string nData ){
        node_data.e_data = nData;
        node_data.dirty = true;
    }

    /**
     * Insert a new child node at the position indicated.
     */
    void insertChild( TreeNodeType n_type, string e_data, int pos ){
        owner_tree.insertChild( &this, n_type, e_data, pos );
    }

}

/**
 * An instance of this class contains access to a single tree. Tree operations are cached in RAM and only written to
 * disk during a save operation (flush). This can be done safely because of the single user access to Sqlite.
 *
 * Multiple database connections should work on the same thread provided each is using a different tree.
 *
 * Instantiation of the tree involves only one database select.
 *
 * Notes:
 *  - Only the address of the Database is stored, so that variable must outlive this object.
 *  - Nodes live inside the all_nodes associative array and are handed out as pointers to its
 *    entries. flush() moves every node with a negative ID to a new entry, so pointers to such
 *    nodes obtained before flush() must be re-fetched afterwards (getTreeNode / getTreeNodeById).
 */
class Tree_Db {

    private:

    this( Database* db, long tid, string tree_name = null ){
        this.db = db;

        if(tid==0){
            //new tree: exists in RAM only and gets a temporary negative ID
            tree_id = getNextNodeId();
            all_nodes[ tree_id ] = TreeNode( this, NodeData( tree_id, tree_name, 0, TreeNodeType.tree) );
            return;
        }

        tree_id = tid;

        //load the tree in one hit using the tree_id
        //also order by the parent_id so that we know all siblings are grouped together
        //and then by child order
        auto results = db.execute(
            "select ID, e_data, p_id, t_id from doctree where tree_id=? or id=? order by p_id,c_order",
            tid, tid
        );

        // First pass: create every node. Linking happens afterwards so that it does not
        // depend on a parent row being read before its children.
        static struct Link { long id; long p_id; }
        Link[] links;
        foreach (row; results){
            long id = row.peek!long(0);
            long p_id = row.peek!long(2);
            all_nodes[id] = TreeNode( this, NodeData( id, row.peek!string(1), p_id, getTreeNodeType( row.peek!int(3) ) ));
            if(p_id!=0) links ~= Link( id, p_id );
        }
        enforce( (tid in all_nodes) !is null, format( "Tree with ID(%d) not found", tid ) );

        // Second pass: attach children in the order the rows were returned.
        foreach( link; links ){
            TreeNode* parent = link.p_id in all_nodes;
            enforce( parent !is null, format( "Node ID(%d) refers to missing parent ID(%d)", link.id, link.p_id ) );
            parent.child_nodes ~= link.id in all_nodes;
        }
    }

    // end private

    protected:

    long tree_id;
    Database* db;
    long nnid = 0;
    TreeNode[long] all_nodes;

    // Returns a fresh temporary (negative) node ID.
    long getNextNodeId(){
        nnid -= 1;
        return nnid;
    }

    // end protected

    public:

    static void db_create_schema( ref Database db ){
        db.run("CREATE TABLE IF NOT EXISTS doctree (ID INTEGER, e_data TEXT,p_id INTEGER,t_id INTEGER NOT NULL,tree_id INTEGER NOT NULL, c_order INTEGER, PRIMARY KEY( ID AUTOINCREMENT))");
    }

    /**
     * Return a list of all trees in the database with their ID's and names, ordered by ID.
     */
    static TreeNameID[] getTreeList( ref Database db ){
        TreeNameID[] tree_list;
        auto results = db.execute( "select ID, e_data from doctree where p_id=0 order by ID" );
        foreach (row; results){
            tree_list ~= TreeNameID( row.peek!long(0), row.peek!string(1) );
        }
        return tree_list;
    }

    /**
     * Create a new tree in RAM. No database activity takes place at this time.
     */
    static Tree_Db createTree( ref Database db, string tree_name ){
        return new Tree_Db( &db, 0, tree_name );
    }

    /**
     * Load a tree into RAM from database given the tree ID.
     *
     * Throws: Exception if the tree does not exist.
     */
    static Tree_Db loadTree( ref Database db, long tree_id ){
        return new Tree_Db( &db, tree_id );
    }

    /**
     * Returns the root node of this tree. This special node holds the tree name and ID and is not
     * usually part of the document but rather the parent container.
     */
    TreeNode* getTreeNode(){
        return getTreeNodeById( tree_id );
    }

    /**
     * Return any node given its ID.
     *
     * Note about IDs:
     *    positive IDs indicate that the record exists on the database and the ID is the database ID of that node.
     *    negative IDs indicate that the record is a new one existing in RAM only until such times as 'flush' is called.
     *
     * Throws: Exception if the tree holds no node with that ID.
     */
    TreeNode* getTreeNodeById( long id ){
        TreeNode* found = id in all_nodes;
        enforce( found !is null, format( "Node with ID(%d) not found in tree", id ) );
        return found;
    }

    /**
     * Return the tree as html text. This is the cached tree with all changes and not from the database.
     */
    string getTreeAsText( ){
        return getTreeAsText_r( *getTreeNode() );
    }

    /**
     * Insert a new child of parent node (p_node) at the position (pos) indicated.
     *
     * The node is added in RAM only, under a new negative ID, and the parent is marked dirty so
     * that flush() inserts the node and re-numbers the parent's children.
     *
     * Throws: Exception if p_node is null or pos is outside 0 .. number of children.
     */
    void insertChild( TreeNode* p_node, TreeNodeType n_type, string e_data, int pos ){
        enforce( p_node !is null, "insertChild: parent node is null" );
        enforce(
            pos >= 0 && pos <= p_node.child_nodes.length,
            format( "insertChild: position %d is outside 0..%d", pos, p_node.child_nodes.length )
        );

        long id = getNextNodeId();
        all_nodes[ id ] = TreeNode( this, NodeData( id, e_data, p_node.node_data.ID, n_type) );

        p_node.child_nodes.insertInPlace( pos, id in all_nodes );
        p_node.dirty = true;
    }

    /**
     * Save all edits to the tree to the database. After this call, the database values will be in sync
     * with the memory tree.
     *
     * Pointers to nodes that had a negative ID before this call are no longer current afterwards.
     */
    void flush(){

        // Nodes are written in document order so that a parent always has its database ID
        // before any of its children are written.
        DocOrderIterator it = new DocOrderIterator( getTreeNode() );
        TreeNode* tnode;
        while( (tnode=it.nextNode) !is null ){

            NodeData* nd = &tnode.node_data;

            if( nd.ID<0 ){
                // A negative ID marks a node that exists in RAM only.
                immutable long old_id = nd.ID;
                // Only the tree node of a brand new tree can still carry the tree's temporary ID;
                // it is stored with tree_id 0, the same as Tree_Db_Base.create_tree does.
                immutable bool is_root = (old_id == tree_id);

                db.execute(
                    "insert into doctree(e_data, p_id, t_id, tree_id ) values( ?, ?, ?, ? )",
                    nd.e_data, nd.pid, cast(int) nd.type, is_root ? 0L : tree_id
                );
                immutable long new_id = db.lastInsertRowid;

                nd.ID = new_id;
                nd.dirty = false; // e_data has just been written

                // Children refer to their parent by ID, so they must follow the ID change.
                foreach( child; tnode.child_nodes ){
                    child.node_data.pid = new_id;
                }

                // Re-key the node in the map. This copies it into a new map entry, so whoever
                // points at the old entry has to be redirected before the old entry is removed.
                all_nodes[new_id] = *tnode;
                TreeNode* moved = new_id in all_nodes;
                if( is_root ){
                    tree_id = new_id;
                }else{
                    foreach( ref slot; getTreeNodeById( nd.pid ).child_nodes ){
                        if( slot is tnode ){
                            slot = moved;
                            break;
                        }
                    }
                }
                all_nodes.remove(old_id);

            }else if( nd.dirty ){
                db.execute( "update doctree set e_data=? where id=?", nd.e_data, nd.ID );
                nd.dirty = false;
            }
        }

        //Re-enumerate any children that have shifted positions (or are new) according to their array positions.
        //A fresh iterator is used because the root may have moved to a new map entry above.
        it = new DocOrderIterator( getTreeNode() );
        while( (tnode=it.nextNode) !is null ){
            if( !tnode.dirty ) continue;
            foreach( i, cNode; tnode.child_nodes){
                db.execute( "update doctree set c_order=? where id=?", cast(long) i, cNode.node_data.ID );
            }
            tnode.dirty = false;
        }
    }

    protected:

    // Recursively render all descendants of tn from the RAM tree.
    string getTreeAsText_r( ref TreeNode tn ){
        string strRtn = "";
        foreach( child; tn.child_nodes ){
            NodeData nd = child.node_data;
            strRtn ~= get_openTag_commence( nd.type, nd.e_data );
            // --> add attributes if required
            strRtn ~= get_openTag_end( nd.type, nd.e_data );
            strRtn ~= getTreeAsText_r( *child );
            strRtn ~= get_closeTag( nd.type, nd.e_data );
        }
        return strRtn;
    }

}

/*
    Planned operations (not implemented yet)

    Delete node (branch)
        If the id<=-1, then it was a new node, unsaved, can be removed entirely
        Otherwise, move the node and all children into a delete-map.
        Mark the TreeNode parent as dirty indicating that children need removing. Re-ordering is not required but
        may be advantageous
        flush:
            Delete entries using the delete-map and clear the map.

    Move node
        Move the node and all children into new parent (same parent also works)
        Mark old parent TreeNode as dirty indicating a re-order is necessary, re-order ram children
        Mark new parent TreeNode as dirty indicating a re-order is necessary, re-order ram children
        update parent id of moved child
*/

unittest{
    writeln( "Testing tree loading" );

    auto db = Database( sqlite_filename );
    TreeNameID[] tree_list = Tree_Db.getTreeList( db );
    assert( tree_list.length==2 );

    Tree_Db tree = Tree_Db.loadTree( db, tree_list[0].tree_id );
    TreeNode* tree_node = tree.getTreeNode();
    NodeData nd_t = tree_node.node_data;
    assert( nd_t.ID == tree_list[0].tree_id );
    assert( nd_t.e_data == tree_list[0].name );
    assert( nd_t.pid == 0 );
    assert( nd_t.type == TreeNodeType.tree );

    TreeNode* html_node;
    int i=0;
    foreach( node_ptr; tree_node.child_nodes ){
        NodeData c_node = (*node_ptr).node_data;
        switch(i){
        case 0:
            assert( c_node.ID == 2 );
            assert( c_node.e_data == "DOCTYPE html" );
            assert( c_node.pid == tree_list[0].tree_id );
            assert( c_node.type == TreeNodeType.docType );
            break;
        case 1:
            html_node = node_ptr;
            assert( c_node.ID == 3 );
            assert( c_node.e_data == "html" );
            assert( c_node.pid == tree_list[0].tree_id );
            assert( c_node.type == TreeNodeType.element );
            break;
        default:
            break;
        }
        i+=1;
    }

    string html_out = tree.getTreeAsText( );
    assert( html_out == "<DOCTYPE html><html><head><!--This is my comment--></head><body>This is some text with more text<input/></body></html>");

    writeln( "Testing tree element insertion" );

    //get head element
    TreeNode* tn_head = html_node.child_nodes[0];

    //add an element to the head at position zero
    tn_head.insertChild( TreeNodeType.element, "script", 0 );
    html_out = tree.getTreeAsText( );
    assert( html_out == "<DOCTYPE html><html><head><script></script><!--This is my comment--></head><body>This is some text with more text<input/></body></html>");

    writeln( "Testing tree editing" );

    //edit the comment node (id=5)
    TreeNode* tn = tree.getTreeNodeById( 5 );
    tn.setData( "An edit took place");
    html_out = tree.getTreeAsText( );
    assert( html_out == "<DOCTYPE html><html><head><script></script><!--An edit took place--></head><body>This is some text with more text<input/></body></html>");

    //check that the database entry is unchanged
    auto results = db.execute( "select e_data from doctree where id=5" );
    foreach (row; results){
        assert( "This is my comment" == row.peek!string(0) );
    }

    // save to database
    tree.flush();

    //check db contents using a new tree
    Tree_Db tree2 = Tree_Db.loadTree( db, tree_list[0].tree_id );
    html_out = tree2.getTreeAsText( );
    assert( html_out == "<DOCTYPE html><html><head><script></script><!--An edit took place--></head><body>This is some text with more text<input/></body></html>");
}

/**
 * Iterator starting at any given TreeNode, traversing each of the descendent nodes, depth first and increasing child index.
 * Iteration never leaves the subtree of the start node.
 */
class DocOrderIterator {

    TreeNode* start_node;
    TreeNode* next_node;

    this( TreeNode* n ){
        start_node = n;
        next_node = n;
    }

    /**
     * Restart the iteration at the start node.
     */
    void reset(){
        next_node = start_node;
    }

    /**
     * Returns the next node in document order, or null when the subtree is exhausted.
     * The initial TreeNode is the first node to be returned.
     */
    TreeNode* nextNode(){

        //the node we will return this time
        TreeNode* rtnNode = next_node;
        if( rtnNode is null ) return null;

        //now work out the node for the next call

        if( rtnNode.hasChildNodes() ){
            next_node = rtnNode.firstChild();
            return rtnNode;
        }

        // No children: climb towards the start node looking for the first ancestor-or-self
        // that has a following sibling. The start node's own siblings are outside the
        // subtree, so the climb stops as soon as the start node is reached.
        TreeNode* cur = rtnNode;
        while( cur !is null && cur !is start_node ){
            TreeNode* sibling = cur.nextSibling();
            if( sibling !is null ){
                next_node = sibling;
                return rtnNode;
            }
            cur = cur.parentNode();
        }

        next_node = null;
        return rtnNode;
    }

}

unittest{
    writeln( "Testing quoting, nested flush and sub-tree iteration (in-memory database)" );

    auto mem = Database( ":memory:" );
    Tree_Db.db_create_schema( mem );

    // text containing a quote character is stored and read back verbatim
    Tree_Db_Base base = new Tree_Db_Base( mem );
    long tid = base.create_tree( "t" );
    long pid = base.appendChildElement( tid, tid, "p" );
    base.appendChildText( tid, pid, "it's fine" );
    assert( base.getTreeAsText( tid ) == "<p>it's fine</p>" );

    // a brand new tree with nested new nodes survives a flush/load round trip
    Tree_Db tree = Tree_Db.createTree( mem, "fresh" );
    TreeNode* root = tree.getTreeNode();
    root.insertChild( TreeNodeType.element, "html", 0 );
    root.insertChild( TreeNodeType.comment, "c", 1 );
    TreeNode* html = root.firstChild();
    html.insertChild( TreeNodeType.text, "a", 0 );
    html.insertChild( TreeNodeType.text, "b", 1 );

    // iterating from a leaf that has a following sibling yields that leaf only
    DocOrderIterator leaf_it = new DocOrderIterator( html.firstChild() );
    int seen = 0;
    while( leaf_it.nextNode() !is null ) seen += 1;
    assert( seen == 1 );

    tree.flush();
    assert( tree.getTreeAsText() == "<html>ab</html><!--c-->" );

    Tree_Db again = Tree_Db.loadTree( mem, tree.getTreeNode().node_data.ID );
    assert( again.getTreeAsText() == "<html>ab</html><!--c-->" );
}