<pre>//
//  File:   hzDocHtml.cpp
//
//  Legal Notice:   This file is part of the HadronZoo C++ Class Library. Copyright 2025 HadronZoo Project (http://www.hadronzoo.com)
//
//  The HadronZoo C++ Class Library is free software: You can redistribute it, and/or modify it under the terms of the GNU Lesser General Public License, as published by the Free
//  Software Foundation, either version 3 of the License, or any later version.
//
//  The HadronZoo C++ Class Library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
//  A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details.
//
//  You should have received a copy of the GNU Lesser General Public License along with the HadronZoo C++ Class Library. If not, see http://www.gnu.org/licenses.
//</pre>
			<pre>//
//  Management of HTML documents
//</pre>
			<pre>#include &lt;fstream&gt;</pre>
			<pre>#include &lt;sys/stat.h&gt;</pre>
			<pre>#include "hzChars.h"
#include "hzTextproc.h"
#include "hzDirectory.h"
#include "hzDocument.h"
#include "hzProcess.h"</pre>
			<pre>using namespace std ;</pre>
			<pre>/*
**  Variables
*/</pre>
			<pre>static  hzMapS&lt;hzString,hzHtagform&gt;     s_htagNam ;     //  Tag forms keyed by tag name. Populated by InitHtml(), with each name held exactly as registered there.
static  hzMapS&lt;hzHtagtype,hzHtagform&gt;   s_htagTyp ;     //  Tag forms keyed by tag type. Populated by InitHtml().</pre>
			<pre>static  hzHtagform  s_tagformDuff ;                     //  Null tag form. This (or its name) is what the lookup functions hand back when they reject their input.
static  uint32_t    s_htagPop ;                         //  This is set by InitHtml() to the population of s_htagNam. Non-zero indicates that the tags have been set up.</pre>
			<pre>/*
**  SECTION 1:  HTML Tag Types
*/</pre>
			<pre>hzEcode InitHtml    (void)
{
    //  Category:   Data Initialization
    //
    //  Populate the map of tag names to tag forms (s_htagNam) and the map of tag types to tag forms (s_htagTyp). See the hzHtagform definition. This facilitates
    //  HTML tag lookup for such purposes as the import and processing of HTML documents.
    //
    //  Each registration line below fills in the working tag form t (class, rule, type and name) and then inserts it into both maps. Names are inserted exactly
    //  as spelled here. "!DOCTYPE" and several SVG names are not all lower case, so a lookup that folds its search key to lower case will only match such an
    //  entry if it also tries the original spelling.
    //
    //  Some of the enumerators used below have irregular spellings (eg HATG_ITALIC, HATG_BR, HATG_TT, HTAB_BDO, HTAG_SVG_lINEARGRADIENT). Presumably these are
    //  as declared in the header, so they should not be corrected here in isolation.
    //
    //  On completion s_htagPop is set to the population of the name map. A later call finds s_htagPop non-zero and returns E_SETONCE without touching the maps.
    //
    //  Arguments:  None
    //
    //  Returns:    E_SETONCE   If the HTML maps are already populated
    //              E_OK        If the operation was successful</pre>
			<pre>    _hzfunc(__func__) ;</pre>
			<pre>    if (s_htagPop)
        return E_SETONCE ;</pre>
			<pre>    hzHtagform  t ;     //  Full tag info for insertion</pre>
			<pre>    //  Default (invalid). This entry has the null tag type and a null name.
    t.klas=HTCLASS_NUL; t.rule=HTRULE_NULL; t.type=HTAG_NULL;           t.name=(char*)0;            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Page structure tags
    //  NOTE(review): The HTML standard lists meta and base (and, further down, link, area, source, track and embed) as void elements, yet they are registered
    //  in this function as HTRULE_PAIRED. Confirm that this is what the consumers of the rule expect.
    t.klas=HTCLASS_HDR; t.rule=HTRULE_SINGLE; t.type=HTAG_DOCTYPE;      t.name="!DOCTYPE";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_HTML;         t.name="html";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_HEAD;         t.name="head";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_TITLE;        t.name="title";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_META;         t.name="meta";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_BODY;         t.name="body";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_BASE;         t.name="base";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_BASEFONT;     t.name="basefont";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_STYLE;        t.name="style";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Programming tags
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_SCRIPT;       t.name="script";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_NOFRAMES;     t.name="noframes";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_NOSCRIPT;     t.name="noscript";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_HDR; t.rule=HTRULE_PAIRED; t.type=HTAG_APPLET;       t.name="applet";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Frames
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_FRAME;        t.name="frame";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_FRAMESET;     t.name="frameset";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_IFRAME;       t.name="iframe";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_SINGLE; t.type=HTAG_PARAM;        t.name="param";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  System tags
    t.klas=HTCLASS_SYS; t.rule=HTRULE_PAIRED; t.type=HTAG_EMBED;        t.name="embed";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_SYS; t.rule=HTRULE_PAIRED; t.type=HTAG_NOEMBED;      t.name="noembed";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Font control or text tags - no content
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_BOLD;         t.name="b";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_ULINE;        t.name="u";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HATG_ITALIC;       t.name="i";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_EM;           t.name="em";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_STRONG;       t.name="strong";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_CENTER;       t.name="center";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_FONT;         t.name="font";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_BIG;          t.name="big";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_SMALL;        t.name="small";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_SINGLE; t.type=HATG_BR;           t.name="br";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_SINGLE; t.type=HTAG_HR;           t.name="hr";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Text description tags
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_HEADER;       t.name="header";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_FOOTER;       t.name="footer";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_SECTION;      t.name="section";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_ARTICLE;      t.name="article";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_ASIDE;        t.name="aside";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DETAILS;      t.name="details";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_SUMMARY;      t.name="summary";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DIALOG;       t.name="dialog";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Text grouping tags
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_STRIKE;       t.name="strike";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_S;            t.name="s";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_DEL;          t.name="del";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_INS;          t.name="ins";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_KBD;          t.name="kbd";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_TXT; t.rule=HTRULE_PAIRED; t.type=HTAG_SPAN;         t.name="span";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Text control tags
    t.klas=HTCLASS_DAT; t.rule=HTRULE_OPTION; t.type=HTAG_PARAG;        t.name="p";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_QUOTATION;    t.name="q";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H1;           t.name="h1";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H2;           t.name="h2";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H3;           t.name="h3";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H4;           t.name="h4";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H5;           t.name="h5";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_H6;           t.name="h6";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HATG_TT;           t.name="tt";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_CODE;         t.name="code";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_SAMP;         t.name="samp";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_CITE;         t.name="cite";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_CAPTION;      t.name="caption";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_VAR;          t.name="var";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_PRE;          t.name="pre";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_BQ;           t.name="bq";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_BLOCKQUOTE;   t.name="blockquote";        s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAB_BDO;          t.name="bdo";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_SUBSCRIPT;    t.name="sub";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_SUPERSCRIPT;  t.name="sup";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Data/layout tags
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TABLE;        t.name="table";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_OPTION; t.type=HTAG_TCOL;         t.name="col";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_OPTION; t.type=HTAG_TCOLGRP;      t.name="colgroup";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TH;           t.name="th";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TR;           t.name="tr";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TBL_CEL;      t.name="td";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DIV;          t.name="div";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TBODY;        t.name="tbody";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_THEAD;        t.name="thead";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TFOOT;        t.name="tfoot";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_FIELDSET;     t.name="fieldset";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_LEGEND;       t.name="legend";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_MENU;         t.name="menu";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DT;           t.name="dt";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DD;           t.name="dd";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DFN;          t.name="dfn";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DIR;          t.name="dir";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_DLIST;        t.name="dl";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_OLIST;        t.name="ol";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_ULIST;        t.name="ul";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_ITEM;         t.name="li";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_HGROUP;       t.name="hgroup";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_DAT; t.rule=HTRULE_PAIRED; t.type=HTAG_TIME;         t.name="time";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Link tags
    t.klas=HTCLASS_LNK; t.rule=HTRULE_PAIRED; t.type=HTAG_ANCHOR;       t.name="a";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_LNK; t.rule=HTRULE_PAIRED; t.type=HTAG_NAV;          t.name="nav";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_LNK; t.rule=HTRULE_PAIRED; t.type=HTAG_LINK;         t.name="link";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Input/form tags
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_FORM;         t.name="form";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_SINGLE; t.type=HTAG_INPUT;        t.name="input";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_TEXTAREA;     t.name="textarea";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_SELECT;       t.name="select";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_OPTGROUP;     t.name="optgroup";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_OPTION;       t.name="option";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_BUTTON;       t.name="button";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INP; t.rule=HTRULE_PAIRED; t.type=HTAG_LABEL;        t.name="label";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Information tags
    t.klas=HTCLASS_INF; t.rule=HTRULE_PAIRED; t.type=HTAG_ABBR;         t.name="abbr";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INF; t.rule=HTRULE_PAIRED; t.type=HTAG_ACRONYM;      t.name="acronym";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_INF; t.rule=HTRULE_PAIRED; t.type=HTAG_ADDRESS;      t.name="address";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Image tags
    t.klas=HTCLASS_IMG; t.rule=HTRULE_SINGLE; t.type=HTAG_IMG;          t.name="img";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_MAP;          t.name="map";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_AREA;         t.name="area";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_OBJECT;       t.name="object";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_MARQUEE;      t.name="marquee";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_CANVAS;       t.name="canvas";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_FIGURE;       t.name="figure";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_FIGCAPTION;   t.name="figcaption" ;       s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Image SVG tags. The class and rule are set once here and then carried over unchanged by every SVG registration, as t is reused from line to line.
    //  NOTE(review): The type registered with the name "feTile" below is HTAG_SVG_TITLE rather than a TILE spelling. Confirm this against the hzHtagtype enum.
    t.klas=HTCLASS_IMG;
    t.rule=HTRULE_PAIRED;
    t.type=HTAG_SVG;                   t.name="svg";                    s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_ANIMATE;           t.name="animate";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_ANIMATEMOTION;     t.name="animateMotion";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_ANIMATEXFORM;      t.name="animateTransform";       s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_CIRCLE;            t.name="circle";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_CLIPPATH;          t.name="clipPath";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DEFS;              t.name="defs";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DESC;              t.name="desc";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DISCARD;           t.name="discard";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_ELLIPSE;           t.name="ellipse";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_BLEND;             t.name="feBlend";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_COLORMATRIX;       t.name="feColorMatrix";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_COMPONENTXFER;     t.name="feComponentTransfer";    s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_COMPOSITE;         t.name="feComposite";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_CONVOLVEMATRIX;    t.name="feConvolveMatrix";       s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DIFFUSELIGHTING;   t.name="feDiffuseLighting";      s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DISPLACEMENTMAP;   t.name="feDisplacementMap";      s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DISTANTLIGHT;      t.name="feDistantLight";         s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DROPSHADOW;        t.name="feDropShadow";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FLOOD;             t.name="feFlood";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FUNC_A;            t.name="feFuncA";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FUNC_B;            t.name="feFuncB";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FUNC_G;            t.name="feFuncG";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FUNC_R;            t.name="feFuncR";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_DEGAUSS;           t.name="feGaussianBlur";         s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_IMAGE;             t.name="feImage";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MERGE;             t.name="feMerge";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MERGENODE;         t.name="feMergeNode";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MORPHOLOGY;        t.name="feMorphology";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_OFFSET;            t.name="feOffset";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_POINTLIGHT;        t.name="fePointLight";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_SPECLIGHT;         t.name="feSpecularLighting";     s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_SPOTLIGHT;         t.name="feSpotLight";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_TITLE;             t.name="feTile";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_TURBULENCE;        t.name="feTurbulence";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FILTER;            t.name="filter";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_FOREIGNOBJECT;     t.name="foreignObject";          s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_GENERIC;           t.name="g";                      s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_HATCH;             t.name="hatch";                  s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_HATCHPATH;         t.name="hatchpath";              s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_LINE;              t.name="line";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_lINEARGRADIENT;    t.name="linearGradient";         s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MARKER;            t.name="marker";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MASK;              t.name="mask";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_METADATA;          t.name="metadata";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_MPATH;             t.name="mpath";                  s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_PATH;              t.name="path";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_PATTERN;           t.name="pattern";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_POLYGON;           t.name="polygon";                s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_POLYLINE;          t.name="polyline";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_RADIALGRADIENT;    t.name="radialGradient";         s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_RECT;              t.name="rect";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_SET;               t.name="set";                    s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_STOP;              t.name="stop";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_SWITCH;            t.name="switch";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_SYMBOL;            t.name="symbol";                 s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_TEXT;              t.name="text";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_TEXTPATH;          t.name="textPath";               s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_TSPAN;             t.name="tspan";                  s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_USE;               t.name="use";                    s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.type=HTAG_SVG_VIEW;              t.name="view";                   s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Audio/Video Tags
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_AUDIO;        t.name="audio";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_SOURCE;       t.name="source";            s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_TRACK;        t.name="track";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);
    t.klas=HTCLASS_IMG; t.rule=HTRULE_PAIRED; t.type=HTAG_VIDEO;        t.name="video";             s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Third party tags
    t.klas=HTCLASS_3RD; t.rule=HTRULE_SINGLE; t.type=HTAG_FBLIKE;       t.name="fb:like";           s_htagTyp.Insert(t.type,t); s_htagNam.Insert(t.name,t);</pre>
			<pre>    //  Record the population of the name map. Being non-zero, this also marks the maps as set up.
    s_htagPop = s_htagNam.Count() ;
    return E_OK ;
}</pre>
			<pre>const char* Doctype2Txt (hzDoctype dtype)
{
    //  Category:   Diagnostics
    //
    //  Convert hzDoctype enum to text for diagnostics
    //
    //  Arguments:  1)  dtype   The enumerated document type (either HTML or XML)
    //
    //  Returns:    Pointer to the doctype text form. Any value outside the range 0 to DOCTYPE_XML inclusive, yields the text "DOCTYPE_UNDEFINED".</pre>
			<pre>    //  The table is indexed directly by the enum value. This assumes the hzDoctype values run 0, 1, 2 in the order listed here, as the layout of the table
    //  implies - TODO confirm against the enum declaration.
    static  const char* strings [] =
    {
        "DOCTYPE_UNDEFINED",
        "DOCTYPE_HTML",
        "DOCTYPE_XML",
        ""
    } ;</pre>
			<pre>    //  The upper bound is inclusive as DOCTYPE_XML is itself a valid index. The former test also rejected DOCTYPE_XML, so XML documents were reported
    //  as undefined and the "DOCTYPE_XML" entry could never be returned.
    if (dtype &lt; 0 || dtype &gt; DOCTYPE_XML)
        return strings[0] ;
    return strings[dtype] ;
}
    
hzString    Tagtype2Txt (hzHtagtype type)
{
    //  Category:   Diagnostics
    //
    //  Give the registered name of a HTML tag, given its enumerated tag type. The tag maps are set up first if the name map is found to be empty.
    //
    //  Arguments:  1)  type    The enumerated HTML tag type
    //
    //  Returns:    Instance of hzString by value. This is the name held in the type map for the tag type or, where the type is below HTAG_NULL or is not
    //              below the population of the type map, the name of the null tag form.</pre>
			<pre>    //  Make sure the tag maps are in place
    if (s_htagNam.Count() == 0)
        InitHtml() ;</pre>
			<pre>    //  Only a type from HTAG_NULL up to (but not including) the population of the type map is looked up
    if (type &gt;= HTAG_NULL &amp;&amp; (uint32_t) type &lt; s_htagTyp.Count())
        return s_htagTyp[type].name ;</pre>
			<pre>    //  Anything else is out of range
    return s_tagformDuff.name ;
}</pre>
			<pre>hzHtagtype  Txt2Tagtype (const hzString&amp; htag)
{
    //  Category:   Config
    //
    //  Convert a string representing a HTML tag name, into the HTML tag type.
    //
    //  The name is looked up in lower case first. If that yields the null tag type, the name is looked up again exactly as supplied. The second attempt is
    //  needed because InitHtml() registers some names in a form that is not all lower case ("!DOCTYPE" and SVG names such as "clipPath"), which a lower case
    //  search key can never match. Any name that was found by the lower case search alone, gives the same result as before.
    //
    //  Arguments:  1)  htag    A string presumed to be one of the allowed HTML5 tags
    //
    //  Returns:    Enumerated hzHtagtype. For an unknown name this is the type of whatever the name map yields on a miss (expected to be HTAG_NULL).</pre>
			<pre>    _hzfunc(__func__) ;</pre>
			<pre>    hzString    S ;         //  HTML tag search string (lower case)
    hzHtagtype  type ;      //  The tag type found</pre>
			<pre>    //  If tagmap not loaded, load it
    if (!s_htagPop)
        InitHtml() ;</pre>
			<pre>    S = htag ;
    S.ToLower() ;</pre>
			<pre>    //  Only the type is wanted so there is no need to copy the whole tag form
    type = s_htagNam[S].type ;</pre>
			<pre>    //  Nothing under the lower case key, so try the name as the caller spelled it
    if (type == HTAG_NULL)
        type = s_htagNam[htag].type ;</pre>
			<pre>    return type ;
}</pre>
			<pre>const hzHtagform&amp;   TagLookup   (const hzString&amp; htag)
{
    //  Category:   Internet
    //
    //  Find the hzHtagform (tag function class) registered under the supplied tag name. The name is used as the search key exactly as given, without any case
    //  folding. The tag maps are set up first if the name map is found to be empty.
    //
    //  Arguments:  1)  htag    The tag name to search on
    //
    //  Returns:    Reference to whatever the name map yields for the tag name</pre>
			<pre>    //  Make sure the tag maps are in place
    if (s_htagNam.Count() == 0)
        InitHtml() ;</pre>
			<pre>    const hzHtagform&amp;   form = s_htagNam[htag] ;
    return form ;
}</pre>
			<pre>const hzHtagform&amp;   TagLookup   (chIter&amp; ci)
{
    //  Category:   Internet
    //
    //  Determine if the supplied chain iterator, is at the start of a legal HTML tag or anti-tag. The supplied iterator is not advanced as all scanning is done
    //  with a copy of it.
    //
    //  The tag name is taken to be everything after the opening angle bracket (and the forward slash of an anti-tag, if present), up to the first space, tab,
    //  newline, carriage return, forward slash, closing angle bracket or NUL. The name is looked up in lower case first. If that yields the null tag type, it is
    //  looked up again exactly as it appears in the chain, because InitHtml() registers some names in a form that is not all lower case ("!DOCTYPE" and SVG
    //  names such as "clipPath").
    //
    //  Arguments:  1)  ci  A chain iterator to be tested to see if it is at the beginning of an allowed HTML5 tag
    //
    //  Returns:    Reference to the tag form for the tag. This is the null tag form if the iterator is not at an opening angle bracket, otherwise it is whatever
    //              the name map yields for the name found.</pre>
			<pre>    hzChain     W ;         //  Working chain, for building the tag name
    chIter      xi ;        //  Internal chain iterator
    hzString    word ;      //  The tag name in lower case
    hzString    exact ;     //  The tag name as spelled in the chain</pre>
			<pre>    //  If tagmap not loaded, load it
    if (!s_htagNam.Count())
        InitHtml() ;</pre>
			<pre>    xi = ci ;
    if (*xi != CHAR_LESS)
        return s_tagformDuff ;
    xi++ ;
    if (*xi == CHAR_FWSLASH)
        xi++ ;</pre>
			<pre>    for (;;)
    {
        //  Stop at the end of the chain. Without this an unterminated tag at the end of the input would keep the loop running for ever. This assumes the
        //  iterator yields NUL once it is past the last byte of the chain - TODO confirm.
        if (!*xi)               break ;</pre>
			<pre>        //  Whitespace of any sort ends the name, not just a space
        if (*xi == CHAR_SPACE)  break ;
        if (*xi == '\t')        break ;
        if (*xi == '\r')        break ;
        if (*xi == '\n')        break ;</pre>
			<pre>        //  A forward slash here is that of a self closing tag (eg &lt;br/&gt;) and is not part of the name
        if (*xi == CHAR_FWSLASH)    break ;
        if (*xi == CHAR_MORE)       break ;</pre>
			<pre>        W.AddByte(*xi) ;
        xi++ ;
    }</pre>
			<pre>    //  Lower case search first, as most names are registered in lower case
    word = W ;
    word.ToLower() ;</pre>
			<pre>    const hzHtagform&amp;   tf = s_htagNam[word] ;
    if (tf.type != HTAG_NULL)
        return tf ;</pre>
			<pre>    //  Fall back to the name as spelled in the chain. This string is built afresh from the working chain so it cannot be affected by the lower casing above.
    exact = W ;
    return s_htagNam[exact] ;
}</pre>
			<pre>/*
**  Tag cleanup
*/</pre>
			<pre>hzHtagInd   AtHtmlTag   (hzString&amp; tagseq, chIter&amp; ci)
{
    //  Category:   Text Processing
    //
    //  Determines if the supplied chain iterator marks the start of a sequence that amounts to a legal HTML tag or anti-tag. If it does not, HTAG_IND_NULL is
    //  returned and the supplied string will be empty. If the sequence has the right form, a case-insensitive lookup is performed to test the name part against
    //  the known HTML tags. If this finds a match and the sequence is closed by a '&gt;', the supplied string is populated with the whole sequence (including the
    //  opening and closing angle brackets). The supplied iterator is never advanced.
    //
    //  The name must begin with a letter and may continue with letters and digits, so that names such as h1 to h6 are read in full before the lookup.
    //
    //  Arguments:  1)  tagseq  If a tag is found, this string reference will be populated by it.
    //              2)  ci      The test chain iterator
    //
    //  Returns:    HTAG_IND_NULL   If the sequence is not a known HTML tag or anti-tag.
    //              HTAG_IND_OPEN   If the sequence is a HTML tag.
    //              HTAG_IND_ANTI   If the sequence is a HTML anti-tag.
    //              HTAG_IND_SELF   If the sequence is closed by a forward slash and '&gt;' (eg &lt;br/&gt;).</pre>
			<pre>    _hzfunc(__func__) ;</pre>
			<pre>    hzChain     W ;             //  For building tagname, then the whole sequence
    chIter      zi ;            //  Used to iterate whole tag sequence.
    hzHtagform  tf ;            //  The tag form for the found tag (if any).
    hzString    tagname ;       //  The tag name
    hzHtagInd   retval ;        //  Return value</pre>
			<pre>    //  If tagmap not loaded, load it
    if (!s_htagNam.Count())
        InitHtml() ;</pre>
			<pre>    //  Clear the supplied tag and set chain iter
    tagseq.Clear() ;
    zi = ci ;</pre>
			<pre>    if (*zi != CHAR_LESS)
        return HTAG_IND_NULL ;</pre>
			<pre>    zi++ ;
    if (*zi == CHAR_FWSLASH)
        { retval = HTAG_IND_ANTI ; zi++ ; }
    else
        retval = HTAG_IND_OPEN ;</pre>
			<pre>    //  Read the name: a letter first, then any run of letters and digits
    if (!IsAlpha(*zi))
        return HTAG_IND_NULL ;
    for (; !zi.eof() &amp;&amp; IsAlphanum(*zi) ; zi++)
        W.AddByte(*zi) ;</pre>
			<pre>    tagname = W ;
    W.Clear() ;
    tagname.ToLower() ;
    tf = s_htagNam[tagname] ;
    if (tf.type == HTAG_NULL)
        return HTAG_IND_NULL ;</pre>
			<pre>    //  We have a HTML tag so build the complete tag for populating tagseq
    for (zi = ci ; !zi.eof() ; zi++)
    {
        W.AddByte(*zi) ;</pre>
			<pre>        //  Copy a double quoted value whole, so that a '&gt;' inside it does not end the tag
        if (*zi == CHAR_DQUOTE)
        {
            for (zi++ ; !zi.eof() ; zi++)
            {
                W.AddByte(*zi) ;</pre>
			<pre>                //  The byte after a backslash is copied here but is still tested below, so a quote that follows a backslash does end the value
                if (*zi == CHAR_BKSLASH)
                    { zi++ ; W.AddByte(*zi) ; }</pre>
			<pre>                if (*zi == CHAR_DQUOTE)
                    break ;
            }
            continue ;
        }</pre>
			<pre>        if (*zi == CHAR_FWSLASH)
        {
            if (zi == "/&gt;")
                { retval = HTAG_IND_SELF ; zi++ ; W.AddByte(*zi) ; }
        }</pre>
			<pre>        if (*zi == CHAR_MORE)
            break ;
    }</pre>
			<pre>    //  No closing '&gt;' was found before the data ran out
    if (*zi != CHAR_MORE)
        return HTAG_IND_NULL ;</pre>
			<pre>    tagseq = W ;
    return retval ;
}</pre>
			<pre>void    XmlCleanHtags   (hzChain&amp; output, const hzChain&amp; input)
{
    //  Category:   Text Processing
    //
    //  Append the input to the output with every &lt; replaced by &amp;lt; and every &gt; replaced by &amp;gt;. An &amp; is replaced by &amp;amp; unless AtEntity() reports
    //  that it begins an entity, in which case it is copied as it is. All other bytes are copied unchanged. The output chain is appended to, it is not cleared first.
    //
    //  Arguments:  1)  output  The cleaned output
    //              2)  input   The unclean input
    //
    //  Returns:    None</pre>
			<pre>    chIter      zi ;        //  Chain iterator
    uint32_t    ent ;       //  Entity value (needed by call to AtEntity)
    uint32_t    entLen ;    //  Entity length (needed by call to AtEntity)</pre>
			<pre>    for (zi = input ; !zi.eof() ; zi++)
    {
        if (*zi == CHAR_LESS)
            output &lt;&lt; "&amp;lt;" ;
        else if (*zi == CHAR_MORE)
            output &lt;&lt; "&amp;gt;" ;
        else if (*zi == CHAR_AMPSAND)
        {
            //  Only the ampersand is handled here. If it starts an entity, the rest of the entity is copied by later passes of this loop.
            if (AtEntity(ent, entLen, zi))
                output.AddByte(*zi) ;
            else
                output &lt;&lt; "&amp;amp;" ;
        }
        else
            output.AddByte(*zi) ;
    }
}</pre>
			<pre>hzEcode hzDocument::Init    (const hzUrl&amp; url)
{
    //  Associate the document with a URL. This can only be done once: if a request URL is already held, the call is reported as a duplicate and the held URL
    //  is left as it is.
    //
    //  Arguments:  1)  url     The URL of the document
    //
    //  Returns:    E_INITDUP   If the document is already associated with a URL
    //              E_OK        If the document URL is set</pre>
			<pre>    _hzfunc("hzDocument::Init") ;</pre>
			<pre>    //  No URL held as yet, so accept the one supplied
    if (!*m_Info.m_urlReq)
    {
        m_Info.m_urlReq = url ;
        return E_OK ;
    }</pre>
			<pre>    //  Already initialized. The error report distinguishes a repeat of the same URL from an attempt to change it
    if (m_Info.m_urlReq == url)
        hzerr(E_INITDUP, "Duplicate call. Address already set to &#37;s\n", *m_Info.m_urlReq) ;
    else
        hzerr(E_INITDUP, "Duplicate call. Addr=&#37;s, arg=&#37;s\n", *m_Info.m_urlReq, *url) ;</pre>
			<pre>    return E_INITDUP ;
}</pre>
			<pre>hzDocHtml::hzDocHtml   (void)
{
    //  Construct a HTML document with no root, head or body element, and add one to the _hzGlobal_Memstats.m_numDochtm counter.</pre>
			<pre>    _hzGlobal_Memstats.m_numDochtm++ ;</pre>
			<pre>    m_pBody = 0 ;
    m_pHead = 0 ;
    m_pRoot = 0 ;
}</pre>
			<pre>hzDocHtml::~hzDocHtml  (void)
{
    //  Destructor. Takes one off the _hzGlobal_Memstats.m_numDochtm counter (the constructor adds one) and then calls Clear().
    _hzGlobal_Memstats.m_numDochtm-- ;
    Clear() ;
}</pre>
			<pre>hzHtmElem*  hzDocHtml::_proctag (hzHtmElem* pParent, chIter&amp; ci, hzHtagtype type)
{
    //  Parse the opening tag at the supplied iterator into a new HTML element. The iterator must be on the '&lt;' of a tag whose name begins with a letter. The name
    //  (letters, digits and colons) is read, a new element of the supplied type is created and added to m_vecTags, and the attributes are then collected into
    //  m_NodeAttrs under the uid of the new element. The href values of link and anchor tags are also recorded, as an email address if they begin with mailto:
    //  or as a link otherwise. A href value that begins with '#' is not recorded at all.
    //
    //  If successful, the iterator is advanced beyond the terminating '&gt;' and any whitespace that follows it. If unsuccessful, the iterator is left unchanged.
    //
    //  Arguments:  1)  pParent The parent node (may be null)
    //              2)  ci      The iterator.
    //              3)  type    The tag type given to the new element. A hzHtmTbl is created for HTAG_TABLE and a hzHtmElem for all other types.
    //
    //  Returns:    Pointer to a new hzHtmElem if the operation was successful
    //              NULL if function could not identify a tag
    //
    //  Note:       Where a failure is detected after the element has been created, NULL is returned but the element remains in m_vecTags.
    //
    //  Scope:      Private to the hzDocHtml class.</pre>
			<pre>    _hzfunc("hzDocHtml::_proctag") ;</pre>
			<pre>    hzChain         theTag ;        //  The tag name as read from the input
    hzChain         Z ;             //  For building param names and values
    chIter          end ;           //  End of tag marker
    chIter          xi ;            //  Main operating chain iterator
    hzHtmElem*      pX ;            //  Parent of the supplied parent
    hzHtmElem*      pNewnode ;      //  Tag found (new copy created)
    hzUrl           link_url ;      //  URL for links
    hzPair          attr ;          //  Attribute name/value pair
    hzString        tnam ;          //  Tag name
    hzString        attrName ;      //  Attr name
    hzString        attrValue ;     //  Attr value
    hzString        S ;             //  Temporary string
    uint32_t        nLine ;         //  Line number of tag
    hzHtagtype      ptype ;         //  Parent tag's type</pre>
			<pre>    bool    bError = false ;        //  NOTE(review): never set in this function, so the warning guarded by it below cannot be issued</pre>
			<pre>    //  Check validity of call
    if (ci.eof())
        { threadLog("Invalid iterator\n") ; return 0 ; }</pre>
			<pre>    nLine = ci.Line() ;</pre>
			<pre>    if (*ci != '&lt;')
        { threadLog("Line &#37;d Wrong call\n", nLine) ; return 0 ; }</pre>
			<pre>    //  Pre-process the tag and get tag name
    xi = ci ;
    xi++ ;</pre>
			<pre>    if (!IsAlpha(*xi))
        { threadLog("Line &#37;d Non-tag (&lt; followed by non-alpha &#37;d)\n", nLine, *xi) ; return 0 ; }</pre>
			<pre>    for (; !xi.eof() &amp;&amp; (*xi == CHAR_COLON || IsAlphanum(*xi)) ; xi++)
        theTag.AddByte(*xi) ;</pre>
			<pre>    if (!theTag.Size())
        { threadLog("Line &#37;d Tag un-named\n", nLine) ; return 0 ; }
    tnam = theTag ;</pre>
			<pre>    //  Create the element for the tag and register it with the document. The name is not validated here, the caller supplies the type.
    if (type == HTAG_TABLE)
        pNewnode = new hzHtmTbl() ;
    else
        pNewnode = new hzHtmElem() ;
    pNewnode-&gt;Init(this, pParent, tnam, type, m_vecTags.Count(), ci.Line()) ;
    m_vecTags.Add(pNewnode) ;</pre>
			<pre>    //  Collect tag attributes if any
    for (; !xi.eof() ;)
    {
        if (IsWhite(*xi))
            { xi++ ; continue ; }</pre>
			<pre>        //  A forward slash directly before the '&gt;' marks the element as closed by its own tag
        if (*xi == CHAR_FWSLASH)
        {
            if (xi == "/&gt;")
                { pNewnode-&gt;_setanti(xi.Line()) ; xi++ ; end = xi ; break ; }
        }</pre>
			<pre>        if (*xi == CHAR_MORE)
            { end = xi ; break ; }</pre>
			<pre>        //  Not at end of tag, so should have attr=value sequence (otherwise error)
        if (!IsAlpha(*xi))
            { threadLog("Line &#37;d Error. Unexpected char is [&#37;c]\n", nLine, *xi) ; xi++ ; continue ; }</pre>
			<pre>        Z.Clear() ;
        for (; !xi.eof() &amp;&amp; (IsUrlnorm(*xi) || *xi == CHAR_COLON || *xi == CHAR_PERIOD || *xi == CHAR_MINUS || *xi == CHAR_USCORE) ; xi++)
            Z.AddByte(*xi) ;
        attrName = Z ;</pre>
			<pre>        Z.Clear() ;
        attrValue = (char*)0 ;</pre>
			<pre>        for (; !xi.eof() &amp;&amp; IsWhite(*xi) ; xi++) ;</pre>
			<pre>        if (*xi != CHAR_EQUAL)
        {
            //  Tag attribute does not have a value assignment part (="some_val"). This is treated as an error that disqualifies the tag, except within the
            //  iframe and time tags (eg 'allowfullscreen' in an iframe) where the attribute name is used as its own value.</pre>
			<pre>            if (pNewnode-&gt;Type() == HTAG_IFRAME || pNewnode-&gt;Type() == HTAG_TIME)
            {
                attrValue = attrName ;
                attr.name = attrName ;
                attr.value = attrValue ;</pre>
			<pre>                m_NodeAttrs.Insert(pNewnode-&gt;GetUid(), attr) ;
                continue ;
            }</pre>
			<pre>            threadLog("Line &#37;d Tag &#37;s param &#37;s not assigned\n", nLine, *tnam, *attrName) ;
            return 0 ;
        }</pre>
			<pre>        //  Get attribute value
        for (xi++ ; !xi.eof() &amp;&amp; IsWhite(*xi) ; xi++) ;</pre>
			<pre>        Z.Clear() ;
        if (*xi == CHAR_DQUOTE)
        {
            for (xi++ ; !xi.eof() &amp;&amp; *xi != CHAR_DQUOTE ; xi++)
                Z.AddByte(*xi) ;
            if (xi.eof())
                { threadLog("Line &#37;d Double-quote non-closure disqualifies tag\n", nLine) ; return 0 ; }
            xi++ ;
        }
        else if (*xi == CHAR_SQUOTE)
        {
            for (xi++ ; !xi.eof() &amp;&amp; *xi != CHAR_SQUOTE ; xi++)
                Z.AddByte(*xi) ;
            if (xi.eof())
                { threadLog("Line &#37;d Single-quote non-closure disqualifies tag\n", nLine) ; return 0 ; }
            xi++ ;
        }
        else
        {
            //  Unquoted value
            for (; !xi.eof() &amp;&amp; IsUrlresv(*xi) ; xi++)
                Z.AddByte(*xi) ;
        }
        attrValue = Z ;</pre>
			<pre>        //  If the tag is a link/anchor and attr is named 'href' then add link to the list of links found in the page
        if ((pNewnode-&gt;Type() == HTAG_LINK || pNewnode-&gt;Type() == HTAG_ANCHOR) &amp;&amp; attrName.Equiv("href"))
        {
            if (!attrValue)
            {
                S = theTag ;
                threadLog("Line &#37;d null link in tag &#37;s\n", nLine, *S) ;
            }
            else
            {
                if (attrValue[0] != CHAR_HASH)
                {
                    //  Is the link a mailto ? strncmp is used as it stops at the end of a value that is shorter than the prefix, where memcmp would
                    //  read beyond it.
                    if (strncmp(*attrValue, "mailto:", 7) == 0)
                    {
                        S = *attrValue + 7 ;
                        m_Emails.Insert(S) ;
                    }
                    else
                    {
                        //  Add the link. The URL is formed from the base or the document domain where these are available.</pre>
			<pre>                        if (m_Base &amp;&amp; attrValue[0] == CHAR_FWSLASH)
                        {
                            link_url.SetValue(m_Base, attrValue) ;
                            if (!link_url)
                                threadLog("not a link case 1: &#37;s\n", *attrValue) ;
                        }
                        else if (m_Info.Domain())
                        {
                            link_url.SetValue(m_Info.Domain(), attrValue) ;
                            if (!link_url)
                                threadLog("not a link case 2: &#37;s\n", *attrValue) ;
                        }
                        else
                        {
                            link_url = attrValue ;
                            if (!link_url)
                                threadLog("not a link case 3: &#37;s\n", *attrValue) ;
                        }</pre>
			<pre>                        if (!link_url.Domain())
                            threadLog("not a link case 4: &#37;s\n", *link_url) ;</pre>
			<pre>                        //  Only a href that produced a usable URL is kept as an attribute of the element
                        if (link_url)
                        {
                            S = *link_url ;</pre>
			<pre>                            attr.name = attrName ;
                            attr.value = attrValue ;
                            m_NodeAttrs.Insert(pNewnode-&gt;GetUid(), attr) ;</pre>
			<pre>                            if (!m_setLinks.Exists(link_url))
                            {
                                m_setLinks.Insert(link_url) ;
                                m_vecLinks.Add(link_url) ;
                            }
                        }
                    }
                }
            }
        }
        else
        {
            attr.name = attrName ;
            attr.value = attrValue ;
            m_NodeAttrs.Insert(pNewnode-&gt;GetUid(), attr) ;
        }
    }</pre>
			<pre>    if (xi.eof())
        { threadLog("Line &#37;d A. non-closure disqualifies tag\n", nLine) ; return 0 ; }</pre>
			<pre>    if (*xi != CHAR_MORE)
        { S = theTag ; threadLog("Line &#37;d C. malformed tag &lt;&#37;s&gt; pnam=&#37;s, attrValue=&#37;s [&#37;c]\n", nLine, *S, *attrName, *attrValue, *xi) ; return 0 ; }</pre>
			<pre>    //  Step over the '&gt;' and any whitespace after it
    for (xi++ ; !xi.eof() &amp;&amp; IsWhite(*xi) ; xi++) ;
    end = xi ;</pre>
			<pre>    //  Check for correct parentage
    if (pParent)
    {
        //  Some tag-type rules</pre>
			<pre>        ptype = pParent-&gt;Type() ;</pre>
			<pre>        if (type == HTAG_TBL_CEL)
        {
            if (ptype == HTAG_TBL_CEL)
            {
                //  This is where the author has forgotten to close a &lt;td&gt; and is now adding the next &lt;td&gt; in the row. We
                //  seek back to the &lt;tr&gt; (the true parent).</pre>
			<pre>                threadLog("WARNING: Missing &lt;/td&gt; anti-tag\n") ;</pre>
			<pre>                pX = pParent-&gt;Parent() ;
                if (pX)
                {
                    //  NOTE(review): this test is true for every value of ptype. Also pParent is not read again after this point (the new element was
                    //  initialized with the original parent above), so the reassignment has no effect. Intended behaviour to be confirmed.
                    ptype = pX-&gt;Type() ;
                    if (ptype != HTAG_TH || ptype != HTAG_TR)
                        pParent = pX ;
                }
            }
        }</pre>
			<pre>        if (bError)
            threadLog("WARNING: New &lt;&#37;s&gt; tag has parent of &lt;&#37;s&gt;\n", *Tagtype2Txt(type), *Tagtype2Txt(ptype)) ;
    }</pre>
			<pre>    ci = end ;
    return pNewnode ;
}</pre>
			<pre>hzEcode hzDocHtml::_htmPreproc  (hzChain&amp; Z)
{
    //  Remove comments and non applicable conditional comments from HTML. The supplied chain is scanned once and the text to be kept is built up in a second
    //  chain, which replaces the content of the supplied chain if the two differ in size. The rules applied are:-
    //
    //      1)  The sequence &lt;!--&gt; is dropped.
    //      2)  A conditional comment (opened by &lt;!--[if or &lt;![if) whose condition begins with !IE has its markers dropped and its content kept.
    //      3)  A conditional comment whose condition (after an optional "!(") begins with lte IE, lt IE, gte IE, gt IE or IE is dropped with its content.
    //      4)  Any other conditional comment has its markers dropped and its content kept.
    //      5)  A normal comment (&lt;!-- to --&gt;) is dropped with its content.
    //
    //  Arguments:  1)  Z   Reference to chain to be pre-processed
    //
    //  Returns:    E_FORMAT    If the opening of a kept conditional comment has no closing '&gt;', or if a normal comment is not closed
    //              E_OK        If the HTML was successfully processed</pre>
			<pre>    _hzfunc("hzDocHtml::_htmPreproc") ;</pre>
			<pre>    chIter      zi ;        //  Iterator of input
    hzChain     X ;         //  Target chain
    uint32_t    nStart ;    //  Line on which a normal comment starts
    bool        bIn ;       //  In a conditional comment
    bool        bClosed ;   //  Terminator of a normal comment was found</pre>
			<pre>    if (Z.Size() == 0)
        return E_OK ;</pre>
			<pre>    for (zi = Z ; !zi.eof() ;)
    {
        //  Anything that does not begin with a '&lt;' is kept as it is
        if (*zi != CHAR_LESS)
            { X.AddByte(*zi) ; zi++ ; continue ; }</pre>
			<pre>        if (zi == "&lt;!--&gt;")
            { zi += 5 ; continue ; }</pre>
			<pre>        //  Test for the opening of a conditional comment
        bIn = false ;</pre>
			<pre>        if (zi == "&lt;!--[if")
            { bIn = true ; zi += 7 ; }
        if (zi == "&lt;![if")
            { bIn = true ; zi += 5 ; }</pre>
			<pre>        if (bIn)
        {
            for (; !zi.eof() &amp;&amp; *zi &lt;= CHAR_SPACE ;)
                zi++ ;</pre>
			<pre>            if (zi == "!IE")
            {
                //  Specific non-IE comment. Content herein must be allowed through.</pre>
			<pre>                for (zi += 2 ; !zi.eof() &amp;&amp; *zi != CHAR_MORE ; zi++) ;
                if (zi.eof())
                {
                    threadLog("Unterminated conditional comment (line &#37;d)\n", zi.Line()) ;
                    return E_FORMAT ;
                }</pre>
			<pre>                zi++ ;
                if (zi == "--&gt;")
                    zi += 3 ;</pre>
			<pre>                //  Keep the content up to whichever form of the endif marker closes it
                for (; !zi.eof() ; zi++)
                {
                    if (*zi == CHAR_LESS)
                    {
                        if (zi == "&lt;![endif]&gt;")         { zi += 10 ; break ; }
                        if (zi == "&lt;![endif]--&gt;")       { zi += 12 ; break ; }
                        if (zi == "&lt;![endif]&gt;--&gt;")      { zi += 13 ; break ; }
                        if (zi == "&lt;!--&lt;![endif]--&gt;")   { zi += 16 ; break ; }
                    }</pre>
			<pre>                    X.AddByte(*zi) ;
                }
                continue ;
            }</pre>
			<pre>            if (zi == "!(")
                zi += 2 ;</pre>
			<pre>            if (zi == "lte IE" || zi == "lt IE" || zi == "gte IE" || zi == "gt IE" || zi == "IE")
            {
                //  We are not and never will be IE so ignore conditional comment</pre>
			<pre>                for (zi += 2 ; !zi.eof() ; zi++)
                {
                    if (zi == "&lt;![endif]&gt;")     { zi += 10 ; break ; }
                    if (zi == "&lt;![endif]--&gt;")   { zi += 12 ; break ; }
                }
                continue ;
            }</pre>
			<pre>            //  Include non IE stuff</pre>
			<pre>            for (zi += 2 ; !zi.eof() &amp;&amp; *zi != CHAR_MORE ; zi++) ;
            if (zi.eof())
            {
                threadLog("Unterminated conditional comment (line &#37;d)\n", zi.Line()) ;
                return E_FORMAT ;
            }</pre>
			<pre>            zi++ ;
            if (zi == "&lt;!--&gt;")
                zi += 5 ;
            if (zi == "--&gt;")
                zi += 3 ;</pre>
			<pre>            for (; !zi.eof() ; zi++)
            {
                if (*zi == CHAR_LESS)
                {
                    if (zi == "&lt;![endif]&gt;")         { zi += 10 ; break ; }
                    if (zi == "&lt;![endif]--&gt;")       { zi += 12 ; break ; }
                    if (zi == "&lt;![endif]&gt;--&gt;")      { zi += 13 ; break ; }
                    if (zi == "&lt;!--&lt;![endif]--&gt;")   { zi += 16 ; break ; }
                }</pre>
			<pre>                X.AddByte(*zi) ;
            }
            continue ;
        }</pre>
			<pre>        //  Ignore deleted text within comment (&lt;!-- and --&gt;) tags. Note these cannot be nested
        if (zi == "&lt;!--")
        {
            nStart = zi.Line() ;
            bClosed = false ;</pre>
			<pre>            for (zi += 4 ; !zi.eof() ; zi++)
            {
                if (zi == "--&gt;")
                    { zi += 3 ; bClosed = true ; break ; }
            }</pre>
			<pre>            //  Closure is tracked by flag rather than by testing for eof, as a comment that ends the document leaves the iterator at eof when properly closed
            if (!bClosed)
            {
                threadLog("_htmPreproc. Unterminated normal comment starting on line &#37;d\n", nStart) ;
                return E_FORMAT ;
            }
            continue ;
        }</pre>
			<pre>        //  A '&lt;' that does not open a comment of any kind is kept
        X.AddByte(*zi) ;
        zi++ ;
    }</pre>
			<pre>    //  Nothing was removed so leave the supplied chain as it is
    if (X.Size() == Z.Size())
        return E_OK ;</pre>
			<pre>    Z.Clear() ;
    Z = X ;
    return E_OK ;
}</pre>
			<pre>hzEcode hzDocHtml::Load (hzChain&amp; Z)
{
    //  Populate the hzDocHtml object with HTML source code in the supplied chain.
    //
    //  Two scenarios are permitted - Full or Partial as follows:-
    //      1)  Full:       If the HTML source has the &lt;html&gt; as its first tag it will be considered as a full page and tested as such.
    //                      It will be expected to have the standard sub-tags of &lt;head&gt; and &lt;body&gt; and thier corresponding anti-tags.
    //                      If either of these are missing or in error (malformed or containing unxpected or malformed tags) the HTML
    //                      source code is deemed to be syntactically in error and the load fails.
    //
    //      2)  Partial:    If the opening tag of the HTML source code is not the &lt;html&gt; tag it is viable only if it would be viable as
    //                      a HTML fragment that could be seemlessly inserted into the &lt;body&gt; part of a whole HTML page. This is to say
    //                      that all it's tags must be legal sub-tags of &lt;body&gt; and not of &lt;head&gt; and nor must the &lt;body&gt; or &lt;head&gt; tag
    //                      or anti-tag be present.
    //
    //  In either case, tags are loaded into a tree of nodes (tags). The nodes/tags may be searched for and examined. 
    //
    //  Arguments:  1)  Z   The chain containing the HTML document
    //
    //  Returns:    E_FORMAT    If the HTML was rejected by the the HTML pre-processor _htmlPreproc() OR if any tags could not be processed by _proctag()
    //              E_OK        If the HTML was loaded successfully
    //
    //  Note:   Unlike XML where tags are named so that content in the tree can be searched directly, the nodes in HTML are not named
    //  named and so cannot be definitely referenced (they only have type). Some other process must apply application specific criteria
    //  to read meaning into the data.</pre>
			<pre>    _hzfunc("hzDocHtml::Load") ;</pre>
			<pre>    hzChain         nc ;            //  Node content
    hzChain         T ;             //  For token building
    hzChain         W ;             //  For token building
    chIter          zi ;            //  Chain iterator
    chIter          tw_start ;      //  Start of tagword marker
    chIter          tmp ;           //  Start of tagword marker
    chIter          limit ;         //  End of tag marker - Protection against malformed tags (NLA style)
    hzHtmElem*      pCN = 0 ;       //  Current HTML node
    hzHtmElem*      pNN ;           //  New HTML node
    hzHtmElem*      pX ;            //  HTML node for diagnostics
    hzHtmElem*      pCurForm = 0 ;  //  HTML node for diagnostics
    hzAttrset       ai ;            //  Attribute iterator
    hzHtmForm*      pForm = 0 ;     //  Form found in page
    hzPair          P ;             //  Name value pair (for forms and fields)
    hzString        strval ;        //  To test if current tag is being closed
    hzString        tagword ;       //  From MakeTag - just the tagname.
    hzString        wholetag ;      //  From MakeTag - the entire opening sequence if applicable
    hzString        anam ;          //  Attribute name
    hzString        aval ;          //  Attribute value
    hzHtagform      tf ;            //  Tag form
    uint32_t        nX ;            //  For nesting levels/general iteration
    uint32_t        nColon ;        //  Does the tagname contain a colon (3rd party tag)
    uint32_t        nLine ;         //  Line number for errors
    uint32_t        quote ;         //  Are we in a quoted string
    bool            bAnti ;         //  Tag is an anti-tag
    int32_t         cDelim ;        //  Delimiting char (single/double quote)
    hzEcode         rc = E_OK ;     //  return code</pre>
			<pre>    Clear() ;
    //m_Error.Clear() ;</pre>
			<pre>    //  Pre-process the HTML
    rc = _htmPreproc(Z) ;
    if (rc != E_OK)
        return rc ;</pre>
			<pre>    m_Content = Z ;</pre>
			<pre>    //  Make sure the HTML tags are loading into the lookup table
    if (!s_htagNam.Count())
        InitHtml() ;</pre>
			<pre>    //  Init the iterator
    zi = Z ;
    zi.Skipwhite() ;</pre>
			<pre>    //  Bypass the doctype if present
    if (zi.Equiv("&lt;!DOCTYPE"))
    {
        quote = 0 ;
        for (zi += 9 ; !zi.eof() ; zi++)
        {
            if (quote)
            {
                if (*zi == CHAR_DQUOTE)
                    quote = 0 ;
                continue ;
            }</pre>
			<pre>            if (*zi == CHAR_MORE)
                { zi++ ; break ; }</pre>
			<pre>            if (*zi == CHAR_DQUOTE)
                quote = 1 ;
        }</pre>
			<pre>        zi.Skipwhite() ;
    }</pre>
			<pre>    //  Look for the opening &lt;html&gt;
    for (; !zi.eof() ; zi++)
    {
        if (zi.Equiv("&lt;html"))
        {
            m_pRoot = _proctag(0, zi, HTAG_HTML) ;
            if (!m_pRoot)
                { threadLog("Could not establist root node (the &lt;html&gt; tag)\n") ; return E_FORMAT ; }
            break ;
        }
    }</pre>
			<pre>    if (!m_pRoot)
    {
        threadLog("No valid contents found before expected &lt;html&gt; tag - assuming a partial page\n") ;
        zi = Z ;
        zi.Skipwhite() ;
        pCN = new hzHtmElem() ;
        pCN-&gt;Init(this, 0, tagword, HTAG_NULL, m_vecTags.Count(), zi.Line()) ;
        m_vecTags.Add(pCN) ;
    }
    else
    {
        //  A &lt;html&gt; tag has been found so this is a full page. Look for &lt;head&gt; next
        for (; !zi.eof() ;)
        {
            if (zi.Equiv("&lt;head"))
            {
                m_pHead = _proctag(m_pRoot, zi, HTAG_HEAD) ;
                if (!m_pHead)
                    { threadLog("Could not process &lt;head&gt; tag\n") ; return E_FORMAT ; }
                break ;
            }
            zi++ ;
        }</pre>
			<pre>        if (!m_pHead)
            { threadLog("Expected a &lt;head&gt; tag\n") ; return E_FORMAT ; }
        pCN = m_pHead ;</pre>
			<pre>        //  Now get the subtags of &lt;head&gt;
        for (; rc == E_OK &amp;&amp; pCN &amp;&amp; !zi.eof() ;)
        {
            //  Handle tag content
            if (*zi != CHAR_LESS)
            {
                //  Ignore certain constructs
                if (zi == "//")
                {
                    for (zi += 2 ; !zi.eof() &amp;&amp; *zi != CHAR_NL ; zi++) ;
                    continue ;
                }</pre>
			<pre>                //  If not part of a construct, just agregate the char to the current tag's content, striping leading whitespace
                if (*zi &lt;= CHAR_SPACE &amp;&amp; pCN-&gt;m_tmpContent.Size() == 0)
                    { zi++ ; continue ; }
                pCN-&gt;m_tmpContent.AddByte(*zi) ;
                zi++ ;
                continue ;
            }</pre>
			<pre>            //  Ignore deleted text within comment (&lt;!-- and --&gt;) tags. Note these cannot be nested
            nLine = zi.Line() ;</pre>
			<pre>            if (zi == "&lt;!--[if")
            {
                for (zi += 7 ; !zi.eof() ; zi++)
                {
                    if (zi == "&lt;![endif]&gt;")     { zi += 10 ; break ; }
                    if (zi == "&lt;![endif]--&gt;")   { zi += 12 ; break ; }
                }
                continue ;
            }</pre>
			<pre>            if (zi == "&lt;![if")
            {
                for (zi += 5 ; !zi.eof() ; zi++)
                {
                    if (zi == "&lt;![endif]&gt;")     { zi += 10 ; break ; }
                    if (zi == "&lt;![endif]--&gt;")   { zi += 12 ; break ; }
                }
                continue ;
            }</pre>
			<pre>            if (zi == "&lt;!--")
            {
                for (zi += 4 ; !zi.eof() ; zi++)
                {
                    if (zi == "--&gt;")
                        { zi += 3 ; break ; }
                }
                continue ;
            }</pre>
			<pre>            //  Handle &lt;![CDATA[...]]&gt; block by converting the innards to straight data (apparently CDATA now legal in HTML)
            if (zi == "&lt;![CDATA[")
            {
                for (zi += 9 ; !zi.eof() ; zi++)
                {
                    if (zi == "]]&gt;")
                        { zi += 3 ; break ; }
                    pCN-&gt;m_tmpContent.AddByte(*zi) ;
                }
                continue ;
            }</pre>
			<pre>            //  Eliminate &lt;noscript&gt; tags from header (we don't use them)
            if (zi == "&lt;noscript")
            {
                for (zi += 9 ; !zi.eof() ; zi++)
                {
                    if (zi == "&lt;/noscript&gt;")
                        { zi += 11 ; break ; }
                }
                if (zi.eof())
                    { threadLog("Unclosed &lt;noscript&gt; block\n") ; rc = E_FORMAT ; break ; }
                continue ;
            }</pre>
			<pre>            //  At this point we have the '&lt;' start of tag char. Establish whole and tagword of possible HTML tag</pre>
			<pre>            wholetag.Clear() ;
            tagword.Clear() ;
    
            limit = zi ;
            limit++ ;
            W.AddByte(CHAR_LESS) ;
            bAnti = false ;
            if (*limit == CHAR_FWSLASH)
                { W.AddByte(CHAR_FWSLASH) ; bAnti = true ; limit++ ; }</pre>
			<pre>            nColon = 0 ;
            for (tw_start = limit ; !limit.eof() ; limit++)
            {
                if (*limit == CHAR_COLON || IsAlphanum(*limit))
                {
                    if (*limit == CHAR_COLON)
                        nColon++ ;</pre>
			<pre>                    T.AddByte(*limit) ;
                    W.AddByte(*limit) ;
                    continue ;
                }
                break ;
            }
            tagword = T ;
            T.Clear() ;
        
            for (; !limit.eof() ;)
            {
                W.AddByte(*limit) ;</pre>
			<pre>                if (*limit == CHAR_DQUOTE || *limit == CHAR_SQUOTE)
                {
                    cDelim = *limit ;</pre>
			<pre>                    for (limit++ ; !limit.eof() ; limit++)
                    {
                        if (*limit == CHAR_BKSLASH)
                        {
                            limit++ ;
                            if (*limit == cDelim)
                                continue ;
                        }
                        if (*limit == cDelim)
                            break ;
                    }
                }</pre>
			<pre>                if (*limit == CHAR_MORE)
                    break ;
                limit++ ;
            }</pre>
			<pre>            wholetag = W ;
            W.Clear() ;</pre>
			<pre>            if (*limit != CHAR_MORE)
            {
                threadLog("Malformed tag (&#37;s)\n", *wholetag) ;
                zi = limit ;
                continue ;
            }
            limit++ ;</pre>
			<pre>            //tagword.ToLower() ;</pre>
			<pre>            if (nColon)
            {
                if (!s_htagNam.Exists(tagword))
                {
                    tf.klas = HTCLASS_3RD ;
                    tf.rule = HTRULE_OPTION ;
                    tf.name = tagword ;
                    s_htagTyp.Insert(tf.type, tf) ;
                    s_htagNam.Insert(tf.name, tf) ;
                    threadLog("Inserted 3rd party HTML tag &#37;s\n", *tagword) ;
                }
            }</pre>
			<pre>            if (!s_htagNam.Exists(tagword))
            {
                if (bAnti)
                    threadLog("Line &#37;d case 1 Unknown lookup anti-tag &lt;/&#37;s&gt; (&#37;s)\n", zi.Line(), *tagword, *wholetag) ;
                else
                    threadLog("Line &#37;d Case 1 Unknown lookup tag &lt;&#37;s&gt; (&#37;d bytes)\n", zi.Line(), *tagword, wholetag.Length()) ;</pre>
			<pre>                pCN-&gt;m_tmpContent &lt;&lt; wholetag ;
                zi = limit ;
                continue ;
            }</pre>
			<pre>            tf = s_htagNam[tagword] ;</pre>
			<pre>            if (tf.type == HTAG_NULL)
            {
                if (bAnti)
                    threadLog("Line &#37;d case 2 Unknown lookup anti-tag &lt;/&#37;s&gt; (&#37;s)\n", zi.Line(), *tagword, *wholetag) ;
                else
                    threadLog("Line &#37;d Case 2 Unknown lookup tag &lt;&#37;s&gt; (&#37;d bytes)\n", zi.Line(), *tagword, wholetag.Length()) ;</pre>
			<pre>                pCN-&gt;m_tmpContent &lt;&lt; wholetag ;
                zi = limit ;
                continue ;
            }</pre>
			<pre>            //  Obtain tag name
            if (bAnti == false)
            {
                if (zi.Equiv("&lt;title&gt;"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_TITLE) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;meta&gt; tags\n", zi.Line()) ; }
                }
                else if (zi.Equiv("&lt;meta"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_META) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;meta&gt; tags\n", zi.Line()) ; }
                }
                else if (zi.Equiv("&lt;style"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_STYLE) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;style&gt; tags\n", zi.Line()) ; }
                }
                else if (zi.Equiv("&lt;script"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_SCRIPT) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;script&gt; tags\n", zi.Line()) ; }
                }
                else if (zi.Equiv("&lt;link"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_LINK) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;link&gt; tags\n", zi.Line()) ; }
                }
                else if (zi.Equiv("&lt;base"))
                {
                    pCN = _proctag(m_pHead, zi, HTAG_BASE) ;
                    if (!pCN)
                        { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;link&gt; tags\n", zi.Line()) ; }
                    //  Set m_Base
                    if (pCN-&gt;m_tmpContent.Size())
                        m_Base = pCN-&gt;m_tmpContent ;
                    else
                    {
                        //  set the m_Base to the first param
                        ai = pCN ;
                        if (ai.Value())
                            m_Base = ai.Value() ;
                        //  pAttr = pCN-&gt;GetFirstAttr() ;
                        //  if (pAttr)
                        //      m_Base = pAttr-&gt;value ;
                    }
                }
                else
                    { rc = E_FORMAT ; threadLog("Line &#37;d Could not process &lt;&#37;s&gt; tag within &lt;head&gt;\n", zi.Line(), *tagword) ; }</pre>
			<pre>                continue ;
            }</pre>
			<pre>            //  Handle antitag
            if (bAnti)
            {
                if (zi.Equiv("&lt;/head&gt;"))
                    { zi += 7 ; break ; }</pre>
			<pre>                //  Inactive (text rendering only) anti-tags
                if (tf.klas == HTCLASS_TXT)
                    { pCN-&gt;m_tmpContent &lt;&lt; wholetag ; zi = limit ; continue ; }</pre>
			<pre>                //  { zi = limit ; continue ; }</pre>
			<pre>                zi = limit ;</pre>
			<pre>                if (pCN-&gt;Type() == tf.type || tf.rule == HTRULE_SINGLE)
                    pCN = pCN-&gt;Parent() ;
                else
                {
                    threadLog("case 1 Tag mis-match. Current highest tag is &lt;&#37;s id=&#37;d, level=&#37;d&gt; but on line &#37;d we have an anti-tag for &#37;s\n",
                        *Tagtype2Txt(pCN-&gt;Type()), pCN-&gt;GetUid(), pCN-&gt;Level(), zi.Line(), *Tagtype2Txt(tf.type)) ;</pre>
			<pre>                    if (tf.rule == HTRULE_SINGLE)
                    {
                        //pCN = pX ;
                        pCN = pCN-&gt;Parent() ;
                        threadLog("Case 2 Corrected by allowing last tag as anti-tag\n") ;
                    }</pre>
			<pre>                    if (pCN-&gt;Type() == HTAG_TBL_CEL &amp;&amp; tf.type == HTAG_TR)
                    {
                        for (pX = pCN ; pX ; pX = pX-&gt;Parent())
                        {
                            if (pX-&gt;Type() == tf.type)
                            {
                                pCN = pX ;
                                threadLog("Corrected by decending to level &#37;d\n", pCN-&gt;Level()) ;
                                break ;
                            }
                        }
                    }
                }
                continue ;
            }</pre>
			<pre>            //  If none of the above just advance
            zi++ ;
        }</pre>
			<pre>        //  Advance to the &lt;body&gt; tag
        for (; !zi.eof() ;)
        {
            if (zi.Equiv("&lt;body"))
            {
                m_pBody = _proctag(m_pRoot, zi, HTAG_BODY) ;
                if (!m_pBody)
                    { threadLog("Expected an actual body\n") ; return E_FORMAT ; }
                break ;
            }
            zi++ ;
        }</pre>
			<pre>        if (!m_pBody)
            { threadLog("Expected a &lt;body&gt; tag\n") ; return E_FORMAT ; }
        pCN = m_pBody ;
    }</pre>
			<pre>    //
    //  Process document body. Here everything is either a tag, an anti-tag or it is tag-content. Both tags and antitags begin with a '&lt;' so the
    //  raw HTML is iterated and whenever the &lt; is found, it is tested for a known tag/antitag. In the general case of "&lt;tag&gt;content&lt;/tag&gt;", the
    //  process is to call _procTag() to parse the tag, garner the attributes and to create a new element (which the current element is then set
    //  to). Bytes after the tag are agregated to the current element's content until the antitag occurs (at which point the current element is
    //  then set back to the parent tag).
    //
    //  The exceptions to the general case:-
    //
    //  1)  Paragraph tags can be left open (antitag omited). These tags are closed by the parent antitag or by another paragraph tag.
    //
    //  2)  Print control tags which are completely ignored. These can never become the current tag so any content they have is aggregated to
    //      their parent tag.
    //
    //  3)  Links which do become current, but will have thier content aggregated to the parent tag.
    //</pre>
			<pre>    for (; pCN &amp;&amp; !zi.eof() ;)
    {
        //  Handle tag content
        if (*zi != CHAR_LESS)
        {
            if (pCN-&gt;Type() != HTAG_ANCHOR)
            {
                if (*zi &lt;= CHAR_SPACE &amp;&amp; pCN-&gt;m_tmpContent.Size() == 0)
                    { zi++ ; continue ; }
                pCN-&gt;m_tmpContent.AddByte(*zi) ;
            }
            else
            {
                if (pCN-&gt;Parent())
                    pCN-&gt;Parent()-&gt;m_tmpContent.AddByte(*zi) ;
            }</pre>
			<pre>            zi++ ;
            continue ;
        }</pre>
			<pre>        //  Ignore deleted text within &lt;strike&gt;&lt;/strike&gt; tags
        nLine = zi.Line() ;</pre>
			<pre>        if (zi == "&lt;strike&gt;")
        {
            for (zi += 8 ; !zi.eof() ; zi++)
            {
                if (zi == "&lt;/strike&gt;")
                    { zi += 9 ; break ; }
            }
            if (zi.eof())
                { threadLog("Unclosed comment block\n") ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        if (zi == "&lt;fb:like&gt;")
        {
            for (zi += 9 ; !zi.eof() ; zi++)
            {
                if (zi == "&lt;/fb:like&gt;")
                    { zi += 10 ; break ; }
            }
            if (zi.eof())
                { threadLog("Facebook special\n") ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        if (zi == "&lt;g:plusone&gt;")
        {
            for (zi += 11 ; !zi.eof() ; zi++)
            {
                if (zi == "&lt;/g:plusone&gt;")
                    { zi += 12 ; break ; }
            }
            if (zi.eof())
                { threadLog("Google special\n") ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        //  Ignore deleted text within comment (&lt;!-- and --&gt;) tags
        if (zi == "&lt;!--[if")
        {
            for (zi += 7 ; !zi.eof() ; zi++)
            {
                if (zi == "&lt;![endif]&gt;")     { zi += 10 ; break ; }
                if (zi == "&lt;![endif]--&gt;")   { zi += 12 ; break ; }
            }
            if (zi.eof())
                { threadLog("Unterminated &lt;!--[if cond]..&gt; tag starting line &#37;d\n", nLine) ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        if (zi == "&lt;![if")
        {
            for (zi += 5 ; !zi.eof() ; zi++)
            {
                if (zi == "&lt;![endif]&gt;")     { zi += 10 ; break ; }
                if (zi == "&lt;![endif]--&gt;")   { zi += 12 ; break ; }
            }
            if (zi.eof())
                { threadLog("Unterminated &lt;![if cond]..&gt; tag starting line &#37;d\n", nLine) ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        if (zi == "&lt;!--")
        {
            for (zi += 4 ; !zi.eof() ; zi++)
            {
                if (zi == "--&gt;")
                    { zi += 3 ; break ; }
            }
            if (zi.eof())
                { threadLog("Unterminated &lt;!--&gt; tag starting line &#37;d\n", nLine) ; rc = E_FORMAT ; break ; }
            continue ;
        }</pre>
			<pre>        /*
        **  At this point we have the '&lt;' start of tag char. Establish whole and tagword of possible HTML tag
        */</pre>
			<pre>        wholetag.Clear() ;
        tagword.Clear() ;
    
        limit = zi ;
        limit++ ;
        W.AddByte(CHAR_LESS) ;
        bAnti = false ;
        if (*limit == CHAR_FWSLASH)
            { W.AddByte(CHAR_FWSLASH) ; bAnti = true ; limit++ ; }</pre>
			<pre>        nColon = 0 ;
        for (tw_start = limit ; !limit.eof() ; limit++)
        {
            if (*limit == CHAR_COLON || IsAlphanum(*limit))
            {
                if (*limit == CHAR_COLON)
                    nColon++ ;</pre>
			<pre>                T.AddByte(*limit) ;
                W.AddByte(*limit) ;
                continue ;
            }
            break ;
        }
        tagword = T ;
        T.Clear() ;
        
        for (; !limit.eof() ;)
        {
            W.AddByte(*limit) ;</pre>
			<pre>            if (*limit == CHAR_DQUOTE || *limit == CHAR_SQUOTE)
            {
                cDelim = *limit ;</pre>
			<pre>                for (limit++ ; !limit.eof() ; limit++)
                {
                    if (*limit == CHAR_BKSLASH)
                    {
                        limit++ ;
                        if (*limit == cDelim)
                            continue ;
                    }
                    if (*limit == cDelim)
                        break ;
                }
            }</pre>
			<pre>            if (*limit == CHAR_MORE)
                break ;
            limit++ ;
        }</pre>
			<pre>        wholetag = W ;
        W.Clear() ;</pre>
			<pre>        if (*limit != CHAR_MORE)
        {
            threadLog("Malformed tag (&#37;s)\n", *wholetag) ;
            zi = limit ;
            continue ;
        }</pre>
			<pre>        tagword.ToLower() ;</pre>
			<pre>        if (nColon)
        {
            if (!s_htagNam.Exists(tagword))
            {
                tf.klas=HTCLASS_3RD ;
                tf.rule=HTRULE_OPTION ;
                tf.name = tagword ;
                s_htagTyp.Insert(tf.type, tf) ;
                s_htagNam.Insert(tf.name, tf) ;
                threadLog("Inserted 3rd party HTML tag &#37;s\n", *tagword) ;
            }
        }</pre>
			<pre>        //  if (bAnti)
        //      threadLog("Case 2 line &#37;d Doing antitag &#37;s\n", zi.Line(), *tagword) ;
        //  else
        //      threadLog("Case 2 line &#37;d Doing tag &#37;s\n", zi.Line(), *tagword) ;</pre>
			<pre>        tf = s_htagNam[tagword] ;</pre>
			<pre>        if (tf.type == HTAG_NULL)
        {
            //  Unrecognized tags are just made part of the content of the currently applicable tag</pre>
			<pre>            if (bAnti)
                threadLog("Line &#37;d Unknown lookup anti-tag &lt;/&#37;s&gt; (&#37;s)\n", zi.Line(), *tagword, *wholetag) ;
            else
                threadLog("Line &#37;d Case 3 Unknown lookup tag &lt;&#37;s&gt; (&#37;d bytes)\n", zi.Line(), *tagword, wholetag.Length()) ;</pre>
			<pre>            pCN-&gt;m_tmpContent &lt;&lt; wholetag ;
            zi = limit ;
            continue ;
        }</pre>
			<pre>        if (bAnti == false)
        {
            //  Ignore graphic tags
            if (tf.klas == HTCLASS_IMG)
                { zi = limit ; continue ; }</pre>
			<pre>            //  Ignore self-closed 'system' tags
            if (tf.klas == HTCLASS_SYS)
            {
                if (tf.type == HTAG_EMBED)
                    pCN-&gt;m_tmpContent &lt;&lt; "&lt;embed/&gt;" ;</pre>
			<pre>                if (tf.type == HTAG_NOEMBED)
                    pCN-&gt;m_tmpContent &lt;&lt; "&lt;noembed/&gt;" ;</pre>
			<pre>                for (; !zi.eof() ; zi++)
                {
                    if (*zi == CHAR_MORE)
                        { zi++ ; break ; }
                }</pre>
			<pre>                threadLog("Line &#37;d Bypassed system tag &lt;&#37;s&gt; (&#37;s)\n", zi.Line(), *tagword, *wholetag) ;
                zi = limit ;
                continue ;
            }</pre>
			<pre>            //  Handle HTCLASS_TXT 'in-content' tags. We just copy these through, complete with tag, antitag and content, to the content of the
            //  current tag. However these tags should still be placed in the m_mapTags and m_vecTags member.</pre>
			<pre>            if (tf.klas == HTCLASS_TXT) // || tf.type == HTAG_ANCHOR)
            {
                pCN-&gt;m_tmpContent &lt;&lt; wholetag ; zi = limit ;
                continue ;
            }</pre>
			<pre>            //  If we are suppressing anchors, we only want the content of a &lt;a href=...&gt;...&lt;/a&gt; sequence.
            //if (m_bOpflags &amp; HDOC_SUPPRESS_LINKS &amp;&amp; tf.klas == HTCLASS_LNK &amp;&amp; tf.type == HTAG_ANCHOR)
            //if (bFlags &amp; HDOC_ONLOAD_LINKS &amp;&amp; tf.klas == HTCLASS_LNK &amp;&amp; tf.type == HTAG_ANCHOR)
            //  { zi = limit ; continue ; }</pre>
			<pre>            //  Eliminate scripts (may revisit)
            if (zi.Equiv("&lt;script"))
            {
                //  plog-&gt;Out("&#37;s. ignoring a script tag ...\n", __FUNCTION__) ;</pre>
			<pre>                for (tmp = zi ; !tmp.eof() ; tmp++)
                {
                    if (tmp.Equiv("&lt;/script&gt;"))
                        { tmp += 9 ; zi = tmp ; break ; }
                }
                if (zi.eof())
                    { threadLog("Unclosed script tag\n") ; rc = E_FORMAT ; break ; }
                continue ;
            }</pre>
			<pre>            /*
            **  Process 'data structure' tags into nodes. These are tables (with there rows and columns) but also menus
            **  and ordered and unordered lists.
            */</pre>
			<pre>            pNN = 0 ;
            pNN = _proctag(pCN, zi, tf.type) ;</pre>
			<pre>            if (!pNN)
            {
                threadLog("No node allocated for tag &lt;&#37;s&gt;\n", *Tagtype2Txt(tf.type)) ;
                return E_FORMAT ;
            }</pre>
			<pre>            pCN = pNN ;</pre>
			<pre>            zi = limit ;</pre>
			<pre>            /*
            **  Handle the &lt;input&gt; tag. As this is it's own anti-tag it has no content, only parameters. We need to include the tag
            **  in the tree as it is active, but we need to effect the anti-tag aspect as well (so the level is not raised)
            */</pre>
			<pre>            if (tf.type == HTAG_INPUT)
                pCN = pCN-&gt;Parent() ;</pre>
			<pre>            continue ;
        }</pre>
			<pre>        //  Handle anti-tags
        if (bAnti)
        {
            //  Inactive (text rendering only) anti-tags
            if (tf.klas == HTCLASS_TXT) // || tf.type == HTAG_ANCHOR)
                { pCN-&gt;m_tmpContent &lt;&lt; wholetag ; zi = limit ; continue ; }</pre>
			<pre>            //  Ignore self-closed 'system' tags
            if (tf.klas == HTCLASS_SYS)
            {
                if (tf.type == HTAG_EMBED)
                    pCN-&gt;m_tmpContent &lt;&lt; "&lt;/embed&gt;" ;</pre>
			<pre>                if (tf.type == HTAG_NOEMBED)
                    pCN-&gt;m_tmpContent &lt;&lt; "&lt;/noembed&gt;" ;</pre>
			<pre>                for (; !zi.eof() ; zi++)
                {
                    if (*zi == CHAR_MORE)
                        { zi++ ; break ; }
                }</pre>
			<pre>                threadLog("Line &#37;d Bypassed system anti-tag &lt;&#37;s&gt; (&#37;s)\n", zi.Line(), *tagword, *wholetag) ;
                zi = limit ;
                continue ;
            }</pre>
			<pre>            zi = limit ;</pre>
			<pre>            if (pCN-&gt;Type() == tf.type || tf.rule == HTRULE_SINGLE)
                pCN = pCN-&gt;Parent() ;
            else
            {
                threadLog("case 2 Tag mis-match. Current highest tag is &lt;&#37;s id=&#37;d, level=&#37;d&gt; but on line &#37;d we have an anti-tag for &#37;s\n",
                    *Tagtype2Txt(pCN-&gt;Type()), pCN-&gt;GetUid(), pCN-&gt;Level(), zi.Line(), *Tagtype2Txt(tf.type)) ;</pre>
			<pre>                if (tf.rule == HTRULE_SINGLE)
                {
                    //pCN = pX ;
                    pCN = pCN-&gt;Parent() ;
                    threadLog("Case 1 Corrected by allowing last tag as anti-tag\n") ;
                }</pre>
			<pre>                if (pCN-&gt;Type() == HTAG_TBL_CEL &amp;&amp; tf.type == HTAG_TR)
                {
                    for (pX = pCN ; pX ; pX = pX-&gt;Parent())
                    {
                        if (pX-&gt;Type() == tf.type)
                        {
                            pCN = pX ;
                            threadLog("Corrected by decending to level &#37;d\n", pCN-&gt;Level()) ;
                            break ;
                        }
                    }
                }
            }
            continue ;
        }</pre>
			<pre>        threadLog("HANDLING ABD &#37;s (&#37;s)\n", *tagword, *wholetag) ;
    }</pre>
			<pre>    if (pCN)
        threadLog("End of file encountered whilst inside tag definition\n") ;</pre>
			<pre>    //  Move thru the tags in thier order of appearence and reduce where appropriate, the tag content held in chains to strings. Place forms in
    //  the list of forms and place form field tags with thier host forms.</pre>
			<pre>    for (nX = 0 ; nX &lt; m_vecTags.Count() ; nX++)
    {
        pX = m_vecTags[nX] ;</pre>
			<pre>        if (pX-&gt;Type() == HTAG_FORM)
        {
            //  Add the form to to m_Forms and set this to the current form
            pCurForm = pX ;
            pForm = new hzHtmForm() ;
            m_Forms.Add(pForm) ;
            continue ;
        }</pre>
			<pre>        if (pCurForm)
        {
            if (pX-&gt;Type() == HTAG_INPUT)
            {
                //  Add this field to the current form (report error if not in a current form)
                if (pX-&gt;Line() &lt; pCurForm-&gt;Anti())
                {
                    P.name = pX-&gt;Name() ;</pre>
			<pre>                    //  for (pAttr = pX-&gt;GetFirstAttr() ; pAttr ; pAttr = pAttr-&gt;next)
                    //  {
                    //      if (pAttr-&gt;name == "value")
                    //          { P.value = pAttr-&gt;value ; break ; }
                    //  }
                    for (ai = pX ; ai.Valid() ; ai.Advance())
                    {
                        anam = ai.Name() ; aval = ai.Value() ;</pre>
			<pre>                        if (anam == "value")
                            { P.value = aval ; break ; }
                    }</pre>
			<pre>                    pForm-&gt;fields.Add(P) ;
                }
                continue ;
            }</pre>
			<pre>            if (pX-&gt;Line() &gt; pCurForm-&gt;Anti())
                pCurForm = 0 ;
        }
    }</pre>
			<pre>    threadLog("END OF LOAD page has &#37;d links\n", m_vecLinks.Count()) ;</pre>
			<pre>    return rc ;
}</pre>
			<pre>hzEcode hzDocHtml::Load (const char* fpath)
{
    //  Load an HTML document from a file. The file content is read into a working chain, which is then handed to the chain based Load() overload
    //  for parsing into the tree of HTML elements.
    //
    //  Arguments:  1)  fpath   Source file of HTML document
    //
    //  Returns:    The code reported by OpenInputStrm() if that is anything other than E_OK (no parsing is attempted in that case)
    //              Otherwise the code returned by the chain based Load()
    //
    //  Note:       The meanings below are carried over from the earlier header. They presumably originate in the two calls named above (TODO confirm)
    //
    //              E_ARGUMENT  If no file path is supplied
    //              E_NOTFOUND  If the file does not exist
    //              E_NODATA    If the file is empty
    //              E_OPENFAIL  If the file cannot be read
    //              E_FORMAT    If a format error caused the file load to fail
    //              E_OK        If the operation is successful</pre>
			<pre>    //  Register under this function's own name (was mistakenly given as the XML document class)
    _hzfunc("hzDocHtml::Load") ;</pre>
			<pre>    ifstream    is ;    //  Input stream
    hzChain     Z ;     //  Chain for holding file content
    hzEcode     rc ;    //  Return code</pre>
			<pre>    //  Load document into a working chain
    rc = OpenInputStrm(is, fpath) ;
    if (rc == E_OK)
    {
        Z &lt;&lt; is ;
        is.close() ;</pre>
			<pre>        //  Parse the chain content
        rc = Load(Z) ;
    }</pre>
			<pre>    return rc ;
}</pre>
			<pre>hzHtmElem*  hzHtmElem::GetFirstChild    (void) const
{
    //  Obtain the first child of this element, by looking it up in the node array of the host document.
    //
    //  Arguments:  None
    //
    //  Returns:    Pointer to the element found in the host document node array at position m_Children less one
    //              NULL if m_Children is zero
    //
    //  Note:       hzexit() is called with E_NOINIT if this element has no host document</pre>
			<pre>    _hzfunc("hzHtmElem::GetFirstChild") ;</pre>
			<pre>    if (!m_pHostDoc)
        hzexit(E_NOINIT, "Element &#37;s: Node has no host document", *m_Name) ;</pre>
			<pre>    //  A non-zero m_Children is one more than the array position of the child
    if (m_Children)
        return m_pHostDoc-&gt;m_arrNodes.InSitu(m_Children-1) ;</pre>
			<pre>    return 0 ;
}</pre>
			<pre>hzHtmElem*  hzHtmElem::Sibling  (void) const
{
    //  Obtain the sibling of this element, by looking it up in the node array of the host document.
    //
    //  Arguments:  None
    //
    //  Returns:    Pointer to the element found in the host document node array at position m_Sibling less one
    //              NULL if m_Sibling is zero
    //
    //  Note:       hzexit() is called with E_NOINIT if this element has no host document</pre>
			<pre>    _hzfunc("hzHtmElem::Sibling") ;</pre>
			<pre>    if (!m_pHostDoc)
        hzexit(E_NOINIT, "Element &#37;s: Node has no host document", *m_Name) ;</pre>
			<pre>    //  A non-zero m_Sibling is one more than the array position of the sibling
    if (m_Sibling)
        return m_pHostDoc-&gt;m_arrNodes.InSitu(m_Sibling-1) ;</pre>
			<pre>    return 0 ;
}</pre>
			<pre>hzHtmElem*  hzHtmElem::Parent   (void) const
{
    //  Obtain the parent of this element, by looking it up in the node array of the host document.
    //
    //  Arguments:  None
    //
    //  Returns:    Pointer to the element found in the host document node array at position m_Parent less one
    //              NULL if m_Parent is zero
    //
    //  Note:       hzexit() is called with E_NOINIT if this element has no host document</pre>
			<pre>    _hzfunc("hzHtmElem::Parent") ;</pre>
			<pre>    if (!m_pHostDoc)
        hzexit(E_NOINIT, "Element &#37;s: Node has no host document", *m_Name) ;</pre>
			<pre>    //  A non-zero m_Parent is one more than the array position of the parent
    if (m_Parent)
        return m_pHostDoc-&gt;m_arrNodes.InSitu(m_Parent-1) ;</pre>
			<pre>    return 0 ;
}</pre>
			<pre>hzDocHtml*  hzHtmElem::GetTree  (void)
{
    //  Return the HTML document whose tree of HTML elements this hzHtmElem is a part. We start at the current node and follow the parentage back until
    //  an element whose level is zero is reached.
    //
    //  Arguments:  None
    //
    //  Returns:    The parent of the level zero element, cast to a hzDocHtml pointer
    //
    //  Note:       Fatal() is called if this element, or any element met on the way back, has no parent.
    //
    //  NOTE(review): Parent() yields a hzHtmElem pointer taken from the host document node array, so the cast on return looks questionable. It may be that
    //  the host document itself is what callers expect here. Confirm before relying on the result.</pre>
			<pre>    hzHtmElem*  pN ;    //  Current tree node</pre>
			<pre>    if (!m_Parent)
        Fatal("hzHtmElem::GetTree. 1. Tag &#37;s (line &#37;d, level &#37;d) has no parent\n", *m_Name, m_nLine, m_nLevel) ;</pre>
			<pre>    //  Every element visited, including the level zero element at which the walk stops, is tested for a parent before it is used. Parent() gives
    //  null when m_Parent is zero, so stepping without the test would dereference null on the next pass. Previously a stray semicolon left the loop
    //  without a body, so the test only ran once the walk had finished.
    for (pN = this ;; pN = pN-&gt;Parent())
    {
        if (!pN-&gt;m_Parent)
            Fatal("hzHtmElem::GetTree. 2. Tag &#37;s (line &#37;d, level &#37;d) has no parent\n", *pN-&gt;m_Name, pN-&gt;m_nLine, pN-&gt;m_nLevel) ;</pre>
			<pre>        if (!pN-&gt;m_nLevel)
            break ;
    }</pre>
			<pre>    return (hzDocHtml*) pN-&gt;Parent() ;
}</pre>
			<pre>uint32_t    hzHtmElem::_testnode    (hzVect&lt;hzHtmElem*&gt;&amp; tmpResult, const char* srchExp, uint32_t&amp; nLimit, uint32_t nLevel, bool bLog)
{
    //  Recursive support function to the non-recursive FindSubnodes function.
    //
    //  Split up first part of search expression (up to first period or null terminator), to a node/tag name and if present, a content speciifer
    //  (="some_value"), an attribute name (-&gt;"attr_name") an attribute content specifer.
    //
    //  We now apply the test to the current node and when required, to the children. We do not operate where nodes are at a higher
    //  level than the limit. This is because the FindSubnodes function is looking for the set of nodes matching the search expression that are
    //  found at the lowest level
    //
    //  Arguments:  1)  tmpResult   Vector of HTML elements this function will add to
    //              2)  srchExp     HTML element selection criteria
    //              3)  nLimit      Depth limit for probing of child nodes
    //              4)  nLevel      Depth level of this HTML element
    //              5)  bLog        Print log flag
    //
    //  Returns:    Number of elements added during this call on this element</pre>
			<pre>    _hzfunc("hzHtmElem::_testnode") ;</pre>
			<pre>    hzChain         Z ;                 //  For extracting search expression components
    hzHtmElem*      pNode ;             //  Node to be returned
    const char*     i ;                 //  Search expression iterator
    const char*     cpNext = 0 ;        //  Next part of search expression if present
    hzAttrset       ai ;                //  Attribute iterator
    hzString        cont ;              //  Convert elemnet's content to temp string
    hzString        reqNode_name ;      //  Required name of node
    hzString        reqChild_name ;     //  Required name of node child
    hzString        reqNode_cont ;      //  Required content of node
    hzString        reqAttr_name ;      //  Required name of attribute
    hzString        reqAttr_value ;     //  Required value of attribute
    hzString        anam ;              //  Attribute name
    hzString        aval ;              //  Attribute value
    uint32_t        nTotal ;            //  Total nodes found matching search expression
    bool            bFound ;            //  Does this node pass this part of search expression</pre>
			<pre>    //  If we are already at too high a level, return
    if (nLimit &amp;&amp; (m_nLevel &gt; nLimit))
    {
        if (bLog)
            threadLog("\t-&gt; Out of range, returning 0\n") ;
        return 0 ;
    }</pre>
			<pre>    //  Get required name of node
    for (i = srchExp ; IsAlpha(*i) ; i++)
        Z.AddByte(*i) ;
    reqNode_name = Z ;
    Z.Clear() ;</pre>
			<pre>    if (*i == CHAR_PERIOD)
    {
        i++ ;
        if (!IsAlpha(*i))
        {
            if (bLog)
                threadLog("Malformed criteria (&#37;s)\n", srchExp) ;
            return 0 ;
        }</pre>
			<pre>        cpNext = i ;
        for (; IsAlpha(*i) ; i++)
            Z.AddByte(*i) ;
        reqChild_name = Z ;
        Z.Clear() ;
    }</pre>
			<pre>    //  Get name of attribute if applicable
    if (i[0] == CHAR_MINUS &amp;&amp; i[1] == CHAR_MORE)
    {
        for (i += 2 ; IsUrlnorm(*i) ; i++)
            Z.AddByte(*i) ;
        reqAttr_name = Z ;
        Z.Clear() ;
    }</pre>
			<pre>    //  An equal sign after the tag name specifies what the tag contents must be for the tag to qualify
    if (*i == CHAR_EQUAL)
    {
        for (i += 2 ; *i != CHAR_DQUOTE ; i++)
            Z.AddByte(*i) ;
        reqAttr_value = Z ;
        Z.Clear() ;
    }</pre>
			<pre>    /*
    if (bLog)
    {
        threadLog("On-node [&#37;s] (&#37;d) Testing node with reqNode_name=&#37;s, reqChild_name=&#37;s, reqAttr_name=&#37;s, reqAttr_value=&#37;s level=&#37;d, slct=&#37;s\n",
            *Lineage(), m_nLevel, *reqNode_name, *reqChild_name, *reqAttr_name, *reqAttr_value, nLevel, srchExp) ;
        for (pNode = m_Children ; pNode ; pNode = pNode-&gt;m_Sibling)
            threadLog("\t-&gt; child: &#37;s\n", *pNode-&gt;m_Name) ;
    }
    */</pre>
			<pre>    //  Now we have the first part of the search expression, we test to see if this node meets this. If it does we still have to establish if
    //  the remainder of the search expression (if it exists) is satisfied.</pre>
			<pre>    //pAttr = 0 ;
    bFound = false ;</pre>
			<pre>    if (m_Name == reqNode_name)
    {
        //  We are on the specified node so if the value is not right, any named attribute does not exist or it does but with the
        //  wrong value, we return a zero (to end the examination of this branch of nodes)</pre>
			<pre>        bFound = true ;</pre>
			<pre>        if (!reqChild_name)
        {
            //  No child node has been specified so this node must be the last to check</pre>
			<pre>            if (reqNode_cont)
            {
                cont = m_tmpContent ;
                if (reqNode_cont != cont)
                    return 0 ;
            }</pre>
			<pre>            if (bFound &amp;&amp; reqAttr_name)
            {
                //  See if we can find an attribute of the requrired name on this node
                for (ai = this ; ai.Valid() ; ai.Advance())
                {
                    anam = ai.Name() ; aval = ai.Value() ;</pre>
			<pre>                    threadLog("Compare attr names (&#37;s to param-&gt;name of &#37;s)\n", *reqAttr_name, *anam) ;
                    if (anam == reqAttr_name)
                    {
                        threadLog("Found a attr name match ") ;
                        if (reqAttr_value)
                        {
                            if (reqAttr_value != aval)
                            {
                                threadLog("but not a pvalue match (&#37;s not param-&gt;val of &#37;s)\n", *reqAttr_value, *aval) ;
                                continue ;
                            }
                        }
                        threadLog(" - bingo\n") ;
                        break ;
                    }
                }</pre>
			<pre>                //  if (!pAttr)
                //      { threadLog("Oops - run out of params\n") ; return 0 ; }
            }
        }
    }</pre>
			<pre>    if (bFound)
    {
        /*
        **  Now we have passed the first part of the search expression, we can add this node to the results if there is no furthur search expression. But
        **  if there is, we have to establish if the remainder of the search expression is satisfied. This will nessesitate a recursive call of
        **  this function for each and every child of this node with the search expression pointer advanced. Only if at least one of these calls
        **  succeeds (returns a positive integer for nodes added to the result), can this call succeed.
        */</pre>
			<pre>        if (!cpNext)
        {
            //threadLog("\tMatched. Adding &#37;s at level &#37;d and position &#37;d to array\n", *Lineage(), m_nLevel, tmpResult.Count()) ;</pre>
			<pre>            nLimit = m_nLevel ;
            tmpResult.Add(this) ;
            return 1 ;
        }</pre>
			<pre>        //  Test children on the further search expression
        nTotal = 0 ;
        for (pNode = GetFirstChild() ; pNode ; pNode = pNode-&gt;Sibling())
        {
            //  if (!pNode-&gt;IsAncestor(this))
            //      Fatal("Case 2: Proported child failes to be ancestor of this\n") ;</pre>
			<pre>            if (nLimit &amp;&amp; (pNode-&gt;m_nLevel &gt; nLimit))
                continue ;</pre>
			<pre>            nTotal += pNode-&gt;_testnode(tmpResult, cpNext, nLimit, nLevel + 1, bLog) ;
        }
        return nTotal ;
    }</pre>
			<pre>    /*
    **  This node does not have the required name and so does not meet the first part of the search expression. However a child might meet the
    **  search expression so we try each in turn.
    */</pre>
			<pre>    nTotal = 0 ;
    for (pNode = GetFirstChild() ; pNode ; pNode = pNode-&gt;Sibling())
    {
        if (nLimit &amp;&amp; (pNode-&gt;m_nLevel &gt; nLimit))
            continue ;</pre>
			<pre>        if (pNode-&gt;Name() == reqNode_name)
            nTotal += pNode-&gt;_testnode(tmpResult, srchExp, nLimit, nLevel + 1, bLog) ;
    }</pre>
			<pre>    return nTotal ;
}</pre>
			<pre>void    hzHtmElem::FindSubnodes (hzVect&lt;hzHtmElem*&gt;&amp; result, const char* srchExp, bool bLog)
{
    //  Gather the elements found by _testnode() when it is started on this element (the element used to make the call) with the supplied search expression.
    //
    //  The search is not confined to the immediate children of the calling element. _testnode() calls itself on child elements, so a match may lie at any depth
    //  below the calling element.
    //
    //  Note:   The search expression is handed to _testnode() untouched. The forms below are those listed by the original author and are not verified here, as
    //          the parsing takes place in _testnode():-
    //
    //      1)  name="some_name";       - Only applies if the element is given an id which is often not the case
    //      2)  type="html_tagtype";    - The element is of the right type, eg &lt;table&gt;
    //      3)  class="class_value";    - The element has the given class value
    //      4)  pname="param_name";     - The element has the parameter
    //      5)  pvalue="param_value";   - The element has the parameter value
    //      6)  cont="content_value";   - The element has contents of the given value
    //
    //  Arguments:  1)  result      Vector to receive the matching elements. It is emptied before the search starts.
    //              2)  srchExp     Search expression
    //              3)  bLog        Set if detailed logging is required (passed on to _testnode)
    //
    //  Returns:    None</pre>
			<pre>    uint32_t    levelCap = 0 ;  //  Level limit handed to _testnode(). Zero means no limit is in force.</pre>
			<pre>    //  An element without a tree cannot be searched
    if (!GetTree())
        Fatal("No tree - aborting\n") ;</pre>
			<pre>    //  Begin with an empty result and let _testnode() work down from level 0
    result.Clear() ;
    _testnode(result, srchExp, levelCap, 0, bLog) ;
}</pre>
			<pre>uint32_t    hzDocHtml::ExtractLinksBasic    (hzVect&lt;hzUrl&gt;&amp; links, const hzSet&lt;hzString&gt;&amp; domains, const hzString&amp; form)
{
    //  Filter the links already held by this document in m_vecLinks, placing those that pass into the supplied vector. A link passes if it is not empty, if
    //  its domain is in the supplied set (tested only when the set is populated) and if it satisfies FormCheckCstr() against the supplied form (tested only
    //  when a form is supplied). With an empty domain set and no form, every non-empty link is passed.
    //
    //  The page content is not read here, only m_vecLinks is consulted.
    //
    //  Arguments:  1)  links       Vector to receive the accepted links. It is emptied first.
    //              2)  domains     Set of acceptable domains. If empty, no domain test is applied.
    //              3)  form        Criteria given to FormCheckCstr(). If empty, no such test is applied.
    //
    //  Returns:    Number of links in the supplied vector on completion</pre>
			<pre>    hzUrl       candidate ;     //  Link under consideration
    uint32_t    pos ;           //  Position in m_vecLinks</pre>
			<pre>    links.Clear() ;</pre>
			<pre>    for (pos = 0 ; pos &lt; m_vecLinks.Count() ; pos++)
    {
        candidate = m_vecLinks[pos] ;</pre>
			<pre>        //  Empty links are passed over
        if (!candidate)
            continue ;</pre>
			<pre>        //  Where domains are stipulated, the domain of the link must be one of them
        if (domains.Count() &amp;&amp; !domains.Exists(candidate.Domain()))
            continue ;</pre>
			<pre>        //  Where a form is stipulated, the link must conform to it
        if (form &amp;&amp; !FormCheckCstr(*candidate, *form))
            continue ;</pre>
			<pre>        links.Add(candidate) ;
    }</pre>
			<pre>    return links.Count() ;
}</pre>
			<pre>uint32_t    hzDocHtml::ExtractLinksContent  (hzMapS&lt;hzUrl,hzString&gt;&amp; links, const hzSet&lt;hzString&gt;&amp; domains, const hzString&amp; criteria)
{
    //  Build a map of link URL to link content from the anchor elements of this document. Every element in m_vecTags of type HTAG_ANCHOR is examined and each
    //  of its href attributes is considered. The attribute value is taken as the URL. The URL is accepted if it is not empty, if its domain is in the supplied
    //  set (tested only when the set is populated) and if it satisfies FormCheckCstr() against the supplied criteria (tested only when criteria is supplied).
    //  For an accepted URL, the content of the anchor element (m_tmpContent) is inserted in the map under that URL.
    //
    //  Arguments:  1)  links       Map of URL to anchor content. It is emptied first.
    //              2)  domains     Set of acceptable domains. If empty, no domain test is applied.
    //              3)  criteria    Criteria given to FormCheckCstr(). If empty, no such test is applied.
    //
    //  Returns:    Number of entries in the supplied map on completion</pre>
			<pre>    hzHtmElem*      pAnchor ;   //  Element under examination
    hzAttrset       attrs ;     //  Attribute iterator
    hzString        attrName ;  //  Name of current attribute
    hzString        text ;      //  Content of the anchor element
    hzUrl           target ;    //  URL taken from the href attribute
    uint32_t        tagNo ;     //  Position in m_vecTags</pre>
			<pre>    links.Clear() ;</pre>
			<pre>    for (tagNo = 0 ; tagNo &lt; m_vecTags.Count() ; tagNo++)
    {
        pAnchor = m_vecTags[tagNo] ;</pre>
			<pre>        //  Only anchors are of interest
        if (pAnchor-&gt;Type() != HTAG_ANCHOR)
            continue ;</pre>
			<pre>        for (attrs = pAnchor ; attrs.Valid() ; attrs.Advance())
        {
            //  Pass over any attribute that is not a href
            attrName = attrs.Name() ;
            if (!attrName.Equiv("href"))
                continue ;</pre>
			<pre>            //  Empty links are passed over
            target = attrs.Value() ;
            if (!target)
                continue ;</pre>
			<pre>            //  Where domains are stipulated, the domain of the link must be one of them
            if (domains.Count() &amp;&amp; !domains.Exists(target.Domain()))
                continue ;</pre>
			<pre>            //  Where criteria is stipulated, the link must conform to it
            if (criteria &amp;&amp; !FormCheckCstr(*target, *criteria))
                continue ;</pre>
			<pre>            text = pAnchor-&gt;m_tmpContent ;
            links.Insert(target, text) ;
        }
    }</pre>
			<pre>    return links.Count() ;
}</pre>
			<pre>hzEcode hzDocHtml::Import   (const hzString&amp; path)
{
    //  Read the file of the supplied pathname into a chain and hand the chain to Load(), which builds the document from it.
    //
    //  Arguments:  1)  path    The full pathname of the file to load
    //
    //  Returns:    The code from OpenInputStrm() if the file could not be opened, otherwise the code from Load(). Both functions are defined elsewhere. The codes
    //              listed by the original author are:-
    //
    //              E_ARGUMENT  If no file path is supplied
    //              E_NOTFOUND  If the file does not exist
    //              E_NODATA    If the file is empty
    //              E_OPENFAIL  If the file cannot be read
    //              E_FORMAT    If a format error caused the file load to fail
    //              E_OK        If the operation is successful</pre>
			<pre>    _hzfunc("hzDocHtml::Import") ;</pre>
			<pre>    ifstream    input ;     //  Input stream
    hzChain     content ;   //  File content
    hzEcode     rc ;        //  Return code</pre>
			<pre>    //  Without an open stream there is nothing to load
    rc = OpenInputStrm(input, path) ;
    if (rc != E_OK)
        return rc ;</pre>
			<pre>    //  Take in the whole file, then release it before processing
    content &lt;&lt; input ;
    input.close() ;</pre>
			<pre>    rc = Load(content) ;
    return rc ;
}</pre>
			<pre>void    hzDocHtml::_report  (hzLogger&amp; xlog, hzHtmElem* node)
{
    //  Category:   Diagnostics
    //
    //  Recursive support function for hzDocHtml::Report. Writes to the supplied logger the opening tag of the supplied element with its attributes, then the
    //  same for each child element in turn, then the trimmed content of the supplied element (if any) and lastly the closing tag. Every line written starts
    //  with the element level followed by an indent of one unit per level.
    //
    //  Arguments:  1)  xlog    The logfile to write report to
    //              2)  node    The element to report
    //
    //  Returns:    None</pre>
			<pre>    hzHtmElem*      pChild ;    //  Child element iterator
    hzChain         trimmed ;   //  Element content less leading whitespace and CR/NL pairs
    chIter          ci ;        //  Content iterator
    hzAttrset       attrs ;     //  Attribute iterator
    int             depth ;     //  Indent countdown</pre>
			<pre>    if (!node)
    {
        xlog.Out("hzDocHtml::_report: ERROR No HTML element suppled\n") ;
        return ;
    }</pre>
			<pre>    //  Opening tag: level, indent, tag name and then the attributes
    xlog.Out("&#37;2d: ", node-&gt;Level()) ;
    depth = node-&gt;Level() ;
    while (depth)
    {
        xlog &lt;&lt; ". " ;
        depth-- ;
    }
    xlog.Out("&lt;&#37;s", *Tagtype2Txt(node-&gt;Type())) ;</pre>
			<pre>    for (attrs = node ; attrs.Valid() ; attrs.Advance())
        xlog.Out(" &#37;s=\"&#37;s\"", attrs.Name(), attrs.Value()) ;
    xlog &lt;&lt; "&gt;\n" ;</pre>
			<pre>    //  Child elements are reported ahead of the content of this element
    for (pChild = node-&gt;GetFirstChild() ; pChild ; pChild = pChild-&gt;Sibling())
        _report(xlog, pChild) ;</pre>
			<pre>    //  Content, if there is any left after trimming
    if (node-&gt;m_tmpContent.Size())
    {
        //  Step over everything up to the first char above a space
        ci = node-&gt;m_tmpContent ;
        while (!ci.eof() &amp;&amp; *ci &lt;= CHAR_SPACE)
            ci++ ;</pre>
			<pre>        //  Copy the remainder. On a CR/NL pair the extra advance here plus that of the loop steps over both chars.
        for (; !ci.eof() ; ci++)
        {
            if (ci == "\r\n")
                ci++ ;
            else
                trimmed.AddByte(*ci) ;
        }</pre>
			<pre>        if (trimmed.Size())
        {
            xlog.Out("&#37;2d: ", node-&gt;Level()) ;
            depth = node-&gt;Level() ;
            while (depth)
            {
                xlog &lt;&lt; "  " ;
                depth-- ;
            }</pre>
			<pre>            xlog &lt;&lt; "[" &lt;&lt; trimmed &lt;&lt; "]\n" ;
        }
    }</pre>
			<pre>    //  Closing tag
    xlog.Out("&#37;2d: ", node-&gt;Level()) ;
    depth = node-&gt;Level() ;
    while (depth)
    {
        xlog &lt;&lt; ". " ;
        depth-- ;
    }
    xlog.Out("&lt;/&#37;s&gt;\n", *Tagtype2Txt(node-&gt;Type())) ;
}</pre>
			<pre>void    hzDocHtml::Report   (hzLogger&amp; xlog)
{
    //  Write a two part report on this document to the supplied logger. The first part is a flat list with one line for each element in m_vecTags, showing
    //  the id of the element, the ids of its parent, first child and sibling (0 where there is none), its level, tag name and content. The second part is
    //  the tree of elements as written by _report(), starting at the root.
    //
    //  Arguments:  1)  xlog    The logfile to write report to
    //  Returns:    None</pre>
			<pre>    _hzfunc("hzDocHtml::Report") ;</pre>
			<pre>    hzHtmElem*  pElem ;         //  Current element
    hzString    content ;       //  Content of current element
    uint32_t    tagNo ;         //  Position in m_vecTags</pre>
			<pre>    //  Part one: the flat list. The loop below does nothing when there are no elements.
    if (!m_vecTags.Count())
        xlog.Out("PAGE is EMPTY - No nodes in Vector\n") ;</pre>
			<pre>    for (tagNo = 0 ; tagNo &lt; m_vecTags.Count() ; tagNo++)
    {
        pElem = m_vecTags[tagNo] ;
        content = pElem-&gt;m_tmpContent ;</pre>
			<pre>        xlog.Out("id=&#37;d par=&#37;d subs=&#37;d nxt=&#37;d lev=&#37;d: &#37;s [&#37;s]\n",
            pElem-&gt;GetUid(),
            pElem-&gt;Parent() ? pElem-&gt;Parent()-&gt;GetUid() : 0,
            pElem-&gt;GetFirstChild() ? pElem-&gt;GetFirstChild()-&gt;GetUid() : 0,
            pElem-&gt;Sibling() ? pElem-&gt;Sibling()-&gt;GetUid() : 0,
            pElem-&gt;Level(),
            *Tagtype2Txt(pElem-&gt;Type()),
            *content) ;
    }</pre>
			<pre>    //  Part two: the tree
    if (m_pRoot)
        _report(xlog, m_pRoot) ;
    else
        xlog.Out("PAGE is EMPTY - No subnodes of root\n") ;
}</pre>
			<pre>hzEcode hzDocHtml::_xport   (hzChain&amp; Z, hzHtmElem* node)
{
    //  Recursive support function for hzDocHtml::Export. Appends to the supplied chain the opening tag of the supplied element with its attributes, then the
    //  trimmed content of the element (if any), then the same for each child element in turn, and lastly the closing tag. Every line written starts with the
    //  element level followed by an indent of one unit per level.
    //
    //  Arguments:  1)  Z       The output chain
    //              2)  node    The element to export
    //
    //  Returns:    E_ARGUMENT  If no HTML element is supplied
    //              E_OK        Otherwise. Note the codes returned by the calls made on child elements are not examined.</pre>
			<pre>    hzChain         trimmed ;   //  Element content less leading whitespace and CR/NL pairs
    chIter          ci ;        //  Content iterator
    hzHtmElem*      pChild ;    //  Child element iterator
    hzAttrset       attrs ;     //  Attribute iterator
    int             depth ;     //  Indent countdown</pre>
			<pre>    if (!node)
        return E_ARGUMENT ;</pre>
			<pre>    //  Opening tag: level, indent, tag name and then the attributes
    Z.Printf("&#37;2d: ", node-&gt;Level()) ;
    depth = node-&gt;Level() ;
    while (depth)
    {
        Z &lt;&lt; ". " ;
        depth-- ;
    }
    Z.Printf("&lt;&#37;s", *Tagtype2Txt(node-&gt;Type())) ;</pre>
			<pre>    for (attrs = node ; attrs.Valid() ; attrs.Advance())
        Z.Printf(" &#37;s=\"&#37;s\"", attrs.Name(), attrs.Value()) ;
    Z &lt;&lt; "&gt;\n" ;</pre>
			<pre>    //  Content, if there is any left after trimming
    if (node-&gt;m_tmpContent.Size())
    {
        //  Step over everything up to the first char above a space
        ci = node-&gt;m_tmpContent ;
        while (!ci.eof() &amp;&amp; *ci &lt;= CHAR_SPACE)
            ci++ ;</pre>
			<pre>        //  Copy the remainder. On a CR/NL pair the extra advance here plus that of the loop steps over both chars.
        for (; !ci.eof() ; ci++)
        {
            if (ci == "\r\n")
                ci++ ;
            else
                trimmed.AddByte(*ci) ;
        }</pre>
			<pre>        if (trimmed.Size())
        {
            Z.Printf("&#37;2d: ", node-&gt;Level()) ;
            depth = node-&gt;Level() ;
            while (depth)
            {
                Z &lt;&lt; "  " ;
                depth-- ;
            }</pre>
			<pre>            Z.AddByte('[') ;
            Z &lt;&lt; trimmed ;
            Z.AddByte(']') ;
            Z.AddByte(CHAR_NL) ;
        }
    }</pre>
			<pre>    //  Child elements follow the content of this element
    for (pChild = node-&gt;GetFirstChild() ; pChild ; pChild = pChild-&gt;Sibling())
        _xport(Z, pChild) ;</pre>
			<pre>    //  Closing tag
    Z.Printf("&#37;2d: ", node-&gt;Level()) ;
    depth = node-&gt;Level() ;
    while (depth)
    {
        Z &lt;&lt; ". " ;
        depth-- ;
    }
    Z.Printf("&lt;/&#37;s&gt;\n", *Tagtype2Txt(node-&gt;Type())) ;</pre>
			<pre>    return E_OK ;
}</pre>
			<pre>hzEcode hzDocHtml::Export   (const hzString&amp; filepath)
{
    //  Exports a HTML page to a file named as per the supplied file path. The file begins with the requested and the actual URL of the page (each only if it
    //  is set). This is followed by the tree of elements as written by _xport() or, where the document has no root element, by the raw page content.
    //
    //  Arguments:  1)  filepath    The file to export the HTML document to
    //
    //  Returns:    E_ARGUMENT  If no export file path is supplied
    //              E_NODATA    If the document has neither a root element nor any raw content
    //              E_OPENFAIL  If the export file could not be opened for writing
    //              E_WRITEFAIL If a write to the export file failed
    //              E_OK        If the export ran to completion</pre>
			<pre>    _hzfunc("hzDocHtml::Export") ;</pre>
			<pre>    ofstream    os ;        //  Output stream
    hzChain     Z ;         //  Working chain for output construction
    hzEcode     rc = E_OK ; //  Return code</pre>
			<pre>    if (!filepath)
        return hzerr(E_ARGUMENT, "No pathname supplied") ;</pre>
			<pre>    //  With no element tree and no raw content there is nothing to write
    if (!m_pRoot &amp;&amp; !m_Content.Size())
        return hzerr(E_NODATA, "Empty page (no root node). Nothing written to file &#37;s\n", *filepath) ;</pre>
			<pre>    //  Dump out to file
    os.clear() ;
    os.open(*filepath) ;
    if (os.fail())
        return hzerr(E_OPENFAIL, "Could not open file &#37;s\n", *filepath) ;</pre>
			<pre>    //  Write the URL header. Both URLs are tested as objects so that an unset URL is left out. The actual URL was formerly tested by way of its string
    //  pointer, which does not say if the URL is set when that pointer is never null.
    if (m_Info.m_urlReq)
        Z.Printf("URL (req): &#37;s\n", *m_Info.m_urlReq) ;
    if (m_Info.m_urlAct)
        Z.Printf("URL (act): &#37;s\n", *m_Info.m_urlAct) ;
    os &lt;&lt; Z ;
    if (os.fail())
        rc = E_WRITEFAIL ;
    Z.Clear() ;</pre>
			<pre>    //  Write the body, but only if the header went out cleanly
    if (rc == E_OK)
    {
        if (m_pRoot)
            rc = _xport(Z, m_pRoot) ;
        else
            Z = m_Content ;</pre>
			<pre>        os &lt;&lt; Z ;
        if (os.fail())
            rc = E_WRITEFAIL ;
    }</pre>
			<pre>    os.close() ;
    return rc ;
}</pre>
			<pre>void    hzDocHtml::Clear    (void)
{
    //  Delete every element of the document and empty the collections that describe it. The elements are deleted by a single pass through m_vecTags, no
    //  recursion is involved. After the call the document has no root, head or body element.
    //
    //  Arguments:  None
    //  Returns:    None</pre>
			<pre>    hzHtmElem*  pNode ;     //  Node pointer
    uint32_t    nIndex ;    //  Document tags iterator</pre>
			<pre>    for (nIndex = 0 ; nIndex &lt; m_vecTags.Count() ; nIndex++)
    {
        pNode = m_vecTags[nIndex] ;
        delete pNode ;
    }</pre>
			<pre>    //  m_mapTags is emptied along with m_vecTags. It supplies element pointers to the FindElements functions and, on the assumption that these are the
    //  elements deleted above, they would otherwise be left dangling.
    m_vecTags.Clear() ;
    m_mapTags.Clear() ;
    m_vecLinks.Clear() ;
    m_setLinks.Clear() ;
    m_Emails.Clear() ;</pre>
			<pre>    m_pRoot = 0 ;
    m_pHead = 0 ;
    m_pBody = 0 ;
}</pre>
			<pre>hzEcode hzDocHtml::FindElements (hzVect&lt;hzHtmElem*&gt;&amp; elements, hzString&amp; htag, hzString&amp; attrName, hzString&amp; attrValue)
{
    //  Find all elements in a page with the given tag name and/or attribute and value. The elements are taken from m_mapTags. Where a tag name is supplied
    //  only the elements filed under that name are examined, otherwise all are.
    //
    //  An element qualifies as follows:-
    //
    //      1)  No attribute name or value supplied     - Every element examined qualifies
    //      2)  Attribute name only                     - The element must have an attribute of that name
    //      3)  Attribute name and value                - The element must have an attribute of that name with that value
    //      4)  Attribute value only                    - The element must have an attribute (of any name) with that value
    //
    //  Arguments:  1)  elements    Vector to receive the qualifying elements. It is emptied first.
    //              2)  htag        The tag name. If empty, all elements are examined.
    //              3)  attrName    The attribute name (optional)
    //              4)  attrValue   The attribute value (optional)
    //
    //  Returns:    E_NOTFOUND  If a tag name is supplied and the document has no element of that name
    //              E_OK        Otherwise. Note the vector of elements can still be empty if no element qualified.</pre>
			<pre>    hzHtmElem*      pElement ;  //  Element under test
    hzAttrset       ai ;        //  Attribute iterator
    hzString        anam ;      //  Attribute name
    hzString        aval ;      //  Attribute value
    int32_t         Lo ;        //  First position in m_mapTags to investigate
    int32_t         Hi ;        //  Last position in m_mapTags to investigate
    int32_t         nIndex ;    //  m_mapTags iterator
    bool            bOk ;       //  OK to add the element</pre>
			<pre>    elements.Clear() ;</pre>
			<pre>    //  The positions are signed so that a negative (not found) result from First() can be detected and so that an empty map gives a Hi of -1 and with it,
    //  no iterations below.
    Lo = 0 ;
    Hi = (int32_t) m_mapTags.Count() - 1 ;</pre>
			<pre>    if (htag)
    {
        //  A tagname has been supplied so limit the investigation to tags with the tagname
        Lo = m_mapTags.First(htag) ;
        if (Lo &lt; 0)
            return E_NOTFOUND ;
        Hi = m_mapTags.Last(htag) ;
    }</pre>
			<pre>    //  Investigate elements
    for (nIndex = Lo ; nIndex &lt;= Hi ; nIndex++)
    {
        pElement = m_mapTags.GetObj(nIndex) ;</pre>
			<pre>        if (!attrName &amp;&amp; !attrValue)
        {
            //  No attribute criteria so the element qualifies on its tag name alone
            bOk = true ;
        }
        else
        {
            //  The element needs one attribute that meets whichever of the name and the value have been supplied
            bOk = false ;
            for (ai = pElement ; ai.Valid() ; ai.Advance())
            {
                anam = ai.Name() ; aval = ai.Value() ;</pre>
			<pre>                if (attrName &amp;&amp; anam != attrName)
                    continue ;
                if (attrValue &amp;&amp; aval != attrValue)
                    continue ;</pre>
			<pre>                bOk = true ;
                break ;
            }
        }</pre>
			<pre>        if (bOk)
            elements.Add(pElement) ;
    }</pre>
			<pre>    return E_OK ;
}</pre>
			<pre>hzEcode hzDocHtml::FindElements (hzVect&lt;hzHtmElem*&gt;&amp; elements, const char* srchExp)
{
    //  Find all tags meeting the supplied search expression and place pointers to the tags in the supplied results vector.
    //
    //  The search expression as parsed by this function has up to three parts:-
    //
    //      1)  A tag name or a series of tag names separated by periods. The last name is that of the tags sought and those before it name, from the outermost
    //          inwards, the ancestors a tag must have (parent, grandparent and so on working back through the series).
    //      2)  The sequence -&gt; followed by an attribute name. If present, a tag must have an attribute of this name.
    //      3)  An equal sign followed by a value in single quotes. If present, a tag must have an attribute with this value.
    //
    //  If part 1 is absent, all tags in the document are tested against parts 2 and 3.
    //
    //  Arguments:  1)  elements    Vector to receive the matching tags. It is emptied first.
    //              2)  srchExp     Search expression
    //
    //  Returns:    E_ARGUMENT  If no search expression is supplied
    //              E_FORMAT    If the search expression is malformed
    //              E_OK        Otherwise. Note the vector of elements is empty if nothing matched.</pre>
			<pre>    _hzfunc("hzDocHtml::FindElements") ;</pre>
			<pre>    hzVect&lt;hzString&gt;    list ;      //  List of tagnames forming required node ancestry
    hzVect&lt;hzHtmElem*&gt;  found ;     //  Nodes matching on tag name and ancestry</pre>
			<pre>    hzChain         Z ;             //  For extracting tagnames etc
    hzHtmElem*      pN ;            //  Element
    hzHtmElem*      pK ;            //  Element ancestor
    hzAttrset       ai ;            //  Attribute iterator
    const char*     i ;             //  For processing criteria
    hzString        tnam ;          //  Tagname
    hzString        reqAttr_name ;  //  Attribute name (if any)
    hzString        reqAttr_value ; //  Attribute value (if any)
    int32_t         Lo ;            //  1st position in m_mapTags to investigate (signed as First() is tested for a negative result)
    int32_t         Hi ;            //  Lst position in m_mapTags to investigate
    int32_t         x ;             //  m_mapTags range iterator
    int32_t         v ;             //  Ancestry iterator (signed as it must be able to go below zero)
    uint32_t        n ;             //  Element iterator
    uint32_t        anc ;           //  Ancestry level</pre>
			<pre>    elements.Clear() ;</pre>
			<pre>    if (!srchExp)
        return hzerr(E_ARGUMENT, "No search expression supplied\n") ;</pre>
			<pre>    //  Get the leading tag name. It only goes on the list if there is one, otherwise the list would never be empty and the case of attribute criteria
    //  without a tag name could not arise.
    for (i = srchExp ; IsAlphanum(*i) ; i++)
        Z.AddByte(*i) ;
    tnam = Z ;
    Z.Clear() ;
    if (tnam)
        list.Add(tnam) ;</pre>
			<pre>    for (; *i == CHAR_PERIOD ;)
    {
        i++ ;
        if (!IsAlpha(*i))
            return hzerr(E_FORMAT, "Malformed criteria (&#37;s)\n", srchExp) ;</pre>
			<pre>        for (; IsAlphanum(*i) ; i++)
            Z.AddByte(*i) ;
        tnam = Z ;
        Z.Clear() ;
        list.Add(tnam) ;
    }</pre>
			<pre>    //  Get name of attribute if applicable
    if (i[0] == CHAR_MINUS &amp;&amp; i[1] == CHAR_MORE)
    {
        for (i += 2 ; IsUrlnorm(*i) ; i++)
            Z.AddByte(*i) ;
        reqAttr_name = Z ;
        Z.Clear() ;
    }</pre>
			<pre>    //  An equal sign specifies the value an attribute must have for the tag to qualify. The char after the equal sign is taken to be the opening quote and
    //  is stepped over. The value runs up to the closing single quote, which must be present.
    if (*i == CHAR_EQUAL)
    {
        if (!i[1])
            return hzerr(E_FORMAT, "Malformed criteria (&#37;s)\n", srchExp) ;</pre>
			<pre>        for (i += 2 ; *i &amp;&amp; *i != CHAR_SQUOTE ; i++)
            Z.AddByte(*i) ;
        if (*i != CHAR_SQUOTE)
            return hzerr(E_FORMAT, "Malformed criteria (&#37;s)\n", srchExp) ;</pre>
			<pre>        reqAttr_value = Z ;
        Z.Clear() ;
    }</pre>
			<pre>    anc = list.Count() ;
    if (anc)
    {
        //  Look up the last tag in the m_mapTags
        anc-- ;
        tnam = list[anc] ;</pre>
			<pre>        Lo = m_mapTags.First(tnam) ;
        if (Lo &lt; 0)
            return E_OK ;
        Hi = m_mapTags.Last(tnam) ;</pre>
			<pre>        threadLog("node (&#37;d - &#37;d) &#37;s a=&#37;s v=&#37;s", Lo, Hi, *tnam, *reqAttr_name, *reqAttr_value) ;</pre>
			<pre>        for (x = Lo ; x &lt;= Hi ; x++)
        {
            pN = m_mapTags.GetObj(x) ;</pre>
			<pre>            if (!anc)
                found.Add(pN) ;
            else
            {
                //  Progress thru ancestry. Each ancestor in turn must bear the name next back in the list. The tag qualifies only if the list is used up,
                //  which leaves v at -1.
                pK = pN-&gt;Parent() ;
                for (v = (int32_t) anc - 1 ; pK &amp;&amp; v &gt;= 0 ; pK = pK-&gt;Parent(), v--)
                {
                    threadLog("&lt;- &#37;s ", *pK-&gt;Name()) ;
                    if (pK-&gt;Name() != list[v])
                        break ;
                }
                if (v &lt; 0)
                {
                    found.Add(pN) ;
                    threadLog("OK ") ;
                }
            }
        }</pre>
			<pre>        //  Check all found nodes for attribute criteria
        for (n = 0 ; n &lt; found.Count() ; n++)
        {
            pN = found[n] ;</pre>
			<pre>            if (!reqAttr_name &amp;&amp; !reqAttr_value)
                elements.Add(pN) ;
            else
            {
                for (ai = pN ; ai.Valid() ; ai.Advance())
                {
                    if (reqAttr_name &amp;&amp; reqAttr_name != ai.Name())
                    {
                        threadLog("-1 ") ;
                        continue ;
                    }
                    if (reqAttr_value &amp;&amp; reqAttr_value != ai.Value())
                    {
                        threadLog("-2 ") ;
                        continue ;
                    }
                    elements.Add(pN) ;
                    threadLog("+ ") ;
                    break ;
                }
            }
        }</pre>
			<pre>        threadLog("done\n") ;
    }
    else
    {
        //  No tag name given so check all the nodes for attribute criteria
        for (n = 0 ; n &lt; m_mapTags.Count() ; n++)
        {
            pN = m_mapTags.GetObj(n) ;</pre>
			<pre>            if (!reqAttr_name &amp;&amp; !reqAttr_value)
                elements.Add(pN) ;
            else
            {
                for (ai = pN ; ai.Valid() ; ai.Advance())
                {
                    if (reqAttr_name &amp;&amp; reqAttr_name != ai.Name())
                        continue ;
                    if (reqAttr_value &amp;&amp; reqAttr_value != ai.Value())
                        continue ;
                    elements.Add(pN) ;
                    break ;
                }
            }
        }
    }</pre>
			<pre>    return E_OK ;
}</pre>
			<pre>hzEcode hzDocHtml::_selectTag   (hzSet&lt;hzHtmElem*&gt;&amp; parents, hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; tagspec)
{
    //  Finds the set of tags meeting the supplied tag specifier.
    //
    //  The tag specifier has the form of an opening HTML tag. It is a '&lt;' followed directly by the tag name, then zero or more attribute requirements each
    //  preceded by whitespace, then a '&gt;'. An attribute requirement is one of:-
    //
    //      1)  name=*          - The tag must have an attribute of the name, the value is of no concern
    //      2)  name='value'    - The tag must have an attribute of the name with the value
    //
    //  A tag qualifies if it has the tag name and meets all the attribute requirements. In addition, if the supplied set of parents is populated, a tag only
    //  qualifies if one of its ancestors is a member of that set.
    //
    //  Arguments:  1)  parents     Set of parent tags
    //              2)  elements    Set of selected tags. It is emptied first.
    //              3)  tagspec     Tag selection criteria
    //
    //  Returns:    E_SYNTAX    If the tag is malformed or illegal
    //              E_OK        If the tag is correct, even if no instances are found</pre>
			<pre>    _hzfunc("hzDocHtml::_selectTag") ;</pre>
			<pre>    hzMapS&lt;hzString,hzString&gt;   pairs ;     //  List of attrs and attr values the tag must possess (if any)</pre>
			<pre>    hzChain         word ;          //  Word extraction
    hzAttrset       ai ;            //  Attribute iterator
    hzHtmElem*      pE ;            //  HTML element (tag)
    hzHtmElem*      pAnc ;          //  Ancestor of the HTML element
    const char*     i ;             //  For processing term
    hzString        tagname ;       //  Name of tag sought
    hzString        pnam ;          //  Name of attr sought
    hzString        pval ;          //  Value of attr sought
    hzString        anam ;          //  Attribute name
    hzString        aval ;          //  Attribute value
    uint32_t        nP ;            //  Name-value pair iterator
    int32_t         Lo ;            //  First incidence of tagname (signed as First() is tested for a negative result)
    int32_t         Hi ;            //  Last incidence of tagname
    int32_t         nIndex ;        //  Tag iterator
    uint32_t        nFound ;        //  Number of attribute requirements met
    bool            bFound ;        //  Ancestry test
    hzEcode         rc = E_OK ;     //  Return code</pre>
			<pre>    elements.Clear() ;</pre>
			<pre>    /*
    **  Get tag name from the search criteria
    */</pre>
			<pre>    i = *tagspec ;</pre>
			<pre>    if (i[0] != CHAR_LESS)
        return hzerr(E_SYNTAX, "Term does not begin with an opening '&lt;' char") ;</pre>
			<pre>    for (i++ ; IsAlphanum(*i) ; i++)
        word.AddByte(*i) ;
    tagname = word ;
    word.Clear() ;</pre>
			<pre>    if (!tagname)
        return hzerr(E_SYNTAX, "No tagname supplied") ;</pre>
			<pre>    /*
    **  Get attribute requirements from the search criteria
    */</pre>
			<pre>    for (; *i == CHAR_SPACE ;)
    {
        //  Step over the whitespace ahead of the attribute name
        for (i++ ; *i &amp;&amp; *i &lt;= CHAR_SPACE ; i++) ;
        pnam = pval = (char*) 0 ;</pre>
			<pre>        for (; IsAlphanum(*i) ; i++)
            word.AddByte(*i) ;
        pnam = word ;
        word.Clear() ;</pre>
			<pre>        if (!pnam)
            { rc = E_SYNTAX ; threadLog("Attr name not supplied\n") ; break ; }
        if (*i != CHAR_EQUAL)
            { rc = E_SYNTAX ; threadLog("Attr name not followed by an assignment operator\n") ; break ; }</pre>
			<pre>        //  An asterisk in place of a quoted value means any value will do
        i++ ;
        if (*i == CHAR_ASTERISK)
        {
            i++ ;
            pval = "*" ;
            pairs.Insert(pnam, pval) ;
            continue ;
        }</pre>
			<pre>        if (*i != CHAR_SQUOTE)
            { rc = E_SYNTAX ; threadLog("Attr has no opening single quote\n") ; break ; }
        for (i++ ; *i &amp;&amp; *i != CHAR_SQUOTE ; i++)
            word.AddByte(*i) ;
        if (*i != CHAR_SQUOTE)
            { rc = E_SYNTAX ; threadLog("Attr has no closing single quote\n") ; break ; }
        i++ ;
        pval = word ;
        word.Clear() ;</pre>
			<pre>        pairs.Insert(pnam, pval) ;
    }</pre>
			<pre>    if (rc != E_OK)
        return rc ;</pre>
			<pre>    if (*i != CHAR_MORE)
        { threadLog("Term does not end with a closing '&gt;' char\n") ; return E_SYNTAX ; }</pre>
			<pre>    threadLog("Examining &#37;d tags for tagnam=&#37;s\n", m_vecTags.Count(), *tagname) ;
    for (nP = 0 ; nP &lt; pairs.Count() ; nP++)
    {
        pnam = pairs.GetKey(nP) ;
        pval = pairs.GetObj(nP) ;
        threadLog(" - with &#37;s=&#37;s\n", *pnam, *pval) ;
    }</pre>
			<pre>    /*
    **  Get all tags in document with the tagname. It is not a failure if none found.
    */</pre>
			<pre>    Lo = m_mapTags.First(tagname) ;
    if (Lo &lt; 0)
        threadLog("No matching tags for &lt;&#37;s&gt;\n", *tagname) ;
    else
    {
        Hi = m_mapTags.Last(tagname) ;</pre>
			<pre>        for (nIndex = Lo ; nIndex &lt;= Hi ; nIndex++)
        {
            pE = m_mapTags.GetObj(nIndex) ;</pre>
			<pre>            //  Exclude elements that have no ancestor in the set of parents
            if (parents.Count())
            {
                bFound = false ;
                for (pAnc = pE-&gt;Parent() ; pAnc ; pAnc = pAnc-&gt;Parent())
                {
                    if (parents.Exists(pAnc))
                    {
                        bFound = true ;
                        threadLog("Found parent of &#37;p\n", pAnc) ;
                        break ;
                    }</pre>
			<pre>                    threadLog("No such parent as &#37;p\n", pAnc) ;
                }</pre>
			<pre>                if (!bFound)
                    continue ;
            }</pre>
			<pre>            //  No attribute/value pairs specified so the tag is added to the list
            if (!pairs.Count())
                { elements.Insert(pE) ; continue ; }</pre>
			<pre>            //  Count the attributes of the tag that meet a requirement
            nFound = 0 ;
            for (ai = pE ; ai.Valid() ; ai.Advance())
            {
                anam = ai.Name() ; aval = ai.Value() ;</pre>
			<pre>                if (!pairs.Exists(anam))
                    continue ;</pre>
			<pre>                pval = pairs[anam] ;</pre>
			<pre>                if (pval == "*")
                    { nFound++ ; continue ; }
                if (pval == aval)
                    nFound++ ;
            }</pre>
			<pre>            //  If there is a match on every attribute/value pair specified, add to the list
            if (nFound == pairs.Count())
                elements.Insert(pE) ;
        }
    }</pre>
			<pre>    threadLog("Found &#37;d tags for tagspec=[&#37;s]\n", elements.Count(), *tagspec) ;</pre>
			<pre>    return rc ;
}</pre>
			<pre>hzEcode hzDocHtml::_selectTerm  (hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; term)
{
    //  Select the elements that match a 'term'. Within the context of HTML document tag selection, a term is either a single tag specifier or a series of tag
    //  specifiers separated by a '+' sign. In the latter case hierarchy is implied.
    //
    //  A single specifier such as &lt;div&gt; is passed to _selectTag() with no parents listed. A hierarchical term such as &lt;div class='body'&gt;+&lt;p&gt; selects the &lt;p&gt;
    //  tags that have, among their ancestors, a &lt;div&gt; tag with an attribute of class whose value is 'body'. Tags are selected if they have what is asked for in
    //  the term. There is not presently, any means to exclude tags if they have something we don't want them to have.
    //
    //  Multiple specifier terms are implemented by one call to _selectTag() per specifier, with the elements held after each call serving as the list of valid
    //  parents for the next call. _selectTag() applies no parent test when the set of parents is empty, so the series is abandoned as soon as the set of elements
    //  is left empty. To continue would allow the next specifier to select tags regardless of their ancestry.
    //
    //  Arguments:  1)  elements    Set of elements selected by this function
    //              2)  term        Tag selection criteria
    //
    //  Returns:    E_SYNTAX    If the term contains no tag specifier, or _selectTag() rejects a specifier
    //              E_OK        If the term is correct, even if no instances are found</pre>
			<pre>    _hzfunc("hzDocHtml::_selectTerm") ;</pre>
			<pre>    hzSet&lt;hzHtmElem*&gt;   parents ;   //  Valid parents for the current specifier (empty for the first)
    hzArray&lt;hzString&gt;   ar ;        //  Array of tag specifiers</pre>
			<pre>    uint32_t    x ;     //  For populating parents
    uint32_t    t ;     //  Tag specifier iterator
    hzEcode     rc ;    //  Return code</pre>
			<pre>    SplitCSV(ar, *term, CHAR_PLUS) ;</pre>
			<pre>    if (!ar.Count())
        return hzerr(E_SYNTAX, "No tag specifiers found in term") ;
    threadLog("Term is &#37;s (&#37;d) components\n", *term, ar.Count()) ;</pre>
			<pre>    for (t = 0 ; t &lt; ar.Count() ; t++)
    {
        threadLog("Term component &#37;d: &#37;s\n", t, *ar[t]) ;
    }</pre>
			<pre>    if (ar.Count() == 1)
    {
        //  Single specifier: Call the _selectTag function once with no parents listed
        rc = _selectTag(parents, elements, ar[0]) ;
        return rc ;
    }</pre>
			<pre>    //  There is more than one specifier. Call the _selectTag function with no parents listed to start with and then repeatedly with the elements
    //  found acting as the list of valid parents for the next call. Stop on error or as soon as there are no elements to act as parents.
    rc = _selectTag(parents, elements, ar[0]) ;</pre>
			<pre>    for (t = 1 ; rc == E_OK &amp;&amp; elements.Count() &amp;&amp; t &lt; ar.Count() ; t++)
    {
        //  Parents is the last tag's haul
        parents.Clear() ;
        for (x = 0 ; x &lt; elements.Count() ; x++)
            parents.Insert(elements.GetObj(x)) ;
        rc = _selectTag(parents, elements, ar[t]) ;
    }</pre>
			<pre>    threadLog("Found &#37;d tags for term=[&#37;s]\n", elements.Count(), *term) ;
    return rc ;
}</pre>
			<pre>hzEcode hzDocHtml::_selectExp   (hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; srchExp)
{
    //  Recursive support function for hzDocHtml::FindElements
    //
    //  Evaluates a search expression of the form 'operand' or 'operand op operand', where op is either OR or AND. An operand is either a sub-expression
    //  enclosed in parenthesis, which is evaluated by a recursive call to this function, or a term consisting of one or more tag specifiers, each in
    //  a &lt;&gt; block and optionally joined by a + sign, which is evaluated by _selectTerm.
    //
    //  With OR the elements found by either operand are selected. With AND only the elements found by both operands are selected.
    //
    //  NOTE(review): Text following the second operand is not examined. An expression of more than two operands is only evaluated in full if the
    //  remainder is enclosed in parenthesis.
    //
    //  Arguments:  1)  elements    The set of elements selected
    //              2)  srchExp     Search expression
    //
    //  Returns:    E_SYNTAX    If the expression is malformed
    //              E_OK        If the operation was successful (it still may have found no elements)</pre>
			<pre>    _hzfunc("hzDocHtml::_selectExp") ;</pre>
			<pre>    hzSet&lt;hzHtmElem*&gt;   setA ;      //  Element set for first operand
    hzSet&lt;hzHtmElem*&gt;   setB ;      //  Element set for second operand</pre>
			<pre>    hzChain         word ;          //  For building the text of an operand
    hzHtmElem*      pE ;            //  HTML element
    const char*     i ;             //  For processing criteria
    hzString        termA ;         //  First operand if it is a term
    hzString        termB ;         //  Second operand if it is a term
    hzString        expA ;          //  First operand if it is a parenthesised expression
    hzString        expB ;          //  Second operand if it is a parenthesised expression
    uint32_t        op ;            //  1 for OR and 2 for AND
    uint32_t        n ;             //  Counter
    uint32_t        level ;         //  Parenthesis
    hzEcode         rc = E_OK ;     //  Return code</pre>
			<pre>    /*
    **  Get 1st operand
    */</pre>
			<pre>    for (i = *srchExp ; *i &amp;&amp; *i &lt;= CHAR_SPACE ; i++) ;</pre>
			<pre>    if (*i == '(')
    {
        //  Copy everything up to, but not including, the matching close parenthesis
        level = 1 ;
        for (i++ ; level &amp;&amp; *i &gt;= CHAR_SPACE ; i++)
        {
            if (*i == '(')  level++ ;
            if (*i == ')')  level-- ;</pre>
			<pre>            if (level)
                word.AddByte(*i) ;
        }</pre>
			<pre>        //  The text ran out before the parenthesis was closed
        if (level)
            { threadLog("Unbalanced parenthesis in expression\n") ; rc = E_SYNTAX ; }
        expA = word ;
    }
    else if (*i == CHAR_LESS)
    {
        for (; *i == CHAR_LESS ;)
        {
            //  Copy the tag specifier. Stop at the end of the text rather than run past it if the closing '&gt;' is missing
            for (; *i &amp;&amp; *i != CHAR_MORE ; i++)
                word.AddByte(*i) ;
            if (*i != CHAR_MORE)
                { threadLog("Tag specifier has no closing '&gt;'\n") ; rc = E_SYNTAX ; break ; }</pre>
			<pre>            word.AddByte(CHAR_MORE) ;
            i++ ;
            if (*i == CHAR_PLUS)
                { word.AddByte(CHAR_PLUS) ; i++ ; }
        }</pre>
			<pre>        termA = word ;
    }
    else
    {
        threadLog("Expected an opening '&lt;'\n") ;
        rc = E_SYNTAX ;
    }</pre>
			<pre>    if (rc != E_OK)
        return rc ;</pre>
			<pre>    if (*i == 0)
    {
        //  No further operands so the elements found for the first operand are the result
        threadLog("Calling _selectTerm with a single exp [&#37;s] term [&#37;s]\n", *srchExp, *termA) ;
        if (expA)
            rc = _selectExp(elements, expA) ;
        if (termA)
            rc = _selectTerm(elements, termA) ;
        threadLog("case 1 Found &#37;d tags for term=[&#37;s]\n", elements.Count(), *srchExp) ;
        return rc ;
    }</pre>
			<pre>    /*
    **  Get operator
    */</pre>
			<pre>    for (; *i &amp;&amp; *i &lt;= CHAR_SPACE ; i++) ;</pre>
			<pre>    //  NOTE(review): This relies on CstrCompareI() reporting a match on "or"/"and" while further text follows the operator - confirm
    if (!CstrCompareI(i, "or"))
        { i += 2 ; op = 1 ; }
    else if (!CstrCompareI(i, "and"))
        { i += 3 ; op = 2 ; }
    else
        { threadLog("Illegal operator [&#37;s]\n", i) ; return E_SYNTAX ; }</pre>
			<pre>    /*
    **  Get 2nd operand
    */</pre>
			<pre>    for (; *i &amp;&amp; *i &lt;= CHAR_SPACE ; i++) ;
    word.Clear() ;</pre>
			<pre>    if (*i == '(')
    {
        level = 1 ;
        for (i++ ; level &amp;&amp; *i &gt;= CHAR_SPACE ; i++)
        {
            if (*i == '(')  level++ ;
            if (*i == ')')  level-- ;</pre>
			<pre>            if (level)
                word.AddByte(*i) ;
        }</pre>
			<pre>        if (level)
            { threadLog("Unbalanced parenthesis in expression\n") ; rc = E_SYNTAX ; }
        expB = word ;
    }
    else if (*i == CHAR_LESS)
    {
        for (; *i == CHAR_LESS ;)
        {
            for (; *i &amp;&amp; *i != CHAR_MORE ; i++)
                word.AddByte(*i) ;
            if (*i != CHAR_MORE)
                { threadLog("Tag specifier has no closing '&gt;'\n") ; rc = E_SYNTAX ; break ; }</pre>
			<pre>            word.AddByte(CHAR_MORE) ;
            i++ ;
            if (*i == CHAR_PLUS)
                { word.AddByte(CHAR_PLUS) ; i++ ; }
        }</pre>
			<pre>        termB = word ;
    }
    else
    {
        threadLog("Expected an opening '&lt;'\n") ;
        rc = E_SYNTAX ;
    }</pre>
			<pre>    if (rc != E_OK)
        return rc ;</pre>
			<pre>    /*
    **  Evaluate the operands. A failure in either is reported rather than being overwritten by the outcome of the other.
    */</pre>
			<pre>    threadLog("Calling _selectTerm with terms [&#37;s:&#37;s] and [&#37;s:&#37;s]\n", *expA, *termA, *expB, *termB) ;</pre>
			<pre>    if (expA)
        rc = _selectExp(setA, expA) ;
    if (termA)
        rc = _selectTerm(setA, termA) ;
    if (rc != E_OK)
        return rc ;</pre>
			<pre>    if (expB)
        rc = _selectExp(setB, expB) ;
    if (termB)
        rc = _selectTerm(setB, termB) ;
    if (rc != E_OK)
        return rc ;</pre>
			<pre>    /*
    **  Apply operator
    */</pre>
			<pre>    if (op == 1)
    {
        //  Union: Everything from both sets
        threadLog("OR'ing\n") ;</pre>
			<pre>        for (n = 0 ; n &lt; setA.Count() ; n++)
            elements.Insert(setA.GetObj(n)) ;</pre>
			<pre>        for (n = 0 ; n &lt; setB.Count() ; n++)
            elements.Insert(setB.GetObj(n)) ;</pre>
			<pre>        threadLog("(total &#37;d)\n", elements.Count()) ;
    }
    else
    {
        //  Intersection: Only those elements of the first set that are also in the second
        threadLog("AND'ing\n") ;
        for (n = 0 ; n &lt; setA.Count() ; n++)
        {
            pE = setA.GetObj(n) ;
            if (setB.Exists(pE))
                elements.Insert(pE) ;
        }
    }</pre>
			<pre>    threadLog("Found &#37;d tags for term=[&#37;s]\n", elements.Count(), *srchExp) ;
    return rc ;
}</pre>
			<pre>hzEcode hzDocHtml::FindElements (hzVect&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; srchExp)
{
    //  Select elements from this document according to the supplied search expression
    //
    //  Webpages (HTML documents) commonly contain a lot of superfluous matter whilst confining most information content to a limited set of elements (tags). If
    //  it is known which element(s) contain what information (eg title, author, body content etc), FindElements can be used to select these element(s) and from
    //  there, data can be efficiently extracted.
    //
    //  Arguments:  1)  The vector of HTML elements to be populated by this query. This is cleared first. The elements found are added in order of their uid
    //                  (presumably the order of their incidence in the HTML document - to be confirmed against where uids are assigned).
    //              2)  The criteria as a boolean expression of one or more terms, where each term specifies how elements are to be selected.
    //
    //  Returns:    E_SYNTAX    If the expression is malformed
    //              E_OK        If the operation was successful (it still may have found no elements). An empty expression selects nothing and is E_OK.
    //
    //  Support functions:
    //
    //  FindElements() itself calls the private member function _selectExp to do the selecting. This places selected elements in a hzSet, which ensures
    //  tags are only counted once. FindElements() then re-orders the elements from the hzSet into the hzVect by way of a map keyed by element uid.
    //
    //  _selectExp  (hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; exp) breaks up the expression into a term or 'term op term' and calls the second
    //  support function _selectTerm() to find the set of tags for each term.
    //
    //  _selectTerm (hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; exp) deals only with terms designed to specify elements. Each term consists of one or
    //  more tag specifiers, which when multiple, are separated by a + sign. A single tag specifier will identify a list of one or more tags within
    //  the document. Subsequent tag specifiers will do the same but will limit the search to descendents of the tags found under the previous tag
    //  specifier. The _selectTerm() calls the third support function _selectTag() on each tag specifier in turn, to actually do the selecting.
    //
    //  _selectTag  (hzSet&lt;hzHtmElem*&gt;&amp; parents, hzSet&lt;hzHtmElem*&gt;&amp; elements, const hzString&amp; exp) uses a single tag specifier to select tags from the
    //  HTML document and then if a list of parents (previously found tags) is supplied the selected tags are tested to ensure they have an ancestor
    //  among the list of parents.
    //
    //  Each tag specifier will be encased in a &lt;&gt; block and be of the general form &lt;tagname attr1='value1' attr2='value2' ...&gt;. If an attribute is
    //  specified the tag must match on the attribute to be selected. An attribute value of * (unquoted) matches any value.</pre>
			<pre>    _hzfunc("hzDocHtml::FindElements") ;</pre>
			<pre>    hzMapS&lt;uint32_t,hzHtmElem*&gt; ord ;   //  Selected elements keyed by uid
    hzSet&lt;hzHtmElem*&gt;           res ;   //  Results</pre>
			<pre>    hzHtmElem*  pE ;    //  The HTML element (tag)
    uint32_t    x ;     //  Result set iterator
    hzEcode     rc ;    //  Return code</pre>
			<pre>    elements.Clear() ;
    if (!srchExp)
        return E_OK ;</pre>
			<pre>    //  Evaluate expression
    rc = _selectExp(res, srchExp) ;
    if (rc != E_OK)
    {
        threadLog("Failed\n") ;
        return rc ;
    }</pre>
			<pre>    //  Assemble results: Key the elements found by their uid ...
    for (x = 0 ; x &lt; res.Count() ; x++)
    {
        pE = res.GetObj(x) ;
        ord.Insert(pE-&gt;GetUid(), pE) ;
    }</pre>
			<pre>    //  ... then read them back by position. The limit is the population of the map being read, not that of the set it was filled from
    for (x = 0 ; x &lt; ord.Count() ; x++)
    {
        pE = ord.GetObj(x) ;
        elements.Add(pE) ;
    }</pre>
			<pre>    threadLog("Got &#37;d elements\n", ord.Count()) ;
    return E_OK ;
}</pre>
			<pre>/*
**  Section 2:  hzHtmElem members
*/</pre>
			<pre>hzEcode hzHtmElem::Init (hzDocHtml* pRoot, hzHtmElem* pParent, hzString&amp; tagname, hzHtagtype type, uint32_t id, uint32_t line)
{
    //  Initialize a HTML element (tag) to the parent element (if any) and the tag type. Set also the id and line number (within the HTML in question). If
    //  a parent is supplied, this element is added to the parent as its last child.
    //
    //  Arguments:  1)  pRoot   Pointer to the HTML document root (only tested for being supplied)
    //              2)  pParent Pointer to the parent element of this (NULL if this element has no parent)
    //              3)  tagname The name of this tag
    //              4)  type    HTML Tag type
    //              5)  id      Numeric identifier
    //              6)  line    Line number of tag in the source HTML file
    //
    //  Returns:    E_ARGUMENT  If no root is supplied
    //              E_DUPLICATE If the parent reports this element as already being one of its children
    //              E_OK        If the HTML element was initialized</pre>
			<pre>    _hzfunc("hzHtmElem::Init") ;</pre>
			<pre>    if (!pRoot)
    {
        hzerr(E_ARGUMENT, "No root supplied") ;
        return E_ARGUMENT ;
    }</pre>
			<pre>    //  Set this element's own values first. The parent's _addnode() links to this element by the value of GetUid(), so (assuming GetUid() reports
    //  m_Uid) the id must be in place before the parent is told of this element.
    m_Name = tagname ;
    m_Type = type ;
    m_Uid = id ;
    m_nLine = line ;</pre>
			<pre>    m_Children = 0 ;
    m_Sibling = 0 ;</pre>
			<pre>    if (!pParent)
    {
        m_Parent = 0 ;
        m_nLevel = 0 ;
        return E_OK ;
    }</pre>
			<pre>    m_Parent = pParent-&gt;GetUid() ;
    m_nLevel = pParent-&gt;m_nLevel + 1 ;</pre>
			<pre>    //  Report, rather than discard, a failure to link this element to its parent
    return pParent-&gt;_addnode(this) ;
}</pre>
			<pre>hzEcode hzHtmElem::_addnode (hzHtmElem* pNode)
{
    //  Adds an element as a subnode of this. Subnodes are always appended.
    //
    //  The children of an element are held as a chain: This element holds the uid of its first child in m_Children and each child holds the uid of the next
    //  in m_Sibling. The new node is linked either as the first child or as the sibling of the current last child.
    //
    //  Arguments:  1)  pNode   Element to add as child of this element
    //
    //  Returns:    E_ARGUMENT  If no element is supplied
    //              E_DUPLICATE If the supplied element is actually this element, or is already a child of this element
    //              E_OK        If the element is added as child</pre>
			<pre>    _hzfunc("hzHtmElem::_addnode") ;</pre>
			<pre>    hzHtmElem*  p_temp ;    //  Current node pointer</pre>
			<pre>    if (!pNode)
        return hzerr(E_ARGUMENT, "Attempt to add a null node") ;
    if (pNode == this)
        return hzerr(E_DUPLICATE, "Attempt to add a node to itself (&#37;s)", *m_Name) ;</pre>
			<pre>    if (!m_Children)
        m_Children = pNode-&gt;GetUid() ;
    else
    {
        //  Walk to the last child. Every child, the last one included, is compared to the new node. Were the last child to be added again, it would become
        //  its own sibling.
        for (p_temp = GetFirstChild() ;; p_temp = p_temp-&gt;Sibling())
        {
            if (pNode == p_temp)
                return hzerr(E_DUPLICATE, "Attempt to add an already existing node to &#37;s", *m_Name) ;
            if (!p_temp-&gt;m_Sibling)
                break ;
        }
        p_temp-&gt;m_Sibling = pNode-&gt;GetUid() ;
    }</pre>
			<pre>    m_nSubnodes++ ;
    return E_OK ;
}</pre>
			<pre>/*
**  Section 2A: hzHtmTbl members
*/</pre>
			<pre>uint32_t    hzHtmTbl::Colcount  (void)
{
    //  Establishes the number of column headers.
    //
    //  Method is to return the value held in m_nCols if this is non-zero. Otherwise the headers are counted as the &lt;th&gt; elements among the children of the
    //  table's first child (the first row) and the count is kept in m_nCols. Rows other than the first are not examined, so a table without &lt;th&gt; headers in
    //  its first row has a column count of zero. Rowcount() depends on this to tell if the first row is a row of headers.
    //
    //  Arguments:  None
    //  Returns:    Number of column headers (0 if the table has no rows or has no headers in the first row)</pre>
			<pre>    hzHtmElem*  pE ;        //  First table row
    hzHtmElem*  pC ;        //  Columns</pre>
			<pre>    if (!m_nCols)
    {
        //  A table with no rows has no columns to count
        pE = GetFirstChild() ;
        if (!pE)
            return 0 ;</pre>
			<pre>        for (pC = pE-&gt;GetFirstChild() ; pC ; pC = pC-&gt;Sibling())
        {
            if (pC-&gt;Type() != HTAG_TH)
                continue ;
            m_nCols++ ;
        }
    }</pre>
			<pre>    return m_nCols ;
}</pre>
			<pre>uint32_t    hzHtmTbl::Rowcount  (void)
{
    //  Returns the number of rows. This will not include the row of headers.
    //
    //  The row count is the number of subnodes of the table, less one if the table has column headers (a non-zero column count). The count is established on
    //  every call so that the result does not depend on whether Colcount() happened to be called beforehand.
    //
    //  Arguments:  None
    //  Returns:    Number of rows in the table</pre>
			<pre>    if (!m_nSubnodes)
        return 0 ;</pre>
			<pre>    //  Count the column headers if neither count has been established
    if (!m_nCols &amp;&amp; !m_nRows)
        Colcount() ;</pre>
			<pre>    if (!m_nCols)
        m_nRows = m_nSubnodes ;
    else
        m_nRows = m_nSubnodes - 1 ;</pre>
			<pre>    return m_nRows ;
}</pre>
			<pre>hzString    hzHtmTbl::GetColl   (uint32_t nCol)
{
    //  Return the value (string) of the requested column header
    //
    //  In the case of a table, the only allowed sub-nodes are &lt;tr&gt; nodes. The columns for the table are all under the table's first &lt;tr&gt; sub-node as &lt;th&gt; nodes.
    //  These are the same nodes that Colcount() counts. Any other nodes in the first row are passed over and do not count towards the column number.
    //
    //  Arguments:  1)  nCol    The column number (the first column is 0)
    //
    //  Returns:    Instance of hzString by value - being the content of the column header, or empty if there is no such column</pre>
			<pre>    hzHtmElem*  pE ;        //  First table row
    hzHtmElem*  pC ;        //  Columns
    hzString    S ;         //  Target string
    uint32_t    nIndex ;    //  Column iterator</pre>
			<pre>    if (!m_Children)
        return S ;
    pE = GetFirstChild() ;
    if (!pE)
        return S ;</pre>
			<pre>    nIndex = 0 ;
    for (pC = pE-&gt;GetFirstChild() ; pC ; pC = pC-&gt;Sibling())
    {
        if (pC-&gt;Type() != HTAG_TH)
            continue ;</pre>
			<pre>        if (nIndex == nCol)
        {
            S = pC-&gt;m_tmpContent ;
            break ;
        }</pre>
			<pre>        nIndex++ ;
    }</pre>
			<pre>    return S ;
}</pre>
			<pre>hzString    hzHtmTbl::GetCell   (uint32_t nRow, uint32_t nCol)
{
    //  Return the cell from the supplied row and column.
    //
    //  Method is to move thru the table's &lt;tr&gt; subnodes to get to the row, then move thru that row's &lt;td&gt; (or equivalent) tags to get to the column within the
    //  row (the cell). The table's first subnode is taken to be the row of headers, so row 0 is the table's second subnode. The row is stepped to directly, as
    //  a counter starting at -1 cannot be used to allow for the header row: the counter is unsigned, -1 becomes the highest possible value and no row is ever
    //  reached.
    //
    //  Arguments:  1)  nRow    The row number (the first row after the headers is 0)
    //              2)  nCol    The column number (the first column is 0)
    //
    //  Returns:    Instance of hzString by value - of the table cell, or empty if there is no such cell. Note that if the table has no subnodes or the column
    //              count is not set, the text "No child nodes" or "No columns" is returned as the value.</pre>
			<pre>    hzHtmElem*  pR ;        //  Table row tags
    hzHtmElem*  pC ;        //  Cells within the row
    hzString    S ;         //  Target string
    uint32_t    row ;       //  Row counter
    uint32_t    col ;       //  Column counter</pre>
			<pre>    if (!m_Children)    { S = "No child nodes" ; return S ; }
    if (!m_nCols)       { S = "No columns" ; return S ; }</pre>
			<pre>    //  Step over the row of headers, then on to the requested row
    pR = GetFirstChild() ;
    if (pR)
        pR = pR-&gt;Sibling() ;
    for (row = 0 ; pR &amp;&amp; row &lt; nRow ; row++)
        pR = pR-&gt;Sibling() ;
    if (!pR)
        return S ;</pre>
			<pre>    //  Step to the requested cell within the row
    pC = pR-&gt;GetFirstChild() ;
    for (col = 0 ; pC &amp;&amp; col &lt; nCol ; col++)
        pC = pC-&gt;Sibling() ;
    if (pC)
        S = pC-&gt;m_tmpContent ;</pre>
			<pre>    return S ;
}</pre>
			<pre>/*
**  Non-member functions
*/</pre>
			<pre>hzDoctype   DeriveDoctype   (hzChain&amp; Z)
{
    //  Category:   Text Processing
    //
    //  Make a rudimentary determination of whether a document is HTML or XML. The document is scanned as far as the first '&lt;' character and the text from
    //  that point is tested against the opening sequences &lt;html, &lt;!DOCTYPE html, &lt;!DOCTYPE xml and &lt;?xml.
    //
    //  Argument:   Z   Input document
    //
    //  Returns:    DOCTYPE_HTML, DOCTYPE_XML or, if none of the sequences are found, DOCTYPE_UNDEFINED</pre>
			<pre>    chIter  cursor ;    //  Position within the document</pre>
			<pre>    //  Advance to the first opening angle bracket (or to the end of the document)
    cursor = Z ;
    while (!cursor.eof() &amp;&amp; *cursor != CHAR_LESS)
        cursor++ ;</pre>
			<pre>    if (cursor.Equiv("&lt;html"))
    {
        return DOCTYPE_HTML ;
    }</pre>
			<pre>    if (cursor.Equiv("&lt;!DOCTYPE "))
    {
        //  Move past the 10 characters of the declaration opening to the type named by it
        cursor += 10 ;</pre>
			<pre>        if (cursor.Equiv("html"))
        {
            return DOCTYPE_HTML ;
        }
        if (cursor.Equiv("xml"))
        {
            return DOCTYPE_XML ;
        }
    }</pre>
			<pre>    if (cursor.Equiv("&lt;?xml"))
    {
        return DOCTYPE_XML ;
    }</pre>
			<pre>    return DOCTYPE_UNDEFINED ;
}</pre>