/* * $LynxId: HTML.c,v 1.192 2018/04/01 23:26:24 tom Exp $ * * Structured stream to Rich hypertext converter * ============================================ * * This generates a hypertext object. It converts from the * structured stream interface of HTML events into the style- * oriented interface of the HText.h interface. This module is * only used in clients and should not be linked into servers. * * Override this module if making a new GUI browser. * * Being Overidden * */ #define HTSTREAM_INTERNAL 1 #include #define Lynx_HTML_Handler #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #ifdef VMS #include #endif /* VMS */ #ifdef USE_PRETTYSRC #include #endif #ifdef USE_COLOR_STYLE #include #include #include #include #undef SELECTED_STYLES #define pHText_changeStyle(X,Y,Z) {} #endif /* USE_COLOR_STYLE */ #ifdef USE_SOURCE_CACHE #include #endif #include #include #include #include #define STACKLEVEL(me) ((me->stack + MAX_NESTING - 1) - me->sp) #define DFT_TEXTAREA_COLS 60 #define DFT_TEXTAREA_ROWS 4 #define MAX_TEXTAREA_COLS LYcolLimit #define MAX_TEXTAREA_ROWS (3 * LYlines) #define LimitValue(name, value) \ if (name > value) { \ CTRACE((tfp, "Limited " #name " to %d, was %d\n", \ value, name)); \ name = value; \ } struct _HTStream { const HTStreamClass *isa; #ifdef USE_SOURCE_CACHE HTParentAnchor *anchor; FILE *fp; char *filename; HTChunk *chunk; HTChunk *last_chunk; /* the last chunk in a chain! */ const HTStreamClass *actions; HTStream *target; int status; #else /* .... */ #endif }; static HTStyleSheet *styleSheet = NULL; /* Application-wide */ /* Module-wide style cache */ static HTStyle *styles[HTML_ELEMENTS + LYNX_HTML_EXTRA_ELEMENTS]; /* adding 24 nested list styles */ /* and 3 header alignment styles */ /* and 3 div alignment styles */ static HTStyle *default_style = NULL; const char *LYToolbarName = "LynxPseudoToolbar"; /* used to turn off a style if the HTML author forgot to static int i_prior_style = -1; */ /* * Private function.... */ static int HTML_end_element(HTStructured * me, int element_number, char **include); static int HTML_start_element(HTStructured * me, int element_number, const BOOL *present, STRING2PTR value, int tag_charset, char **include); /* * If we have verbose_img set, display labels for images. */ #define VERBOSE_IMG(value,src_type,string) \ ((verbose_img) ? (newtitle = MakeNewTitle(value,src_type)): string) static char *MakeNewTitle(STRING2PTR value, int src_type); static char *MakeNewImageValue(STRING2PTR value); static char *MakeNewMapValue(STRING2PTR value, const char *mapstr); /* Set an internal flag that the next call to a stack-affecting method * is only internal and the stack manipulation should be skipped. - kw */ #define SET_SKIP_STACK(el_num) if (HTML_dtd.tags[el_num].contents != SGML_EMPTY) \ { me->skip_stack++; } void strtolower(char *i) { if (!i) return; while (*i) { *i = (char) TOLOWER(*i); i++; } } /* Flattening the style structure * ------------------------------ * * On the NeXT, and on any read-only browser, it is simpler for the text to * have a sequence of styles, rather than a nested tree of styles. In this * case we have to flatten the structure as it arrives from SGML tags into a * sequence of styles. */ /* * If style really needs to be set, call this. */ void actually_set_style(HTStructured * me) { if (!me->text) { /* First time through */ LYGetChartransInfo(me); UCSetTransParams(&me->T, me->UCLYhndl, me->UCI, HTAnchor_getUCLYhndl(me->node_anchor, UCT_STAGE_HTEXT), HTAnchor_getUCInfoStage(me->node_anchor, UCT_STAGE_HTEXT)); me->text = HText_new2(me->node_anchor, me->target); HText_beginAppend(me->text); HText_setStyle(me->text, me->new_style); me->in_word = NO; LYCheckForContentBase(me); } else { HText_setStyle(me->text, me->new_style); } me->old_style = me->new_style; me->style_change = NO; } /* * If you THINK you need to change style, call this. */ static void change_paragraph_style(HTStructured * me, HTStyle *style) { if (me->new_style != style) { me->style_change = YES; me->new_style = style; } me->in_word = NO; } /* * Return true if we should write a message (to LYNXMESSAGES, or the trace * file) telling about some bad HTML that we've found. */ BOOL LYBadHTML(HTStructured * me) { BOOL code = FALSE; switch ((enumBadHtml) cfg_bad_html) { case BAD_HTML_IGNORE: break; case BAD_HTML_TRACE: code = TRUE; break; case BAD_HTML_MESSAGE: code = TRUE; break; case BAD_HTML_WARN: /* * If we're already tracing, do not add a warning. */ if (!TRACE && !me->inBadHTML) { HTUserMsg(BAD_HTML_USE_TRACE); me->inBadHTML = TRUE; } code = TRACE; break; } return code; } /* * Handle the formatted message. */ void LYShowBadHTML(const char *message) { if (dump_output_immediately && dump_to_stderr) fprintf(stderr, "%s", message); switch ((enumBadHtml) cfg_bad_html) { case BAD_HTML_IGNORE: break; case BAD_HTML_TRACE: case BAD_HTML_MESSAGE: case BAD_HTML_WARN: CTRACE((tfp, "%s", message)); break; } switch ((enumBadHtml) cfg_bad_html) { case BAD_HTML_IGNORE: case BAD_HTML_TRACE: case BAD_HTML_WARN: break; case BAD_HTML_MESSAGE: LYstore_message(message); break; } } /*_________________________________________________________________________ * * A C T I O N R O U T I N E S */ /* FIXME: this should be amended to do the substitution only when not in a * multibyte stream. */ #ifdef EXP_JAPANESE_SPACES #define FIX_JAPANESE_SPACES \ (HTCJK == CHINESE || HTCJK == JAPANESE || HTCJK == TAIPEI) /* don't replace '\n' with ' ' if Chinese or Japanese - HN */ #else #define FIX_JAPANESE_SPACES 0 #endif /* Character handling * ------------------ */ void HTML_put_character(HTStructured * me, int c) { unsigned uc = UCH(c); /* * Ignore all non-MAP content when just scanning a document for MAPs. - FM */ if (LYMapsOnly && me->sp[0].tag_number != HTML_OBJECT) return; c = (int) uc; /* * Do EOL conversion if needed. - FM * * Convert EOL styles: * macintosh: cr --> lf * ascii: cr-lf --> lf * unix: lf --> lf */ if ((me->lastraw == '\r') && c == '\n') { me->lastraw = -1; return; } me->lastraw = c; if (c == '\r') { c = '\n'; uc = UCH(c); } /* * Handle SGML_LITTERAL tags that have HTChunk elements. - FM */ switch (me->sp[0].tag_number) { case HTML_COMMENT: return; /* Do Nothing */ case HTML_TITLE: if (c == LY_SOFT_HYPHEN) return; if (c != '\n' && c != '\t' && c != '\r') { HTChunkPutc(&me->title, uc); } else if (FIX_JAPANESE_SPACES) { if (c == '\t') { HTChunkPutc(&me->title, ' '); } else { return; } } else { HTChunkPutc(&me->title, ' '); } return; case HTML_STYLE: HTChunkPutc(&me->style_block, uc); return; case HTML_SCRIPT: HTChunkPutc(&me->script, uc); return; case HTML_OBJECT: HTChunkPutc(&me->object, uc); return; case HTML_TEXTAREA: HTChunkPutc(&me->textarea, uc); return; case HTML_SELECT: case HTML_OPTION: HTChunkPutc(&me->option, uc); return; case HTML_MATH: HTChunkPutc(&me->math, uc); return; default: if (me->inSELECT) { /* * If we are within a SELECT not caught by the cases above - * HTML_SELECT or HTML_OPTION may not be the last element pushed on * the style stack if there were invalid markup tags within a * SELECT element. For error recovery, treat text as part of the * OPTION text, it is probably meant to show up as user-visible * text. Having A as an open element while in SELECT is really * sick, don't make anchor text part of the option text in that * case since the option text will probably just be discarded. - * kw */ if (me->sp[0].tag_number == HTML_A) break; HTChunkPutc(&me->option, uc); return; } break; } /* end first switch */ /* * Handle all other tag content. - FM */ switch (me->sp[0].tag_number) { case HTML_PRE: /* Formatted text */ /* * We guarantee that the style is up-to-date in begin_litteral. But we * still want to strip \r's. */ if (c != '\r' && !(c == '\n' && me->inLABEL && !me->inP) && !(c == '\n' && !me->inPRE)) { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, c); } me->inPRE = TRUE; break; case HTML_LISTING: /* Literal text */ case HTML_XMP: case HTML_PLAINTEXT: /* * We guarantee that the style is up-to-date in begin_litteral. But we * still want to strip \r's. */ if (c != '\r') { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, c); } break; default: /* * Free format text. */ if (me->sp->style->id == ST_Preformatted) { if (c != '\r' && !(c == '\n' && me->inLABEL && !me->inP) && !(c == '\n' && !me->inPRE)) { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, c); } me->inPRE = TRUE; } else if (me->sp->style->id == ST_Listing || me->sp->style->id == ST_Example) { if (c != '\r') { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, c); } } else { if (me->style_change) { if ((c == '\n') || (c == ' ')) return; /* Ignore it */ UPDATE_STYLE; } if (c == '\n') { if (!FIX_JAPANESE_SPACES) { if (me->in_word) { if (HText_getLastChar(me->text) != ' ') { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, ' '); } me->in_word = NO; } } } else if (c == ' ' || c == '\t') { if (HText_getLastChar(me->text) != ' ') { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, ' '); } } else if (c == '\r') { /* ignore */ } else { me->inP = TRUE; me->inLABEL = FALSE; HText_appendCharacter(me->text, c); me->in_word = YES; } } } /* end second switch */ if (c == '\n' || c == '\t') { HText_setLastChar(me->text, ' '); /* set it to a generic separator */ } else { HText_setLastChar(me->text, c); } } /* String handling * --------------- * * This is written separately from put_character because the loop can * in some cases be promoted to a higher function call level for speed. */ void HTML_put_string(HTStructured * me, const char *s) { HTChunk *target = NULL; #ifdef USE_PRETTYSRC char *translated_string = NULL; #endif if (s == NULL || (LYMapsOnly && me->sp[0].tag_number != HTML_OBJECT)) return; #ifdef USE_PRETTYSRC if (psrc_convert_string) { StrAllocCopy(translated_string, s); TRANSLATE_AND_UNESCAPE_ENTITIES(&translated_string, TRUE, FALSE); s = (const char *) translated_string; } #endif switch (me->sp[0].tag_number) { case HTML_COMMENT: break; /* Do Nothing */ case HTML_TITLE: target = &me->title; break; case HTML_STYLE: target = &me->style_block; break; case HTML_SCRIPT: target = &me->script; break; case HTML_PRE: /* Formatted text */ case HTML_LISTING: /* Literal text */ case HTML_XMP: case HTML_PLAINTEXT: /* * We guarantee that the style is up-to-date in begin_litteral */ HText_appendText(me->text, s); break; case HTML_OBJECT: target = &me->object; break; case HTML_TEXTAREA: target = &me->textarea; break; case HTML_SELECT: case HTML_OPTION: target = &me->option; break; case HTML_MATH: target = &me->math; break; default: /* Free format text? */ if (!me->sp->style->freeFormat) { /* * If we are within a preformatted text style not caught by the * cases above (HTML_PRE or similar may not be the last element * pushed on the style stack). - kw */ #ifdef USE_PRETTYSRC if (psrc_view) { /* * We do this so that a raw '\r' in the string will not be * interpreted as an internal request to break a line - passing * '\r' to HText_appendText is treated by it as a request to * insert a blank line - VH */ for (; *s; ++s) HTML_put_character(me, *s); } else #endif HText_appendText(me->text, s); break; } else { const char *p = s; char c; if (me->style_change) { for (; *p && ((*p == '\n') || (*p == '\r') || (*p == ' ') || (*p == '\t')); p++) ; /* Ignore leaders */ if (!*p) break; UPDATE_STYLE; } for (; *p; p++) { if (*p == 13 && p[1] != 10) { /* * Treat any '\r' which is not followed by '\n' as '\n', to * account for macintosh lineend in ALT attributes etc. - * kw */ c = '\n'; } else { c = *p; } if (me->style_change) { if ((c == '\n') || (c == ' ') || (c == '\t')) continue; /* Ignore it */ UPDATE_STYLE; } if (c == '\n') { if (!FIX_JAPANESE_SPACES) { if (me->in_word) { if (HText_getLastChar(me->text) != ' ') HText_appendCharacter(me->text, ' '); me->in_word = NO; } } } else if (c == ' ' || c == '\t') { if (HText_getLastChar(me->text) != ' ') HText_appendCharacter(me->text, ' '); } else if (c == '\r') { /* ignore */ } else { HText_appendCharacter(me->text, c); me->in_word = YES; } /* set the Last Character */ if (c == '\n' || c == '\t') { /* set it to a generic separator */ HText_setLastChar(me->text, ' '); } else if (c == '\r' && HText_getLastChar(me->text) == ' ') { /* * \r's are ignored. In order to keep collapsing spaces * correctly, we must default back to the previous * separator, if there was one. So we set LastChar to a * generic separator. */ HText_setLastChar(me->text, ' '); } else { HText_setLastChar(me->text, c); } } /* for */ } } /* end switch */ if (target != NULL) { if (target->data == s) { CTRACE((tfp, "BUG: appending chunk to itself: `%.*s'\n", target->size, target->data)); } else { HTChunkPuts(target, s); } } #ifdef USE_PRETTYSRC if (psrc_convert_string) { psrc_convert_string = FALSE; FREE(translated_string); } #endif } /* Buffer write * ------------ */ void HTML_write(HTStructured * me, const char *s, int l) { const char *p; const char *e = s + l; if (LYMapsOnly && me->sp[0].tag_number != HTML_OBJECT) return; for (p = s; p < e; p++) HTML_put_character(me, *p); } /* * "Internal links" are hyperlinks whose source and destination are * within the same document, and for which the destination is given * as a URL Reference with an empty URL, but possibly with a non-empty * #fragment. (This terminology re URL-Reference vs. URL follows the * Fielding URL syntax and semantics drafts). * Differences: * (1) The document's base (in whatever way it is given) is not used for * resolving internal link references. * (2) Activating an internal link should not result in a new retrieval * of a copy of the document. * (3) Internal links are the only way to refer with a hyperlink to a document * (or a location in it) which is only known as the result of a POST * request (doesn't have a URL from which the document can be retrieved * with GET), and can only be used from within that document. * * *If track_internal_links is true, we keep track of whether a * link destination was given as an internal link. This information is * recorded in the type of the link between anchor objects, and is available * to the HText object and the mainloop from there. URL References to * internal destinations are still resolved into an absolute form before * being passed on, but using the current stream's retrieval address instead * of the base URL. * Examples: (replace [...] to have a valid absolute URL) * In document retrieved from [...]/mypath/mydoc.htm w/ base [...]/otherpath/ * a. HREF="[...]/mypath/mydoc.htm" -> [...]/mypath/mydoc.htm * b. HREF="[...]/mypath/mydoc.htm#frag" -> [...]/mypath/mydoc.htm#frag * c. HREF="mydoc.htm" -> [...]/otherpath/mydoc.htm * d. HREF="mydoc.htm#frag" -> [...]/otherpath/mydoc.htm#frag * e. HREF="" -> [...]/mypath/mydoc.htm (marked internal) * f. HREF="#frag" -> [...]/mypath/mydoc.htm#frag (marked internal) * * *If track_internal_links is false, URL-less URL-References are * resolved differently from URL-References with a non-empty URL (using the * current stream's retrieval address instead of the base), but we make no * further distinction. Resolution is then as in the examples above, execept * that there is no "(marked internal)". * * *Note that this doesn't apply to form ACTIONs (always resolved using base, * never marked internal). Also other references encountered or generated * are not marked internal, whether they have a URL or not, if in a given * context an internal link makes no sense (e.g., IMG SRC=). */ /* A flag is used to keep track of whether an "URL reference" encountered had a real "URL" or not. In the latter case, it will be marked as "internal". The flag is set before we start messing around with the string (resolution of relative URLs etc.). This variable only used locally here, don't confuse with LYinternal_flag which is for overriding non-caching similar to LYoverride_no_cache. - kw */ #define CHECK_FOR_INTERN(flag,s) \ flag = (BOOLEAN) (((s) && (*(s)=='#' || *(s)=='\0')) ? TRUE : FALSE) /* Last argument to pass to HTAnchor_findChildAndLink() calls, just an abbreviation. - kw */ #define INTERN_CHK(flag) (HTLinkType *)((flag) ? HTInternalLink : NULL) #define INTERN_LT INTERN_CHK(intern_flag) #ifdef USE_COLOR_STYLE static char *Style_className = 0; static char *Style_className_end = 0; static size_t Style_className_len = 0; static int hcode; #ifdef LY_FIND_LEAKS static void free_Style_className(void) { FREE(Style_className); } #endif static void addClassName(const char *prefix, const char *actual, size_t length) { size_t offset = strlen(prefix); size_t have = (unsigned) (Style_className_end - Style_className); size_t need = (offset + length + 1); if ((have + need) >= Style_className_len) { Style_className_len += 1024 + 2 * (have + need); if (Style_className == 0) { Style_className = typeMallocn(char, Style_className_len); } else { Style_className = typeRealloc(char, Style_className, Style_className_len); } if (Style_className == NULL) outofmem(__FILE__, "addClassName"); Style_className_end = Style_className + have; } if (offset) strcpy(Style_className_end, prefix); if (length) memcpy(Style_className_end + offset, actual, length); Style_className_end[offset + length] = '\0'; strtolower(Style_className_end); Style_className_end += (offset + length); } #else #define addClassName(prefix, actual, length) /* nothing */ #endif static void LYStartArea(HTStructured * obj, const char *href, const char *alt, const char *title, int tag_charset) { BOOL new_present[HTML_AREA_ATTRIBUTES]; const char *new_value[HTML_AREA_ATTRIBUTES]; int i; for (i = 0; i < HTML_AREA_ATTRIBUTES; i++) new_present[i] = NO; if (alt) { new_present[HTML_AREA_ALT] = YES; new_value[HTML_AREA_ALT] = (const char *) alt; } if (non_empty(title)) { new_present[HTML_AREA_TITLE] = YES; new_value[HTML_AREA_TITLE] = (const char *) title; } if (href) { new_present[HTML_AREA_HREF] = YES; new_value[HTML_AREA_HREF] = (const char *) href; } (*obj->isa->start_element) (obj, HTML_AREA, new_present, new_value, tag_charset, 0); } static void LYHandleFIG(HTStructured * me, const BOOL *present, STRING2PTR value, int isobject, int imagemap, const char *id, const char *src, int convert, int start, BOOL *intern_flag GCC_UNUSED) { if (start == TRUE) { me->inFIG = TRUE; if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, NULL); } if (!isobject) { LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); me->inFIGwithP = TRUE; } else { me->inFIGwithP = FALSE; HTML_put_character(me, ' '); /* space char may be ignored */ } if (non_empty(id)) { if (present && convert) { CHECK_ID(HTML_FIG_ID); } else LYHandleID(me, id); } me->in_word = NO; me->inP = FALSE; if (clickable_images && non_empty(src)) { char *href = NULL; StrAllocCopy(href, src); CHECK_FOR_INTERN(*intern_flag, href); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (*href) { me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ INTERN_CHK(*intern_flag)); /* Type */ HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, (isobject ? (imagemap ? "(IMAGE)" : "(OBJECT)") : "[FIGURE]")); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, 0); HTML_put_character(me, '-'); HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } FREE(href); } } else { /* handle end tag */ if (me->inFIGwithP) { LYEnsureDoubleSpace(me); } else { HTML_put_character(me, ' '); /* space char may be ignored */ } LYResetParagraphAlignment(me); me->inFIGwithP = FALSE; me->inFIG = FALSE; change_paragraph_style(me, me->sp->style); /* Often won't really change */ if (me->List_Nesting_Level >= 0) { UPDATE_STYLE; HText_NegateLineOne(me->text); } } } static void clear_objectdata(HTStructured * me) { if (me) { HTChunkClear(&me->object); me->object_started = FALSE; me->object_declare = FALSE; me->object_shapes = FALSE; me->object_ismap = FALSE; FREE(me->object_usemap); FREE(me->object_id); FREE(me->object_title); FREE(me->object_data); FREE(me->object_type); FREE(me->object_classid); FREE(me->object_codebase); FREE(me->object_codetype); FREE(me->object_name); } } #define HTParseALL(pp,pconst) \ { char* free_me = *pp; \ *pp = HTParse(*pp, pconst, PARSE_ALL); \ FREE(free_me); \ } /* Start Element * ------------- */ static int HTML_start_element(HTStructured * me, int element_number, const BOOL *present, STRING2PTR value, int tag_charset, char **include) { char *alt_string = NULL; char *id_string = NULL; char *newtitle = NULL; char **pdoctitle = NULL; char *href = NULL; char *map_href = NULL; char *title = NULL; char *I_value = NULL; char *I_name = NULL; char *temp = NULL; const char *Base = NULL; int dest_char_set = -1; HTParentAnchor *dest = NULL; /* An anchor's destination */ BOOL dest_ismap = FALSE; /* Is dest an image map script? */ HTChildAnchor *ID_A = NULL; /* HTML_foo_ID anchor */ int url_type = 0, i = 0; char *cp = NULL; HTMLElement ElementNumber = (HTMLElement) element_number; BOOL intern_flag = FALSE; short stbl_align = HT_ALIGN_NONE; int status = HT_OK; #ifdef USE_COLOR_STYLE const char *class_name; const char *prefix_string; BOOL class_used = FALSE; #endif if (LYMapsOnly) { if (!(ElementNumber == HTML_MAP || ElementNumber == HTML_AREA || ElementNumber == HTML_BASE || ElementNumber == HTML_OBJECT || ElementNumber == HTML_A)) { return HT_OK; } } else if (!me->text) { UPDATE_STYLE; } { /* me->tag_charset is charset for attribute values. */ int j = ((tag_charset < 0) ? me->UCLYhndl : tag_charset); if ((me->tag_charset != j) || (j < 0 /* for trace entry */ )) { CTRACE((tfp, "me->tag_charset: %d -> %d", me->tag_charset, j)); CTRACE((tfp, " (me->UCLYhndl: %d, tag_charset: %d)\n", me->UCLYhndl, tag_charset)); me->tag_charset = j; } } /* this should be done differently */ #if defined(USE_COLOR_STYLE) addClassName(";", HTML_dtd.tags[element_number].name, (size_t) HTML_dtd.tags[element_number].name_len); class_name = (force_classname ? forced_classname : class_string); force_classname = FALSE; if (force_current_tag_style == FALSE) { current_tag_style = (non_empty(class_name) ? -1 : cached_tag_styles[element_number]); } else { force_current_tag_style = FALSE; } CTRACE2(TRACE_STYLE, (tfp, "CSS.elt:<%s>\n", HTML_dtd.tags[element_number].name)); prefix_string = ""; if (current_tag_style == -1) { /* Append class_name */ hcode = color_style_1(HTML_dtd.tags[element_number].name); if (non_empty(class_name)) { int ohcode = hcode; prefix_string = HTML_dtd.tags[element_number].name; hcode = color_style_3(prefix_string, ".", class_name); if (!hashStyles[hcode].used) { /* None such -> classless version */ hcode = ohcode; prefix_string = ""; CTRACE2(TRACE_STYLE, (tfp, "STYLE.start_element: <%s> (class <%s> not configured), hcode=%d.\n", HTML_dtd.tags[element_number].name, class_name, hcode)); } else { addClassName(".", class_name, strlen(class_name)); CTRACE2(TRACE_STYLE, (tfp, "STYLE.start_element: <%s>.<%s>, hcode=%d.\n", prefix_string, class_name, hcode)); class_used = TRUE; } } class_string[0] = '\0'; } else { /* (current_tag_style!=-1) */ if (non_empty(class_name)) { addClassName(".", class_name, strlen(class_name)); class_string[0] = '\0'; } hcode = current_tag_style; if (hcode >= 0 && hashStyles[hcode].used) { prefix_string = hashStyles[hcode].name; } CTRACE2(TRACE_STYLE, (tfp, "STYLE.start_element: <%s>, hcode=%d.\n", HTML_dtd.tags[element_number].name, hcode)); current_tag_style = -1; } if (!class_used && ElementNumber == HTML_INPUT) { /* For some other too? */ const char *type = ""; int ohcode = hcode; if (present && present[HTML_INPUT_TYPE] && value[HTML_INPUT_TYPE]) type = value[HTML_INPUT_TYPE]; hcode = color_style_3(prefix_string, ".type.", type); if (!hashStyles[hcode].used) { /* None such -> classless version */ hcode = ohcode; CTRACE2(TRACE_STYLE, (tfp, "STYLE.start_element: type <%s> not configured.\n", type)); } else { addClassName(".type.", type, strlen(type)); CTRACE2(TRACE_STYLE, (tfp, "STYLE.start_element: <%s>.type.<%s>, hcode=%d.\n", HTML_dtd.tags[element_number].name, type, hcode)); } } HText_characterStyle(me->text, hcode, STACK_ON); #endif /* USE_COLOR_STYLE */ /* * Handle the start tag. - FM */ switch (ElementNumber) { case HTML_HTML: break; case HTML_HEAD: break; case HTML_BASE: if (present && present[HTML_BASE_HREF] && !local_host_only && non_empty(value[HTML_BASE_HREF])) { char *base = NULL; const char *related = NULL; StrAllocCopy(base, value[HTML_BASE_HREF]); CTRACE((tfp, "*HTML_BASE: initial href=`%s'\n", NonNull(base))); if (!(url_type = LYLegitimizeHREF(me, &base, TRUE, TRUE))) { CTRACE((tfp, "HTML: BASE '%s' is not an absolute URL.\n", NonNull(base))); if (me->inBadBASE == FALSE) HTAlert(BASE_NOT_ABSOLUTE); me->inBadBASE = TRUE; } if (url_type == LYNXIMGMAP_URL_TYPE) { /* * These have a non-standard form, basically strip the prefix * or the code below would insert a nonsense host into the * pseudo URL. These should never occur where they would be * used for resolution of relative URLs anyway. We can also * strip the #map part. - kw */ temp = base; base = HTParse(base + 11, "", PARSE_ALL_WITHOUT_ANCHOR); FREE(temp); } /* * Get parent's address for defaulted fields. */ related = me->node_anchor->address; /* * Create the access field. */ temp = HTParse(base, related, PARSE_ACCESS + PARSE_PUNCTUATION); StrAllocCopy(me->base_href, temp); FREE(temp); /* * Create the host[:port] field. */ temp = HTParse(base, "", PARSE_HOST + PARSE_PUNCTUATION); if (!StrNCmp(temp, "//", 2)) { StrAllocCat(me->base_href, temp); if (!strcmp(me->base_href, "file://")) { StrAllocCat(me->base_href, "localhost"); } } else { if (isFILE_URL(me->base_href)) { StrAllocCat(me->base_href, "//localhost"); } else if (strcmp(me->base_href, STR_NEWS_URL)) { FREE(temp); StrAllocCat(me->base_href, (temp = HTParse(related, "", PARSE_HOST + PARSE_PUNCTUATION))); } } FREE(temp); /* * Create the path field. */ temp = HTParse(base, "", PARSE_PATH + PARSE_PUNCTUATION); if (*temp != '\0') { char *p = StrChr(temp, '?'); if (p) *p = '\0'; p = strrchr(temp, '/'); if (p) *(p + 1) = '\0'; /* strip after the last slash */ StrAllocCat(me->base_href, temp); } else if (!strcmp(me->base_href, STR_NEWS_URL)) { StrAllocCat(me->base_href, "*"); } else if (isNEWS_URL(me->base_href) || isNNTP_URL(me->base_href) || isSNEWS_URL(me->base_href)) { StrAllocCat(me->base_href, "/*"); } else { StrAllocCat(me->base_href, "/"); } FREE(temp); FREE(base); me->inBASE = TRUE; me->node_anchor->inBASE = TRUE; StrAllocCopy(me->node_anchor->content_base, me->base_href); /* me->base_href is a valid URL */ CTRACE((tfp, "*HTML_BASE: final href=`%s'\n", me->base_href)); } break; case HTML_META: if (present) LYHandleMETA(me, present, value, include); break; case HTML_TITLE: HTChunkClear(&me->title); break; case HTML_LINK: intern_flag = FALSE; if (present && present[HTML_LINK_HREF]) { CHECK_FOR_INTERN(intern_flag, value[HTML_LINK_HREF]); /* * Prepare to do housekeeping on the reference. - FM */ if (isEmpty(value[HTML_LINK_HREF])) { Base = (me->inBASE) ? me->base_href : me->node_anchor->address; StrAllocCopy(href, Base); } else { StrAllocCopy(href, value[HTML_LINK_HREF]); (void) LYLegitimizeHREF(me, &href, TRUE, TRUE); Base = (me->inBASE && *href != '\0' && *href != '#') ? me->base_href : me->node_anchor->address; HTParseALL(&href, Base); } /* * Handle links with a REV attribute. - FM * Handle REV="made" or REV="owner". - LM & FM * Handle REL="author" -TD */ if (present && ((present[HTML_LINK_REV] && value[HTML_LINK_REV] && (!strcasecomp("made", value[HTML_LINK_REV]) || !strcasecomp("owner", value[HTML_LINK_REV]))) || (present[HTML_LINK_REL] && value[HTML_LINK_REL] && (!strcasecomp("author", value[HTML_LINK_REL]))))) { /* * Load the owner element. - FM */ HTAnchor_setOwner(me->node_anchor, href); CTRACE((tfp, "HTML: DOC OWNER '%s' found\n", href)); FREE(href); /* * Load the RevTitle element if a TITLE attribute and value * are present. - FM */ if (present && present[HTML_LINK_TITLE] && value[HTML_LINK_TITLE] && *value[HTML_LINK_TITLE] != '\0') { StrAllocCopy(title, value[HTML_LINK_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); if (*title != '\0') HTAnchor_setRevTitle(me->node_anchor, title); FREE(title); } break; } /* * Handle REL links. - FM */ if (present && present[HTML_LINK_REL] && value[HTML_LINK_REL]) { /* * Ignore style sheets, for now. - FM * * lss and css have different syntax - lynx shouldn't try to * parse them now (it tries to parse them as lss, so it exits * with error message on the 1st non-empty line) - VH */ #ifndef USE_COLOR_STYLE if (!strcasecomp(value[HTML_LINK_REL], "StyleSheet") || !strcasecomp(value[HTML_LINK_REL], "Style")) { CTRACE2(TRACE_STYLE, (tfp, "HTML: StyleSheet link found.\n")); CTRACE2(TRACE_STYLE, (tfp, " StyleSheets not yet implemented.\n")); FREE(href); break; } #endif /* ! USE_COLOR_STYLE */ /* * Ignore anything not registered in the 28-Mar-95 IETF HTML * 3.0 draft and W3C HTML 3.2 draft, or not appropriate for * Lynx banner links in the expired Maloney and Quin relrev * draft. We'll make this more efficient when the situation * stabilizes, and for now, we'll treat "Banner" as another * toolbar element. - FM */ if (!strcasecomp(value[HTML_LINK_REL], "Home") || !strcasecomp(value[HTML_LINK_REL], "ToC") || !strcasecomp(value[HTML_LINK_REL], "Contents") || !strcasecomp(value[HTML_LINK_REL], "Index") || !strcasecomp(value[HTML_LINK_REL], "Glossary") || !strcasecomp(value[HTML_LINK_REL], "Copyright") || !strcasecomp(value[HTML_LINK_REL], "Help") || !strcasecomp(value[HTML_LINK_REL], "Search") || !strcasecomp(value[HTML_LINK_REL], "Bookmark") || !strcasecomp(value[HTML_LINK_REL], "Banner") || !strcasecomp(value[HTML_LINK_REL], "Top") || !strcasecomp(value[HTML_LINK_REL], "Origin") || !strcasecomp(value[HTML_LINK_REL], "Navigator") || !strcasecomp(value[HTML_LINK_REL], "Disclaimer") || !strcasecomp(value[HTML_LINK_REL], "Author") || !strcasecomp(value[HTML_LINK_REL], "Editor") || !strcasecomp(value[HTML_LINK_REL], "Publisher") || !strcasecomp(value[HTML_LINK_REL], "Trademark") || !strcasecomp(value[HTML_LINK_REL], "Hotlist") || !strcasecomp(value[HTML_LINK_REL], "Begin") || !strcasecomp(value[HTML_LINK_REL], "First") || !strcasecomp(value[HTML_LINK_REL], "End") || !strcasecomp(value[HTML_LINK_REL], "Last") || !strcasecomp(value[HTML_LINK_REL], "Documentation") || !strcasecomp(value[HTML_LINK_REL], "Biblioentry") || !strcasecomp(value[HTML_LINK_REL], "Bibliography") || !strcasecomp(value[HTML_LINK_REL], "Start") || !strcasecomp(value[HTML_LINK_REL], "Appendix")) { StrAllocCopy(title, value[HTML_LINK_REL]); pdoctitle = &title; /* for setting HTAnchor's title */ } else if (!strcasecomp(value[HTML_LINK_REL], "Up") || !strcasecomp(value[HTML_LINK_REL], "Next") || !strcasecomp(value[HTML_LINK_REL], "Previous") || !strcasecomp(value[HTML_LINK_REL], "Prev") || !strcasecomp(value[HTML_LINK_REL], "Child") || !strcasecomp(value[HTML_LINK_REL], "Sibling") || !strcasecomp(value[HTML_LINK_REL], "Parent") || !strcasecomp(value[HTML_LINK_REL], "Meta") || !strcasecomp(value[HTML_LINK_REL], "URC") || !strcasecomp(value[HTML_LINK_REL], "Pointer") || !strcasecomp(value[HTML_LINK_REL], "Translation") || !strcasecomp(value[HTML_LINK_REL], "Definition") || !strcasecomp(value[HTML_LINK_REL], "Alternate") || !strcasecomp(value[HTML_LINK_REL], "Section") || !strcasecomp(value[HTML_LINK_REL], "Subsection") || !strcasecomp(value[HTML_LINK_REL], "Chapter")) { StrAllocCopy(title, value[HTML_LINK_REL]); /* not setting target HTAnchor's title, for these links of highly relative character. Instead, try to remember the REL attribute as a property of the link (but not the destination), in the (otherwise underused) link type in a special format; the LIST page generation code may later use it. - kw */ if (!intern_flag) { StrAllocCopy(temp, "RelTitle: "); StrAllocCat(temp, value[HTML_LINK_REL]); } #ifndef DISABLE_BIBP } else if (!strcasecomp(value[HTML_LINK_REL], "citehost")) { /* Citehost determination for bibp links. - RDC */ HTAnchor_setCitehost(me->node_anchor, href); CTRACE((tfp, "HTML: citehost '%s' found\n", href)); FREE(href); break; #endif } else { CTRACE((tfp, "HTML: LINK with REL=\"%s\" ignored.\n", value[HTML_LINK_REL])); FREE(href); break; } } } else if (present && present[HTML_LINK_REL] && value[HTML_LINK_REL]) { /* * If no HREF was specified, handle special REL links with * self-designated HREFs. - FM */ if (!strcasecomp(value[HTML_LINK_REL], "Home")) { StrAllocCopy(href, LynxHome); } else if (!strcasecomp(value[HTML_LINK_REL], "Help")) { StrAllocCopy(href, helpfile); } else if (!strcasecomp(value[HTML_LINK_REL], "Index")) { StrAllocCopy(href, indexfile); } else { CTRACE((tfp, "HTML: LINK with REL=\"%s\" and no HREF ignored.\n", value[HTML_LINK_REL])); break; } StrAllocCopy(title, value[HTML_LINK_REL]); pdoctitle = &title; } if (href) { /* * Create a title (link name) from the TITLE value, if present, or * default to the REL value that was loaded into title. - FM */ if (present && present[HTML_LINK_TITLE] && non_empty(value[HTML_LINK_TITLE])) { StrAllocCopy(title, value[HTML_LINK_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); pdoctitle = &title; FREE(temp); /* forget about recording RelTitle - kw */ } if (isEmpty(title)) { FREE(href); FREE(title); break; } if (me->inA) { /* * Ugh! The LINK tag, which is a HEAD element, is in an * Anchor, which is BODY element. All we can do is close the * Anchor and cross our fingers. - FM */ SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } /* * Create anchors for the links that simulate a toolbar. - FM */ me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (temp ? (HTLinkType *) HTAtom_for(temp) : INTERN_LT)); /* Type */ FREE(temp); if ((dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) )) != NULL) { if (pdoctitle && !HTAnchor_title(dest)) HTAnchor_setTitle(dest, *pdoctitle); /* Don't allow CHARSET attribute to change *this* document's charset assumption. - kw */ if (dest == me->node_anchor) dest = NULL; if (present[HTML_LINK_CHARSET] && non_empty(value[HTML_LINK_CHARSET])) { dest_char_set = UCGetLYhndl_byMIME(value[HTML_LINK_CHARSET]); if (dest_char_set < 0) dest_char_set = UCLYhndl_for_unrec; } if (dest && dest_char_set >= 0) HTAnchor_setUCInfoStage(dest, dest_char_set, UCT_STAGE_PARSER, UCT_SETBY_LINK); } UPDATE_STYLE; if (!HText_hasToolbar(me->text) && (ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ LYToolbarName, /* Tag */ NULL, /* Addresss */ (HTLinkType *) 0))) { /* Type */ HText_appendCharacter(me->text, '#'); HText_setLastChar(me->text, ' '); /* absorb white space */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); HText_setToolbar(me->text); } else { /* * Add collapsible space to separate link from previous * generated links. - kw */ HTML_put_character(me, ' '); } HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); #ifdef USE_COLOR_STYLE if (present && present[HTML_LINK_CLASS] && non_empty(value[HTML_LINK_CLASS])) { char *tmp = 0; int hcode2; HTSprintf0(&tmp, "link.%s.%s", value[HTML_LINK_CLASS], title); hcode2 = color_style_1(tmp); CTRACE2(TRACE_STYLE, (tfp, "STYLE.link: using style <%s>\n", tmp)); HText_characterStyle(me->text, hcode2, STACK_ON); HTML_put_string(me, title); HTML_put_string(me, " ("); HTML_put_string(me, value[HTML_LINK_CLASS]); HTML_put_string(me, ")"); HText_characterStyle(me->text, hcode2, STACK_OFF); FREE(tmp); } else #endif HTML_put_string(me, title); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, 0); } FREE(href); FREE(title); break; case HTML_ISINDEX: if (((present)) && ((present[HTML_ISINDEX_HREF] && value[HTML_ISINDEX_HREF]) || (present[HTML_ISINDEX_ACTION] && value[HTML_ISINDEX_ACTION]))) { /* * Lynx was supporting ACTION, which never made it into the HTML * 2.0 specs. HTML 3.0 uses HREF, so we'll use that too, but allow * use of ACTION as an alternate until people have fully switched * over. - FM */ if (present[HTML_ISINDEX_HREF] && value[HTML_ISINDEX_HREF]) StrAllocCopy(href, value[HTML_ISINDEX_HREF]); else StrAllocCopy(href, value[HTML_ISINDEX_ACTION]); LYLegitimizeHREF(me, &href, TRUE, TRUE); Base = (me->inBASE && *href != '\0' && *href != '#') ? me->base_href : me->node_anchor->address; HTParseALL(&href, Base); HTAnchor_setIndex(me->node_anchor, href); FREE(href); } else { Base = (me->inBASE) ? me->base_href : me->node_anchor->address; HTAnchor_setIndex(me->node_anchor, Base); } /* * Support HTML 3.0 PROMPT attribute. - FM */ if (present && present[HTML_ISINDEX_PROMPT] && non_empty(value[HTML_ISINDEX_PROMPT])) { StrAllocCopy(temp, value[HTML_ISINDEX_PROMPT]); TRANSLATE_AND_UNESCAPE_ENTITIES(&temp, TRUE, FALSE); LYTrimHead(temp); LYTrimTail(temp); if (*temp != '\0') { StrAllocCat(temp, " "); HTAnchor_setPrompt(me->node_anchor, temp); } else { HTAnchor_setPrompt(me->node_anchor, ENTER_DATABASE_QUERY); } FREE(temp); } else { HTAnchor_setPrompt(me->node_anchor, ENTER_DATABASE_QUERY); } break; case HTML_NEXTID: break; case HTML_STYLE: /* * We're getting it as Literal text, which, for now, we'll just ignore. * - FM */ HTChunkClear(&me->style_block); break; case HTML_SCRIPT: /* * We're getting it as Literal text, which, for now, we'll just ignore. * - FM */ HTChunkClear(&me->script); break; case HTML_BODY: CHECK_ID(HTML_BODY_ID); if (HText_hasToolbar(me->text)) HText_appendParagraph(me->text); break; case HTML_SECTION: case HTML_ARTICLE: case HTML_MAIN: case HTML_ASIDE: case HTML_HEADER: case HTML_FOOTER: case HTML_NAV: CHECK_ID(HTML_GEN5_ID); if (HText_hasToolbar(me->text)) HText_appendParagraph(me->text); break; case HTML_FIGURE: CHECK_ID(HTML_GEN5_ID); break; case HTML_FRAMESET: break; case HTML_FRAME: if (present && present[HTML_FRAME_NAME] && non_empty(value[HTML_FRAME_NAME])) { StrAllocCopy(id_string, value[HTML_FRAME_NAME]); TRANSLATE_AND_UNESCAPE_ENTITIES(&id_string, TRUE, FALSE); LYTrimHead(id_string); LYTrimTail(id_string); } if (present && present[HTML_FRAME_SRC] && non_empty(value[HTML_FRAME_SRC])) { StrAllocCopy(href, value[HTML_FRAME_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ CAN_JUSTIFY_PUSH(FALSE); LYEnsureSingleSpace(me); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "FRAME:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; CHECK_ID(HTML_FRAME_ID); HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, (id_string ? id_string : href)); FREE(href); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, 0); LYEnsureSingleSpace(me); CAN_JUSTIFY_POP; } else { CHECK_ID(HTML_FRAME_ID); } FREE(id_string); break; case HTML_NOFRAMES: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); break; case HTML_IFRAME: if (present && present[HTML_IFRAME_NAME] && non_empty(value[HTML_IFRAME_NAME])) { StrAllocCopy(id_string, value[HTML_IFRAME_NAME]); TRANSLATE_AND_UNESCAPE_ENTITIES(&id_string, TRUE, FALSE); LYTrimHead(id_string); LYTrimTail(id_string); } if (present && present[HTML_IFRAME_SRC] && non_empty(value[HTML_IFRAME_SRC])) { StrAllocCopy(href, value[HTML_IFRAME_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (me->inA) HTML_end_element(me, HTML_A, include); me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ LYEnsureDoubleSpace(me); CAN_JUSTIFY_PUSH_F LYResetParagraphAlignment(me); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "IFRAME:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; CHECK_ID(HTML_IFRAME_ID); HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, (id_string ? id_string : href)); FREE(href); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, 0); LYEnsureSingleSpace(me); CAN_JUSTIFY_POP; } else { CHECK_ID(HTML_IFRAME_ID); } FREE(id_string); break; case HTML_BANNER: case HTML_MARQUEE: change_paragraph_style(me, styles[HTML_BANNER]); UPDATE_STYLE; if (me->sp->tag_number == (int) ElementNumber) LYEnsureDoubleSpace(me); /* * Treat this as a toolbar if we don't have one yet, and we are in the * first half of the first page. - FM */ if ((!HText_hasToolbar(me->text) && HText_getLines(me->text) < (display_lines / 2)) && (ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ LYToolbarName, /* Tag */ NULL, /* Addresss */ (HTLinkType *) 0))) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); HText_setToolbar(me->text); } CHECK_ID(HTML_GEN_ID); break; case HTML_CENTER: case HTML_DIV: if (me->Division_Level < (MAX_NESTING - 1)) { me->Division_Level++; } else { CTRACE((tfp, "HTML: ****** Maximum nesting of %d divisions exceeded!\n", MAX_NESTING)); } if (me->inP) LYEnsureSingleSpace(me); /* always at least break line - kw */ if (ElementNumber == HTML_CENTER) { me->DivisionAlignments[me->Division_Level] = HT_CENTER; change_paragraph_style(me, styles[HTML_DCENTER]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DCENTER]->alignment; } else if (me->List_Nesting_Level >= 0 && !(present && present[HTML_DIV_ALIGN] && value[HTML_DIV_ALIGN] && (!strcasecomp(value[HTML_DIV_ALIGN], "center") || !strcasecomp(value[HTML_DIV_ALIGN], "right")))) { if (present && present[HTML_DIV_ALIGN]) me->current_default_alignment = HT_LEFT; else if (me->Division_Level == 0) me->current_default_alignment = HT_LEFT; else if (me->sp[0].tag_number == HTML_UL || me->sp[0].tag_number == HTML_OL || me->sp[0].tag_number == HTML_MENU || me->sp[0].tag_number == HTML_DIR || me->sp[0].tag_number == HTML_LI || me->sp[0].tag_number == HTML_LH || me->sp[0].tag_number == HTML_DD) me->current_default_alignment = HT_LEFT; LYHandlePlike(me, present, value, include, HTML_DIV_ALIGN, TRUE); me->DivisionAlignments[me->Division_Level] = (short) me->current_default_alignment; } else if (present && present[HTML_DIV_ALIGN] && non_empty(value[HTML_DIV_ALIGN])) { if (!strcasecomp(value[HTML_DIV_ALIGN], "center")) { me->DivisionAlignments[me->Division_Level] = HT_CENTER; change_paragraph_style(me, styles[HTML_DCENTER]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DCENTER]->alignment; } else if (!strcasecomp(value[HTML_DIV_ALIGN], "right")) { me->DivisionAlignments[me->Division_Level] = HT_RIGHT; change_paragraph_style(me, styles[HTML_DRIGHT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DRIGHT]->alignment; } else { me->DivisionAlignments[me->Division_Level] = HT_LEFT; change_paragraph_style(me, styles[HTML_DLEFT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DLEFT]->alignment; } } else { me->DivisionAlignments[me->Division_Level] = HT_LEFT; change_paragraph_style(me, styles[HTML_DLEFT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DLEFT]->alignment; } CHECK_ID(HTML_DIV_ID); break; case HTML_H1: case HTML_H2: case HTML_H3: case HTML_H4: case HTML_H5: case HTML_H6: /* * Close the previous style if not done by HTML doc. Added to get rid * of core dumps in BAD HTML on the net. * GAB 07-07-94 * But then again, these are actually allowed to nest. I guess I have * to depend on the HTML writers correct style. * GAB 07-12-94 if (i_prior_style != -1) { HTML_end_element(me, i_prior_style); } i_prior_style = ElementNumber; */ /* * Check whether we have an H# in a list, and if so, treat it as an LH. * - FM */ if ((me->List_Nesting_Level >= 0) && (me->sp[0].tag_number == HTML_UL || me->sp[0].tag_number == HTML_OL || me->sp[0].tag_number == HTML_MENU || me->sp[0].tag_number == HTML_DIR || me->sp[0].tag_number == HTML_LI)) { if (HTML_dtd.tags[HTML_LH].contents == SGML_EMPTY) { ElementNumber = HTML_LH; } else { me->new_style = me->sp[0].style; ElementNumber = (HTMLElement) me->sp[0].tag_number; UPDATE_STYLE; } /* * Some authors use H# headers as a substitute for FONT, so check * if this one immediately followed an LI. If so, both me->inP and * me->in_word will be FALSE (though the line might not be empty * due to a bullet and/or nbsp) and we can assume it is just for a * FONT change. We thus will not create another line break nor add * to the current left indentation. - FM */ if (!(me->inP == FALSE && me->in_word == NO)) { HText_appendParagraph(me->text); HTML_put_character(me, HT_NON_BREAK_SPACE); HText_setLastChar(me->text, ' '); me->in_word = NO; me->inP = FALSE; } CHECK_ID(HTML_H_ID); break; } if (present && present[HTML_H_ALIGN] && non_empty(value[HTML_H_ALIGN])) { if (!strcasecomp(value[HTML_H_ALIGN], "center")) change_paragraph_style(me, styles[HTML_HCENTER]); else if (!strcasecomp(value[HTML_H_ALIGN], "right")) change_paragraph_style(me, styles[HTML_HRIGHT]); else if (!strcasecomp(value[HTML_H_ALIGN], "left") || !strcasecomp(value[HTML_H_ALIGN], "justify")) change_paragraph_style(me, styles[HTML_HLEFT]); else change_paragraph_style(me, styles[ElementNumber]); } else if (me->Division_Level >= 0) { if (me->DivisionAlignments[me->Division_Level] == HT_CENTER) { change_paragraph_style(me, styles[HTML_HCENTER]); } else if (me->DivisionAlignments[me->Division_Level] == HT_LEFT) { change_paragraph_style(me, styles[HTML_HLEFT]); } else if (me->DivisionAlignments[me->Division_Level] == HT_RIGHT) { change_paragraph_style(me, styles[HTML_HRIGHT]); } } else { change_paragraph_style(me, styles[ElementNumber]); } UPDATE_STYLE; CHECK_ID(HTML_H_ID); if ((bold_headers == TRUE || (ElementNumber == HTML_H1 && bold_H1 == TRUE)) && (styles[ElementNumber]->font & HT_BOLD)) { if (me->inBoldA == FALSE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_START_CHAR); } me->inBoldH = TRUE; } break; case HTML_P: LYHandlePlike(me, present, value, include, HTML_P_ALIGN, TRUE); CHECK_ID(HTML_P_ID); break; case HTML_BR: UPDATE_STYLE; CHECK_ID(HTML_GEN_ID); /* Add a \r (new line) if these conditions are true: * * We are not collapsing BR's (and either we are not trimming * blank lines, or the preceding line is non-empty), or * * The current line has text on it. * Otherwise, don't do anything. -DH 19980814, TD 19980827/20170704 */ if ((LYCollapseBRs == FALSE && (!LYtrimBlankLines || !HText_PreviousLineEmpty(me->text, FALSE))) || !HText_LastLineEmpty(me->text, FALSE)) { HText_setLastChar(me->text, ' '); /* absorb white space */ HText_appendCharacter(me->text, '\r'); } me->in_word = NO; me->inP = FALSE; break; case HTML_WBR: UPDATE_STYLE; CHECK_ID(HTML_GEN_ID); HText_setBreakPoint(me->text); break; case HTML_HY: case HTML_SHY: UPDATE_STYLE; CHECK_ID(HTML_GEN_ID); HText_appendCharacter(me->text, LY_SOFT_HYPHEN); break; case HTML_HR: { int width; /* * Start a new line only if we had printable characters following * the previous newline, or remove the previous line if both it and * the last line are blank. - FM */ UPDATE_STYLE; if (!HText_LastLineEmpty(me->text, FALSE)) { HText_setLastChar(me->text, ' '); /* absorb white space */ HText_appendCharacter(me->text, '\r'); } else if (HText_PreviousLineEmpty(me->text, FALSE)) { HText_RemovePreviousLine(me->text); } me->in_word = NO; me->inP = FALSE; /* * Add an ID link if needed. - FM */ CHECK_ID(HTML_HR_ID); /* * Center lines within the current margins, if a right or left * ALIGNment is not specified. If WIDTH="#%" is given and not * garbage, use that to calculate the width, otherwise use the * default width. - FM */ if (present && present[HTML_HR_ALIGN] && value[HTML_HR_ALIGN]) { if (!strcasecomp(value[HTML_HR_ALIGN], "right")) { me->sp->style->alignment = HT_RIGHT; } else if (!strcasecomp(value[HTML_HR_ALIGN], "left")) { me->sp->style->alignment = HT_LEFT; } else { me->sp->style->alignment = HT_CENTER; } } else { me->sp->style->alignment = HT_CENTER; } width = LYcolLimit - me->new_style->leftIndent - me->new_style->rightIndent; if (present && present[HTML_HR_WIDTH] && value[HTML_HR_WIDTH] && isdigit(UCH(*value[HTML_HR_WIDTH])) && value[HTML_HR_WIDTH][strlen(value[HTML_HR_WIDTH]) - 1] == '%') { char *percent = NULL; int Percent, Width; StrAllocCopy(percent, value[HTML_HR_WIDTH]); percent[strlen(percent) - 1] = '\0'; Percent = atoi(percent); if (Percent > 100 || Percent < 1) width -= 5; else { Width = (width * Percent) / 100; if (Width < 1) width = 1; else width = Width; } FREE(percent); } else { width -= 5; } for (i = 0; i < width; i++) HTML_put_character(me, '_'); HText_appendCharacter(me->text, '\r'); me->in_word = NO; me->inP = FALSE; /* * Reset the alignment appropriately for the division and/or block. * - FM */ if (me->List_Nesting_Level < 0 && me->Division_Level >= 0) { me->sp->style->alignment = me->DivisionAlignments[me->Division_Level]; } else if (me->sp->style->id == ST_HeadingCenter || me->sp->style->id == ST_Heading1) { me->sp->style->alignment = HT_CENTER; } else if (me->sp->style->id == ST_HeadingRight) { me->sp->style->alignment = HT_RIGHT; } else { me->sp->style->alignment = HT_LEFT; } /* * Add a blank line and set the second line indentation for lists * and addresses, or a paragraph separator for other blocks. - FM */ if (me->List_Nesting_Level >= 0 || me->sp[0].tag_number == HTML_ADDRESS) { HText_setLastChar(me->text, ' '); /* absorb white space */ HText_appendCharacter(me->text, '\r'); } else { HText_appendParagraph(me->text); } } break; case HTML_TAB: if (!present) { /* Bad tag. Must have at least one attribute. - FM */ CTRACE((tfp, "HTML: TAB tag has no attributes. Ignored.\n")); break; } /* * If page author is using TAB within a TABLE, it's probably formatted * specifically to work well for Lynx without simple table tracking * code. Cancel tracking, it would only make things worse. - kw */ HText_cancelStbl(me->text); UPDATE_STYLE; CANT_JUSTIFY_THIS_LINE; if (present[HTML_TAB_ALIGN] && value[HTML_TAB_ALIGN] && (strcasecomp(value[HTML_TAB_ALIGN], "left") || !(present[HTML_TAB_TO] || present[HTML_TAB_INDENT]))) { /* * Just ensure a collapsible space, until we have the ALIGN and DP * attributes implemented. - FM */ HTML_put_character(me, ' '); CTRACE((tfp, "HTML: ALIGN not 'left'. Using space instead of TAB.\n")); } else if (!LYoverride_default_alignment(me) && me->current_default_alignment != HT_LEFT) { /* * Just ensure a collapsible space, until we can replace * HText_getCurrentColumn() in GridText.c with code which doesn't * require that the alignment be HT_LEFT. - FM */ HTML_put_character(me, ' '); CTRACE((tfp, "HTML: Not HT_LEFT. Using space instead of TAB.\n")); } else if ((present[HTML_TAB_TO] && non_empty(value[HTML_TAB_TO])) || (present[HTML_TAB_INDENT] && value[HTML_TAB_INDENT] && isdigit(UCH(*value[HTML_TAB_INDENT])))) { int column, target = -1; int enval = 2; column = HText_getCurrentColumn(me->text); if (present[HTML_TAB_TO] && non_empty(value[HTML_TAB_TO])) { /* * TO has priority over INDENT if both are present. - FM */ StrAllocCopy(temp, value[HTML_TAB_TO]); TRANSLATE_AND_UNESCAPE_TO_STD(&temp); if (*temp) { target = HText_getTabIDColumn(me->text, temp); } } else if (isEmpty(temp) && present[HTML_TAB_INDENT] && value[HTML_TAB_INDENT] && isdigit(UCH(*value[HTML_TAB_INDENT]))) { /* * The INDENT value is in "en" (enval per column) units. * Divide it by enval, rounding odd values up. - FM */ target = (int) (((1.0 * atoi(value[HTML_TAB_INDENT])) / enval) + (0.5)); } FREE(temp); /* * If we are being directed to a column too far to the left or * right, just add a collapsible space, otherwise, add the * appropriate number of spaces. - FM */ if (target < column || target > HText_getMaximumColumn(me->text)) { HTML_put_character(me, ' '); CTRACE((tfp, "HTML: Column out of bounds. Using space instead of TAB.\n")); } else { for (i = column; i < target; i++) HText_appendCharacter(me->text, ' '); HText_setLastChar(me->text, ' '); /* absorb white space */ } } me->in_word = NO; /* * If we have an ID attribute, save it together with the value of the * column we've reached. - FM */ if (present[HTML_TAB_ID] && non_empty(value[HTML_TAB_ID])) { StrAllocCopy(temp, value[HTML_TAB_ID]); TRANSLATE_AND_UNESCAPE_TO_STD(&temp); if (*temp) HText_setTabID(me->text, temp); FREE(temp); } break; case HTML_BASEFONT: break; case HTML_FONT: /* * FONT *may* have been declared SGML_EMPTY in HTMLDTD.c, and * SGML_character() in SGML.c *may* check for a FONT end tag to call * HTML_end_element() directly (with a check in that to bypass * decrementing of the HTML parser's stack). Or this may have been * really a end tag, for which some incarnations of SGML.c * would fake a start tag instead. - fm & kw * * But if we have an open FONT, DON'T close that one now, since FONT * tags can be legally nested AFAIK, and Lynx currently doesn't do * anything with them anyway... - kw */ #ifdef NOTUSED_FOTEMODS if (me->inFONT == TRUE) HTML_end_element(me, HTML_FONT, &include); #endif /* NOTUSED_FOTEMODS */ /* * Set flag to know we are in a FONT container, and add code to do * something about it, someday. - FM */ me->inFONT = TRUE; break; case HTML_B: /* Physical character highlighting */ case HTML_BLINK: case HTML_I: case HTML_U: case HTML_CITE: /* Logical character highlighting */ case HTML_EM: case HTML_STRONG: UPDATE_STYLE; me->Underline_Level++; CHECK_ID(HTML_GEN_ID); /* * Ignore this if inside of a bold anchor or header. Can't display * both underline and bold at same time. */ if (me->inBoldA == TRUE || me->inBoldH == TRUE) { CTRACE((tfp, "Underline Level is %d\n", me->Underline_Level)); break; } if (me->inUnderline == FALSE) { HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); me->inUnderline = TRUE; CTRACE((tfp, "Beginning underline\n")); } else { CTRACE((tfp, "Underline Level is %d\n", me->Underline_Level)); } break; case HTML_ABBR: /* Miscellaneous character containers */ case HTML_ACRONYM: case HTML_AU: case HTML_AUTHOR: case HTML_BIG: case HTML_CODE: case HTML_DFN: case HTML_KBD: case HTML_SAMP: case HTML_SMALL: case HTML_TT: case HTML_VAR: CHECK_ID(HTML_GEN_ID); break; /* ignore */ case HTML_SUP: HText_appendCharacter(me->text, '^'); CHECK_ID(HTML_GEN_ID); break; case HTML_SUB: HText_appendCharacter(me->text, '['); CHECK_ID(HTML_GEN_ID); break; case HTML_DEL: case HTML_S: case HTML_STRIKE: CHECK_ID(HTML_GEN_ID); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "[DEL:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; break; case HTML_INS: CHECK_ID(HTML_GEN_ID); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "[INS:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; break; case HTML_Q: CHECK_ID(HTML_GEN_ID); /* * Should check LANG and/or DIR attributes, and the * me->node_anchor->charset and/or yet to be added structure elements, * to determine whether we should use chevrons, but for now we'll * always use double- or single-quotes. - FM */ if (!(me->Quote_Level & 1)) HTML_put_character(me, '"'); else HTML_put_character(me, '`'); me->Quote_Level++; break; case HTML_PRE: /* Formatted text */ /* * Set our inPRE flag to FALSE so that a newline immediately following * the PRE start tag will be ignored. HTML_put_character() will set it * to TRUE when the first character within the PRE block is received. * - FM */ me->inPRE = FALSE; /* FALLTHRU */ case HTML_LISTING: /* Literal text */ /* FALLTHRU */ case HTML_XMP: /* FALLTHRU */ case HTML_PLAINTEXT: change_paragraph_style(me, styles[ElementNumber]); UPDATE_STYLE; CHECK_ID(HTML_GEN_ID); if (me->comment_end) HText_appendText(me->text, me->comment_end); break; case HTML_BLOCKQUOTE: case HTML_BQ: change_paragraph_style(me, styles[ElementNumber]); UPDATE_STYLE; if (me->sp->tag_number == (int) ElementNumber) LYEnsureDoubleSpace(me); CHECK_ID(HTML_BQ_ID); break; case HTML_NOTE: change_paragraph_style(me, styles[ElementNumber]); UPDATE_STYLE; if (me->sp->tag_number == (int) ElementNumber) LYEnsureDoubleSpace(me); CHECK_ID(HTML_NOTE_ID); { char *note = NULL; /* * Indicate the type of NOTE. */ if (present && present[HTML_NOTE_CLASS] && value[HTML_NOTE_CLASS] && (!strcasecomp(value[HTML_NOTE_CLASS], "CAUTION") || !strcasecomp(value[HTML_NOTE_CLASS], "WARNING"))) { StrAllocCopy(note, value[HTML_NOTE_CLASS]); LYUpperCase(note); StrAllocCat(note, ":"); } else if (present && present[HTML_NOTE_ROLE] && value[HTML_NOTE_ROLE] && (!strcasecomp(value[HTML_NOTE_ROLE], "CAUTION") || !strcasecomp(value[HTML_NOTE_ROLE], "WARNING"))) { StrAllocCopy(note, value[HTML_NOTE_ROLE]); LYUpperCase(note); StrAllocCat(note, ":"); } else { StrAllocCopy(note, "NOTE:"); } if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, note); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); CAN_JUSTIFY_START; FREE(note); } CAN_JUSTIFY_START; me->inLABEL = TRUE; me->in_word = NO; me->inP = FALSE; break; case HTML_ADDRESS: if (me->List_Nesting_Level < 0) { change_paragraph_style(me, styles[ElementNumber]); UPDATE_STYLE; if (me->sp->tag_number == (int) ElementNumber) LYEnsureDoubleSpace(me); } else { LYHandlePlike(me, present, value, include, -1, TRUE); } CHECK_ID(HTML_ADDRESS_ID); break; case HTML_DL: me->List_Nesting_Level++; /* increment the List nesting level */ if (me->List_Nesting_Level <= 0) { change_paragraph_style(me, present && present[HTML_DL_COMPACT] ? styles[HTML_DLC] : styles[HTML_DL]); } else if (me->List_Nesting_Level >= 6) { change_paragraph_style(me, present && present[HTML_DL_COMPACT] ? styles[HTML_DLC6] : styles[HTML_DL6]); } else { change_paragraph_style(me, present && present[HTML_DL_COMPACT] ? styles[(HTML_DLC1 - 1) + me->List_Nesting_Level] : styles[(HTML_DL1 - 1) + me->List_Nesting_Level]); } UPDATE_STYLE; /* update to the new style */ CHECK_ID(HTML_DL_ID); break; case HTML_DLC: me->List_Nesting_Level++; /* increment the List nesting level */ if (me->List_Nesting_Level <= 0) { change_paragraph_style(me, styles[HTML_DLC]); } else if (me->List_Nesting_Level >= 6) { change_paragraph_style(me, styles[HTML_DLC6]); } else { change_paragraph_style(me, styles[(HTML_DLC1 - 1) + me->List_Nesting_Level]); } UPDATE_STYLE; /* update to the new style */ CHECK_ID(HTML_DL_ID); break; case HTML_DT: CHECK_ID(HTML_GEN_ID); if (!me->style_change) { BOOL in_line_1 = HText_inLineOne(me->text); HTCoord saved_spaceBefore = me->sp->style->spaceBefore; HTCoord saved_spaceAfter = me->sp->style->spaceAfter; /* * If there are several DT elements and this is not the first, and * the preceding DT element's first (and normally only) line has * not yet been ended, suppress intervening blank line by * temporarily modifying the paragraph style in place. Ugly but * there's ample precedence. - kw */ if (in_line_1) { me->sp->style->spaceBefore = 0; /* temporary change */ me->sp->style->spaceAfter = 0; /* temporary change */ } HText_appendParagraph(me->text); me->sp->style->spaceBefore = saved_spaceBefore; /* undo */ me->sp->style->spaceAfter = saved_spaceAfter; /* undo */ me->in_word = NO; me->sp->style->alignment = HT_LEFT; } me->inP = FALSE; break; case HTML_DD: CHECK_ID(HTML_GEN_ID); HText_setLastChar(me->text, ' '); /* absorb white space */ if (!me->style_change) { if (!HText_LastLineEmpty(me->text, FALSE)) { HText_appendCharacter(me->text, '\r'); } else { HText_NegateLineOne(me->text); } } else { UPDATE_STYLE; HText_appendCharacter(me->text, '\t'); } me->sp->style->alignment = HT_LEFT; me->in_word = NO; me->inP = FALSE; break; case HTML_OL: /* * Set the default TYPE. */ me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = '1'; /* * Check whether we have a starting sequence number, or want to * continue the numbering from a previous OL in this nest. - FM */ if (present && (present[HTML_OL_SEQNUM] || present[HTML_OL_START])) { int seqnum; /* * Give preference to the valid HTML 3.0 SEQNUM attribute name over * the Netscape START attribute name (too bad the Netscape * developers didn't read the HTML 3.0 specs before re-inventing * the "wheel" as "we'll"). - FM */ if (present[HTML_OL_SEQNUM] && non_empty(value[HTML_OL_SEQNUM])) { seqnum = atoi(value[HTML_OL_SEQNUM]); } else if (present[HTML_OL_START] && non_empty(value[HTML_OL_START])) { seqnum = atoi(value[HTML_OL_START]); } else { seqnum = 1; } /* * Don't allow negative numbers less than or equal to our flags, or * numbers less than 1 if an Alphabetic or Roman TYPE. - FM */ if (present[HTML_OL_TYPE] && value[HTML_OL_TYPE]) { if (*value[HTML_OL_TYPE] == 'A') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'A'; if (seqnum < 1) seqnum = 1; } else if (*value[HTML_OL_TYPE] == 'a') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'a'; if (seqnum < 1) seqnum = 1; } else if (*value[HTML_OL_TYPE] == 'I') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'I'; if (seqnum < 1) seqnum = 1; } else if (*value[HTML_OL_TYPE] == 'i') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'i'; if (seqnum < 1) seqnum = 1; } else { if (seqnum <= OL_VOID) seqnum = OL_VOID + 1; } } else if (seqnum <= OL_VOID) { seqnum = OL_VOID + 1; } me->OL_Counter[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = seqnum; } else if (present && present[HTML_OL_CONTINUE]) { me->OL_Counter[me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11] = OL_CONTINUE; } else { me->OL_Counter[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 1; if (present && present[HTML_OL_TYPE] && value[HTML_OL_TYPE]) { if (*value[HTML_OL_TYPE] == 'A') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'A'; } else if (*value[HTML_OL_TYPE] == 'a') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'a'; } else if (*value[HTML_OL_TYPE] == 'I') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'I'; } else if (*value[HTML_OL_TYPE] == 'i') { me->OL_Type[(me->List_Nesting_Level < 11 ? me->List_Nesting_Level + 1 : 11)] = 'i'; } } } me->List_Nesting_Level++; if (me->List_Nesting_Level <= 0) { change_paragraph_style(me, styles[ElementNumber]); } else if (me->List_Nesting_Level >= 6) { change_paragraph_style(me, styles[HTML_OL6]); } else { change_paragraph_style(me, styles[HTML_OL1 + me->List_Nesting_Level - 1]); } UPDATE_STYLE; /* update to the new style */ CHECK_ID(HTML_OL_ID); break; case HTML_UL: me->List_Nesting_Level++; if (me->List_Nesting_Level <= 0) { if (!(present && present[HTML_UL_PLAIN]) && !(present && present[HTML_UL_TYPE] && value[HTML_UL_TYPE] && 0 == strcasecomp(value[HTML_UL_TYPE], "PLAIN"))) { change_paragraph_style(me, styles[ElementNumber]); } else { change_paragraph_style(me, styles[HTML_DIR]); ElementNumber = HTML_DIR; } } else if (me->List_Nesting_Level >= 6) { if (!(present && present[HTML_UL_PLAIN]) && !(present && present[HTML_UL_TYPE] && value[HTML_UL_TYPE] && 0 == strcasecomp(value[HTML_UL_TYPE], "PLAIN"))) { change_paragraph_style(me, styles[HTML_OL6]); } else { change_paragraph_style(me, styles[HTML_MENU6]); ElementNumber = HTML_DIR; } } else { if (!(present && present[HTML_UL_PLAIN]) && !(present && present[HTML_UL_TYPE] && value[HTML_UL_TYPE] && 0 == strcasecomp(value[HTML_UL_TYPE], "PLAIN"))) { change_paragraph_style(me, styles[HTML_OL1 + me->List_Nesting_Level - 1]); } else { change_paragraph_style(me, styles[HTML_MENU1 + me->List_Nesting_Level - 1]); ElementNumber = HTML_DIR; } } UPDATE_STYLE; /* update to the new style */ CHECK_ID(HTML_UL_ID); break; case HTML_MENU: case HTML_DIR: me->List_Nesting_Level++; if (me->List_Nesting_Level <= 0) { change_paragraph_style(me, styles[ElementNumber]); } else if (me->List_Nesting_Level >= 6) { change_paragraph_style(me, styles[HTML_MENU6]); } else { change_paragraph_style(me, styles[HTML_MENU1 + me->List_Nesting_Level - 1]); } UPDATE_STYLE; /* update to the new style */ CHECK_ID(HTML_UL_ID); break; case HTML_LH: UPDATE_STYLE; /* update to the new style */ HText_appendParagraph(me->text); CHECK_ID(HTML_GEN_ID); HTML_put_character(me, HT_NON_BREAK_SPACE); HText_setLastChar(me->text, ' '); me->in_word = NO; me->inP = FALSE; break; case HTML_LI: UPDATE_STYLE; /* update to the new style */ HText_appendParagraph(me->text); me->sp->style->alignment = HT_LEFT; CHECK_ID(HTML_LI_ID); { int surrounding_tag_number = me->sp[0].tag_number; /* * No, a LI should never occur directly within another LI, but this * may result from incomplete error recovery. So check one more * surrounding level in this case. - kw */ if (surrounding_tag_number == HTML_LI && me->sp < (me->stack + MAX_NESTING - 1)) surrounding_tag_number = me->sp[1].tag_number; if (surrounding_tag_number == HTML_OL) { char number_string[20]; int counter, seqnum; char seqtype; counter = me->List_Nesting_Level < 11 ? me->List_Nesting_Level : 11; if (present && present[HTML_LI_TYPE] && value[HTML_LI_TYPE]) { if (*value[HTML_LI_TYPE] == '1') { me->OL_Type[counter] = '1'; } else if (*value[HTML_LI_TYPE] == 'A') { me->OL_Type[counter] = 'A'; } else if (*value[HTML_LI_TYPE] == 'a') { me->OL_Type[counter] = 'a'; } else if (*value[HTML_LI_TYPE] == 'I') { me->OL_Type[counter] = 'I'; } else if (*value[HTML_LI_TYPE] == 'i') { me->OL_Type[counter] = 'i'; } } if (present && present[HTML_LI_VALUE] && ((value[HTML_LI_VALUE] != NULL) && (*value[HTML_LI_VALUE] != '\0')) && ((isdigit(UCH(*value[HTML_LI_VALUE]))) || (*value[HTML_LI_VALUE] == '-' && isdigit(UCH(*(value[HTML_LI_VALUE] + 1)))))) { seqnum = atoi(value[HTML_LI_VALUE]); if (seqnum <= OL_VOID) seqnum = OL_VOID + 1; seqtype = me->OL_Type[counter]; if (seqtype != '1' && seqnum < 1) seqnum = 1; me->OL_Counter[counter] = seqnum + 1; } else if (me->OL_Counter[counter] >= OL_VOID) { seqnum = me->OL_Counter[counter]++; seqtype = me->OL_Type[counter]; if (seqtype != '1' && seqnum < 1) { seqnum = 1; me->OL_Counter[counter] = seqnum + 1; } } else { seqnum = me->Last_OL_Count + 1; seqtype = me->Last_OL_Type; for (i = (counter - 1); i >= 0; i--) { if (me->OL_Counter[i] > OL_VOID) { seqnum = me->OL_Counter[i]++; seqtype = me->OL_Type[i]; i = 0; } } } if (seqtype == 'A') { strcpy(number_string, LYUppercaseA_OL_String(seqnum)); } else if (seqtype == 'a') { strcpy(number_string, LYLowercaseA_OL_String(seqnum)); } else if (seqtype == 'I') { strcpy(number_string, LYUppercaseI_OL_String(seqnum)); } else if (seqtype == 'i') { strcpy(number_string, LYLowercaseI_OL_String(seqnum)); } else { sprintf(number_string, "%2d.", seqnum); } me->Last_OL_Count = seqnum; me->Last_OL_Type = seqtype; /* * Hack, because there is no append string! */ for (i = 0; number_string[i] != '\0'; i++) if (number_string[i] == ' ') HTML_put_character(me, HT_NON_BREAK_SPACE); else HTML_put_character(me, number_string[i]); /* * Use HTML_put_character so that any other spaces coming * through will be collapsed. We'll use nbsp, so it won't * break at the spacing character if there are no spaces in the * subsequent text up to the right margin, but will declare it * as a normal space to ensure collapsing if a normal space * does immediately follow it. - FM */ HTML_put_character(me, HT_NON_BREAK_SPACE); HText_setLastChar(me->text, ' '); } else if (surrounding_tag_number == HTML_UL) { /* * Hack, because there is no append string! */ HTML_put_character(me, HT_NON_BREAK_SPACE); HTML_put_character(me, HT_NON_BREAK_SPACE); switch (me->List_Nesting_Level % 7) { case 0: HTML_put_character(me, '*'); break; case 1: HTML_put_character(me, '+'); break; case 2: HTML_put_character(me, 'o'); break; case 3: HTML_put_character(me, '#'); break; case 4: HTML_put_character(me, '@'); break; case 5: HTML_put_character(me, '-'); break; case 6: HTML_put_character(me, '='); break; } /* * Keep using HTML_put_character so that any other spaces * coming through will be collapsed. We use nbsp, so we won't * wrap at the spacing character if there are no spaces in the * subsequent text up to the right margin, but will declare it * as a normal space to ensure collapsing if a normal space * does immediately follow it. - FM */ HTML_put_character(me, HT_NON_BREAK_SPACE); HText_setLastChar(me->text, ' '); } else { /* * Hack, because there is no append string! */ HTML_put_character(me, HT_NON_BREAK_SPACE); HTML_put_character(me, HT_NON_BREAK_SPACE); HText_setLastChar(me->text, ' '); } } CAN_JUSTIFY_START; me->in_word = NO; me->inP = FALSE; break; case HTML_SPAN: CHECK_ID(HTML_GEN_ID); /* * Should check LANG and/or DIR attributes, and the * me->node_anchor->charset and/or yet to be added structure elements, * and do something here. - FM */ break; case HTML_BDO: CHECK_ID(HTML_GEN_ID); /* * Should check DIR (and LANG) attributes, and the * me->node_anchor->charset and/or yet to be added structure elements, * and do something here. - FM */ break; case HTML_SPOT: CHECK_ID(HTML_GEN_ID); break; case HTML_FN: change_paragraph_style(me, styles[ElementNumber]); UPDATE_STYLE; if (me->sp->tag_number == (int) ElementNumber) LYEnsureDoubleSpace(me); CHECK_ID(HTML_GEN_ID); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "FOOTNOTE:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); CAN_JUSTIFY_START me->inLABEL = TRUE; me->in_word = NO; me->inP = FALSE; break; case HTML_A: /* * If we are looking for client-side image maps, then handle an A * within a MAP that has a COORDS attribute as an AREA tag. * Unfortunately we lose the anchor text this way for the LYNXIMGMAP, * we would have to do much more parsing to collect it. After * potentially handling the A as AREA, always return immediately if * only looking for image maps, without pushing anything on the style * stack. - kw */ if (me->map_address && present && present[HTML_A_COORDS]) LYStartArea(me, present[HTML_A_HREF] ? value[HTML_A_HREF] : NULL, NULL, present[HTML_A_TITLE] ? value[HTML_A_TITLE] : NULL, tag_charset); if (LYMapsOnly) { return HT_OK; } /* * A may have been declared SGML_EMPTY in HTMLDTD.c, and * SGML_character() in SGML.c may check for an A end tag to call * HTML_end_element() directly (with a check in that to bypass * decrementing of the HTML parser's stack), so if we have an open A, * close that one now. - FM & kw */ if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } /* * Set to know we are in an anchor. */ me->inA = TRUE; /* * Load id_string if we have an ID or NAME. - FM */ if (present && present[HTML_A_ID] && non_empty(value[HTML_A_ID])) { StrAllocCopy(id_string, value[HTML_A_ID]); } else if (present && present[HTML_A_NAME] && non_empty(value[HTML_A_NAME])) { StrAllocCopy(id_string, value[HTML_A_NAME]); } if (id_string) TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); /* * Handle the reference. - FM */ if (present && present[HTML_A_HREF]) { /* * Set to know we are making the content bold. */ me->inBoldA = TRUE; if (isEmpty(value[HTML_A_HREF])) StrAllocCopy(href, "#"); else StrAllocCopy(href, value[HTML_A_HREF]); CHECK_FOR_INTERN(intern_flag, href); /* '#' */ if (intern_flag) { /*** FAST WAY: ***/ TRANSLATE_AND_UNESCAPE_TO_STD(&href); } else { url_type = LYLegitimizeHREF(me, &href, TRUE, TRUE); /* * Deal with our ftp gateway kludge. - FM */ if (!url_type && !StrNCmp(href, "/foo/..", 7) && (isFTP_URL(me->node_anchor->address) || isFILE_URL(me->node_anchor->address))) { for (i = 0; (href[i] = href[i + 7]) != 0; i++) ; } } if (present[HTML_A_ISMAP]) /*??? */ intern_flag = FALSE; } else { if (bold_name_anchors == TRUE) { me->inBoldA = TRUE; } } if (present && present[HTML_A_TYPE] && value[HTML_A_TYPE]) { StrAllocCopy(temp, value[HTML_A_TYPE]); if (!intern_flag && !strcasecomp(value[HTML_A_TYPE], HTAtom_name(HTInternalLink)) && !LYIsUIPage3(me->node_anchor->address, UIP_LIST_PAGE, 0) && !LYIsUIPage3(me->node_anchor->address, UIP_ADDRLIST_PAGE, 0) && !isLYNXIMGMAP(me->node_anchor->address)) { /* Some kind of spoof? * Found TYPE="internal link" but not in a valid context * where we have written it. - kw */ CTRACE((tfp, "HTML: Found invalid HREF=\"%s\" TYPE=\"%s\"!\n", href, temp)); FREE(temp); } } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ href, /* Address */ (temp ? (HTLinkType *) HTAtom_for(temp) : INTERN_LT)); /* Type */ FREE(temp); FREE(id_string); if (me->CurrentA && present) { if (present[HTML_A_TITLE] && non_empty(value[HTML_A_TITLE])) { StrAllocCopy(title, value[HTML_A_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); if (*title == '\0') { FREE(title); } } if (present[HTML_A_ISMAP]) dest_ismap = TRUE; if (present[HTML_A_CHARSET] && non_empty(value[HTML_A_CHARSET])) { /* * Set up to load the anchor's chartrans structures * appropriately for the current display character set if it * can handle what's claimed. - FM */ StrAllocCopy(temp, value[HTML_A_CHARSET]); TRANSLATE_AND_UNESCAPE_TO_STD(&temp); dest_char_set = UCGetLYhndl_byMIME(temp); if (dest_char_set < 0) { dest_char_set = UCLYhndl_for_unrec; } } if (title != NULL || dest_ismap == TRUE || dest_char_set >= 0) { dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) ); } if (dest && title != NULL && HTAnchor_title(dest) == NULL) HTAnchor_setTitle(dest, title); if (dest && dest_ismap) dest->isISMAPScript = TRUE; /* Don't allow CHARSET attribute to change *this* document's charset assumption. - kw */ if (dest && dest != me->node_anchor && dest_char_set >= 0) { /* * Load the anchor's chartrans structures. This should be done * more intelligently when setting up the structured object, * but it gets the job done for now. - FM */ HTAnchor_setUCInfoStage(dest, dest_char_set, UCT_STAGE_MIME, UCT_SETBY_DEFAULT); HTAnchor_setUCInfoStage(dest, dest_char_set, UCT_STAGE_PARSER, UCT_SETBY_LINK); } FREE(temp); dest = NULL; FREE(title); } me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldA == TRUE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); #if defined(NOTUSED_FOTEMODS) /* * Close an HREF-less NAMED-ed now if we aren't making their content * bold, and let the check in HTML_end_element() deal with any dangling * end tag this creates. - FM */ if (href == NULL && me->inBoldA == FALSE) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } #else /*Close an HREF-less NAMED-ed now if force_empty_hrefless_a was requested - VH */ if (href == NULL && force_empty_hrefless_a) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } #endif FREE(href); break; case HTML_IMG: /* Images */ /* * If we're in an anchor, get the destination, and if it's a clickable * image for the current anchor, set our flags for faking a 0,0 * coordinate pair, which typically returns the image's default. - FM */ if (me->inA && me->CurrentA) { if ((dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) )) != NULL) { if (dest->isISMAPScript == TRUE) { dest_ismap = TRUE; CTRACE((tfp, "HTML: '%s' is an ISMAP script\n", dest->address)); } else if (present && present[HTML_IMG_ISMAP]) { dest_ismap = TRUE; dest->isISMAPScript = TRUE; CTRACE((tfp, "HTML: Designating '%s' as an ISMAP script\n", dest->address)); } } } intern_flag = FALSE; /* unless set below - kw */ /* * If there's a USEMAP, resolve it. - FM */ if (present && present[HTML_IMG_USEMAP] && non_empty(value[HTML_IMG_USEMAP])) { StrAllocCopy(map_href, value[HTML_IMG_USEMAP]); CHECK_FOR_INTERN(intern_flag, map_href); (void) LYLegitimizeHREF(me, &map_href, TRUE, TRUE); /* * If map_href ended up zero-length or otherwise doesn't have a * hash, it can't be valid, so ignore it. - FM */ if (findPoundSelector(map_href) == NULL) { FREE(map_href); } } /* * Handle a MAP reference if we have one at this point. - FM */ if (map_href) { /* * If the MAP reference doesn't yet begin with a scheme, check * whether a base tag is in effect. - FM */ /* * If the USEMAP value is a lone fragment and LYSeekFragMAPinCur is * set, we'll use the current document's URL for resolving. * Otherwise use the BASE. - kw */ Base = ((me->inBASE && !(*map_href == '#' && LYSeekFragMAPinCur == TRUE)) ? me->base_href : me->node_anchor->address); HTParseALL(&map_href, Base); /* * Prepend our client-side MAP access field. - FM */ StrAllocCopy(temp, STR_LYNXIMGMAP); StrAllocCat(temp, map_href); StrAllocCopy(map_href, temp); FREE(temp); } /* * Check whether we want to suppress the server-side ISMAP link if a * client-side MAP is present. - FM */ if (LYNoISMAPifUSEMAP && map_href && dest_ismap) { dest_ismap = FALSE; dest = NULL; } /* * Check for a TITLE attribute. - FM */ if (present && present[HTML_IMG_TITLE] && non_empty(value[HTML_IMG_TITLE])) { StrAllocCopy(title, value[HTML_IMG_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); if (*title == '\0') { FREE(title); } } /* * If there's an ALT string, use it, unless the ALT string is * zero-length or just spaces and we are making all SRCs links or have * a USEMAP link. - FM */ if (((present) && (present[HTML_IMG_ALT] && value[HTML_IMG_ALT])) && (!clickable_images || ((clickable_images || map_href) && *value[HTML_IMG_ALT] != '\0'))) { StrAllocCopy(alt_string, value[HTML_IMG_ALT]); TRANSLATE_AND_UNESCAPE_ENTITIES(&alt_string, me->UsePlainSpace, me->HiddenValue); /* * If it's all spaces and we are making SRC or USEMAP links, treat * it as zero-length. - FM */ if (clickable_images || map_href) { LYTrimHead(alt_string); LYTrimTail(alt_string); if (*alt_string == '\0') { if (map_href) { StrAllocCopy(alt_string, (title ? title : (temp = MakeNewMapValue(value, "USEMAP")))); FREE(temp); } else if (dest_ismap) { StrAllocCopy(alt_string, (title ? title : (temp = MakeNewMapValue(value, "ISMAP")))); FREE(temp); } else if (me->inA == TRUE && dest) { StrAllocCopy(alt_string, (title ? title : VERBOSE_IMG(value, HTML_IMG_SRC, "[LINK]"))); } else { StrAllocCopy(alt_string, (title ? title : ((present && present[HTML_IMG_ISOBJECT]) ? "(OBJECT)" : VERBOSE_IMG(value, HTML_IMG_SRC, "[INLINE]")))); } } } } else if (map_href) { StrAllocCopy(alt_string, (title ? title : (temp = MakeNewMapValue(value, "USEMAP")))); FREE(temp); } else if ((dest_ismap == TRUE) || (me->inA && present && present[HTML_IMG_ISMAP])) { StrAllocCopy(alt_string, (title ? title : (temp = MakeNewMapValue(value, "ISMAP")))); FREE(temp); } else if (me->inA == TRUE && dest) { StrAllocCopy(alt_string, (title ? title : VERBOSE_IMG(value, HTML_IMG_SRC, "[LINK]"))); } else { if (pseudo_inline_alts || clickable_images) StrAllocCopy(alt_string, (title ? title : ((present && present[HTML_IMG_ISOBJECT]) ? "(OBJECT)" : VERBOSE_IMG(value, HTML_IMG_SRC, "[INLINE]")))); else StrAllocCopy(alt_string, NonNull(title)); } if (*alt_string == '\0' && map_href) { StrAllocCopy(alt_string, (temp = MakeNewMapValue(value, "USEMAP"))); FREE(temp); } CTRACE((tfp, "HTML IMG: USEMAP=%d ISMAP=%d ANCHOR=%d PARA=%d\n", map_href ? 1 : 0, (dest_ismap == TRUE) ? 1 : 0, me->inA, me->inP)); /* * Check for an ID attribute. - FM */ if (present && present[HTML_IMG_ID] && non_empty(value[HTML_IMG_ID])) { StrAllocCopy(id_string, value[HTML_IMG_ID]); TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); if (*id_string == '\0') { FREE(id_string); } } /* * Create links to the SRC for all images, if desired. - FM */ if (clickable_images && present && present[HTML_IMG_SRC] && non_empty(value[HTML_IMG_SRC])) { StrAllocCopy(href, value[HTML_IMG_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); /* * If it's an ISMAP and/or USEMAP, or graphic for an anchor, end * that anchor and start one for the SRC. - FM */ if (me->inA) { /* * If we have a USEMAP, end this anchor and start a new one for * the client-side MAP. - FM */ if (map_href) { if (dest_ismap) { HTML_put_character(me, ' '); me->in_word = NO; HTML_put_string(me, (temp = MakeNewMapValue(value, "ISMAP"))); FREE(temp); } else if (dest) { HTML_put_character(me, ' '); me->in_word = NO; HTML_put_string(me, "[LINK]"); } if (me->inBoldA == TRUE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldA = FALSE; HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; if (dest_ismap || dest) HTML_put_character(me, '-'); if (id_string) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); } } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ map_href, /* Addresss */ INTERN_LT); /* Type */ if (me->CurrentA && title) { if ((dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) )) != NULL) { if (!HTAnchor_title(dest)) HTAnchor_setTitle(dest, title); } } me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldA == FALSE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_START_CHAR); } me->inBoldA = TRUE; } else { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } HTML_put_string(me, alt_string); if (me->inBoldA == TRUE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldA = FALSE; HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; HTML_put_character(me, '-'); FREE(newtitle); StrAllocCopy(alt_string, ((present && present[HTML_IMG_ISOBJECT]) ? ((map_href || dest_ismap) ? "(IMAGE)" : "(OBJECT)") : VERBOSE_IMG(value, HTML_IMG_SRC, "[IMAGE]"))); if (id_string && !map_href) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); } } } else if (map_href) { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; if (id_string) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); } } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ map_href, /* Addresss */ INTERN_LT); /* Type */ if (me->CurrentA && title) { if ((dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) )) != NULL) { if (!HTAnchor_title(dest)) HTAnchor_setTitle(dest, title); } } me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldA == FALSE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); me->inBoldA = TRUE; HTML_put_string(me, alt_string); if (me->inBoldA == TRUE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldA = FALSE; HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; HTML_put_character(me, '-'); FREE(newtitle); StrAllocCopy(alt_string, ((present && present[HTML_IMG_ISOBJECT]) ? "(IMAGE)" : VERBOSE_IMG(value, HTML_IMG_SRC, "[IMAGE]"))); } else { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; if (id_string) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); } } } /* * Create the link to the SRC. - FM */ me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ FREE(href); me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, alt_string); if (!me->inA) { if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } else { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; me->inBoldA = TRUE; } } else if (map_href) { if (me->inA) { /* * We're in an anchor and have a USEMAP, so end the anchor and * start a new one for the client-side MAP. - FM */ if (dest_ismap) { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; HTML_put_string(me, (temp = MakeNewMapValue(value, "ISMAP"))); FREE(temp); } else if (dest) { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; HTML_put_string(me, "[LINK]"); } if (me->inBoldA == TRUE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldA = FALSE; HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; if (dest_ismap || dest) { HTML_put_character(me, '-'); } } else { HTML_put_character(me, ' '); me->in_word = NO; } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ map_href, /* Addresss */ INTERN_LT); /* Type */ if (me->CurrentA && title) { if ((dest = HTAnchor_parent(HTAnchor_followLink(me->CurrentA) )) != NULL) { if (!HTAnchor_title(dest)) HTAnchor_setTitle(dest, title); } } me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldA == FALSE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_START_CHAR); } me->inBoldA = TRUE; HTML_put_string(me, alt_string); if (!me->inA) { if (me->inBoldA == TRUE && me->inBoldH == FALSE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldA = FALSE; HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; } } else { /* * Just put in the ALT or pseudo-ALT string for the current anchor * or inline, with an ID link if indicated. - FM */ HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; if (id_string) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ (HTLinkType *) 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); } } HTML_put_string(me, alt_string); HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } FREE(map_href); FREE(alt_string); FREE(id_string); FREE(title); FREE(newtitle); dest = NULL; break; case HTML_MAP: /* * Load id_string if we have a NAME or ID. - FM */ if (present && present[HTML_MAP_NAME] && non_empty(value[HTML_MAP_NAME])) { StrAllocCopy(id_string, value[HTML_MAP_NAME]); } else if (present && present[HTML_MAP_ID] && non_empty(value[HTML_MAP_ID])) { StrAllocCopy(id_string, value[HTML_MAP_ID]); } if (id_string) { TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); if (*id_string == '\0') { FREE(id_string); } } /* * Generate a target anchor in this place in the containing document. * MAP can now contain block markup, if it doesn't contain any AREAs * (or A anchors with COORDS converted to AREAs) the current location * can be used as a fallback for following a USEMAP link. - kw */ if (!LYMapsOnly) LYHandleID(me, id_string); /* * Load map_address. - FM */ if (id_string) { /* * The MAP must be in the current stream, even if it had a BASE * tag, so we'll use its address here, but still use the BASE, if * present, when resolving the AREA elements in it's content, * unless the AREA's HREF is a lone fragment and * LYSeekFragAREAinCur is set. - FM && KW */ StrAllocCopy(me->map_address, me->node_anchor->address); if ((cp = StrChr(me->map_address, '#')) != NULL) *cp = '\0'; StrAllocCat(me->map_address, "#"); StrAllocCat(me->map_address, id_string); FREE(id_string); if (present && present[HTML_MAP_TITLE] && non_empty(value[HTML_MAP_TITLE])) { StrAllocCopy(title, value[HTML_MAP_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); if (*title == '\0') { FREE(title); } } LYAddImageMap(me->map_address, title, me->node_anchor); FREE(title); } break; case HTML_AREA: if (me->map_address && present && present[HTML_AREA_HREF] && non_empty(value[HTML_AREA_HREF])) { /* * Resolve the HREF. - FM */ StrAllocCopy(href, value[HTML_AREA_HREF]); CHECK_FOR_INTERN(intern_flag, href); (void) LYLegitimizeHREF(me, &href, TRUE, TRUE); /* * Check whether a BASE tag is in effect, and use it for resolving, * even though we used this stream's address for locating the MAP * itself, unless the HREF is a lone fragment and * LYSeekFragAREAinCur is set. - FM */ Base = (((me->inBASE && *href != '\0') && !(*href == '#' && LYSeekFragAREAinCur == TRUE)) ? me->base_href : me->node_anchor->address); HTParseALL(&href, Base); /* * Check for an ALT. - FM */ if (present[HTML_AREA_ALT] && non_empty(value[HTML_AREA_ALT])) { StrAllocCopy(alt_string, value[HTML_AREA_ALT]); } else if (present[HTML_AREA_TITLE] && non_empty(value[HTML_AREA_TITLE])) { /* * Use the TITLE as an ALT. - FM */ StrAllocCopy(alt_string, value[HTML_AREA_TITLE]); } if (alt_string != NULL) { TRANSLATE_AND_UNESCAPE_ENTITIES(&alt_string, me->UsePlainSpace, me->HiddenValue); /* * Make sure it's not just space(s). - FM */ LYTrimHead(alt_string); LYTrimTail(alt_string); if (*alt_string == '\0') { StrAllocCopy(alt_string, href); } } else { /* * Use the HREF as an ALT. - FM */ StrAllocCopy(alt_string, href); } LYAddMapElement(me->map_address, href, alt_string, me->node_anchor, intern_flag); FREE(href); FREE(alt_string); } break; case HTML_PARAM: /* * We may need to look at this someday to deal with MAPs, OBJECTs or * APPLETs optimally, but just ignore it for now. - FM */ break; case HTML_BODYTEXT: CHECK_ID(HTML_BODYTEXT_ID); /* * We may need to look at this someday to deal with OBJECTs optimally, * but just ignore it for now. - FM */ break; case HTML_TEXTFLOW: CHECK_ID(HTML_BODYTEXT_ID); /* * We may need to look at this someday to deal with APPLETs optimally, * but just ignore it for now. - FM */ break; case HTML_FIG: if (present) LYHandleFIG(me, present, value, present[HTML_FIG_ISOBJECT], present[HTML_FIG_IMAGEMAP], present[HTML_FIG_ID] ? value[HTML_FIG_ID] : NULL, present[HTML_FIG_SRC] ? value[HTML_FIG_SRC] : NULL, YES, TRUE, &intern_flag); else LYHandleFIG(me, NULL, NULL, 0, 0, NULL, NULL, YES, TRUE, &intern_flag); break; case HTML_OBJECT: if (!me->object_started) { /* * This is an outer OBJECT start tag, i.e., not a nested OBJECT, so * save its relevant attributes. - FM */ if (present) { if (present[HTML_OBJECT_DECLARE]) me->object_declare = TRUE; if (present[HTML_OBJECT_SHAPES]) me->object_shapes = TRUE; if (present[HTML_OBJECT_ISMAP]) me->object_ismap = TRUE; if (present[HTML_OBJECT_USEMAP] && non_empty(value[HTML_OBJECT_USEMAP])) { StrAllocCopy(me->object_usemap, value[HTML_OBJECT_USEMAP]); TRANSLATE_AND_UNESCAPE_TO_STD(&me->object_usemap); if (*me->object_usemap == '\0') { FREE(me->object_usemap); } } if (present[HTML_OBJECT_ID] && non_empty(value[HTML_OBJECT_ID])) { StrAllocCopy(me->object_id, value[HTML_OBJECT_ID]); TRANSLATE_AND_UNESCAPE_TO_STD(&me->object_id); if (*me->object_id == '\0') { FREE(me->object_id); } } if (present[HTML_OBJECT_TITLE] && non_empty(value[HTML_OBJECT_TITLE])) { StrAllocCopy(me->object_title, value[HTML_OBJECT_TITLE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&me->object_title, TRUE, FALSE); LYTrimHead(me->object_title); LYTrimTail(me->object_title); if (*me->object_title == '\0') { FREE(me->object_title); } } if (present[HTML_OBJECT_DATA] && non_empty(value[HTML_OBJECT_DATA])) { StrAllocCopy(me->object_data, value[HTML_OBJECT_DATA]); TRANSLATE_AND_UNESCAPE_TO_STD(&me->object_data); if (*me->object_data == '\0') { FREE(me->object_data); } } if (present[HTML_OBJECT_TYPE] && non_empty(value[HTML_OBJECT_TYPE])) { StrAllocCopy(me->object_type, value[HTML_OBJECT_TYPE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&me->object_type, TRUE, FALSE); LYTrimHead(me->object_type); LYTrimTail(me->object_type); if (*me->object_type == '\0') { FREE(me->object_type); } } if (present[HTML_OBJECT_CLASSID] && non_empty(value[HTML_OBJECT_CLASSID])) { StrAllocCopy(me->object_classid, value[HTML_OBJECT_CLASSID]); TRANSLATE_AND_UNESCAPE_ENTITIES(&me->object_classid, TRUE, FALSE); LYTrimHead(me->object_classid); LYTrimTail(me->object_classid); if (*me->object_classid == '\0') { FREE(me->object_classid); } } if (present[HTML_OBJECT_CODEBASE] && non_empty(value[HTML_OBJECT_CODEBASE])) { StrAllocCopy(me->object_codebase, value[HTML_OBJECT_CODEBASE]); TRANSLATE_AND_UNESCAPE_TO_STD(&me->object_codebase); if (*me->object_codebase == '\0') { FREE(me->object_codebase); } } if (present[HTML_OBJECT_CODETYPE] && non_empty(value[HTML_OBJECT_CODETYPE])) { StrAllocCopy(me->object_codetype, value[HTML_OBJECT_CODETYPE]); TRANSLATE_AND_UNESCAPE_ENTITIES(&me->object_codetype, TRUE, FALSE); LYTrimHead(me->object_codetype); LYTrimTail(me->object_codetype); if (*me->object_codetype == '\0') { FREE(me->object_codetype); } } if (present[HTML_OBJECT_NAME] && non_empty(value[HTML_OBJECT_NAME])) { StrAllocCopy(me->object_name, value[HTML_OBJECT_NAME]); TRANSLATE_AND_UNESCAPE_ENTITIES(&me->object_name, TRUE, FALSE); LYTrimHead(me->object_name); LYTrimTail(me->object_name); if (*me->object_name == '\0') { FREE(me->object_name); } } } /* * If we can determine now that we are not going to do anything * special to the OBJECT element's SGML contents, like skipping it * completely or collecting it up in order to add something after * it, then generate any output that should be emitted in the place * of the OBJECT start tag NOW, then don't initialize special * handling but return, letting our SGML parser know that further * content is to be parsed normally not literally. We could defer * this until we have collected the contents and then recycle the * contents (as was previously always done), but that has a higher * chance of completely losing content in case of nesting errors in * the input, incomplete transmissions, etc. - kw */ if ((!present || (me->object_declare == FALSE && me->object_name == NULL && me->object_shapes == FALSE && me->object_usemap == NULL))) { if (!LYMapsOnly) { if (!clickable_images || me->object_data == NULL || !(me->object_data != NULL && me->object_classid == NULL && me->object_codebase == NULL && me->object_codetype == NULL)) FREE(me->object_data); if (me->object_data) { HTStartAnchor5(me, (me->object_id ? value[HTML_OBJECT_ID] : NULL), value[HTML_OBJECT_DATA], value[HTML_OBJECT_TYPE], tag_charset); if ((me->object_type != NULL) && !strncasecomp(me->object_type, "image/", 6)) HTML_put_string(me, "(IMAGE)"); else HTML_put_string(me, "(OBJECT)"); HTML_end_element(me, HTML_A, NULL); } else if (me->object_id) LYHandleID(me, me->object_id); } clear_objectdata(me); /* * We do NOT want the HTML_put_* functions that are going to be * called for the OBJECT's character content to add to the * chunk, so we don't push on the stack. Instead we keep a * counter for open OBJECT tags that are treated this way, so * HTML_end_element can skip handling the corresponding end tag * that is going to arrive unexpectedly as far as our stack is * concerned. */ status = HT_PARSER_OTHER_CONTENT; if (me->sp[0].tag_number == HTML_FIG && me->objects_figged_open > 0) { ElementNumber = (HTMLElement) HTML_OBJECT_M; } else { me->objects_mixed_open++; SET_SKIP_STACK(HTML_OBJECT); } } else if (me->object_declare == FALSE && me->object_name == NULL && me->object_shapes == TRUE) { LYHandleFIG(me, present, value, 1, 1 || me->object_ismap, me->object_id, ((me->object_data && !me->object_classid) ? value[HTML_OBJECT_DATA] : NULL), NO, TRUE, &intern_flag); clear_objectdata(me); status = HT_PARSER_OTHER_CONTENT; me->objects_figged_open++; ElementNumber = HTML_FIG; } else { /* * Set flag that we are accumulating OBJECT content. - FM */ me->object_started = TRUE; } } break; case HTML_OVERLAY: if (clickable_images && me->inFIG && present && present[HTML_OVERLAY_SRC] && non_empty(value[HTML_OVERLAY_SRC])) { StrAllocCopy(href, value[HTML_OVERLAY_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (*href) { if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ HTML_put_character(me, ' '); HText_appendCharacter(me->text, '+'); me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, "[OVERLAY]"); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); HTML_put_character(me, ' '); me->in_word = NO; } FREE(href); } break; case HTML_APPLET: me->inAPPLET = TRUE; me->inAPPLETwithP = FALSE; HTML_put_character(me, ' '); /* space char may be ignored */ /* * Load id_string if we have an ID or NAME. - FM */ if (present && present[HTML_APPLET_ID] && non_empty(value[HTML_APPLET_ID])) { StrAllocCopy(id_string, value[HTML_APPLET_ID]); } else if (present && present[HTML_APPLET_NAME] && non_empty(value[HTML_APPLET_NAME])) { StrAllocCopy(id_string, value[HTML_APPLET_NAME]); } if (id_string) { TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); LYHandleID(me, id_string); FREE(id_string); } me->in_word = NO; /* * If there's an ALT string, use it, unless the ALT string is * zero-length and we are making all sources links. - FM */ if (present && present[HTML_APPLET_ALT] && value[HTML_APPLET_ALT] && (!clickable_images || (clickable_images && *value[HTML_APPLET_ALT] != '\0'))) { StrAllocCopy(alt_string, value[HTML_APPLET_ALT]); TRANSLATE_AND_UNESCAPE_ENTITIES(&alt_string, me->UsePlainSpace, me->HiddenValue); /* * If it's all spaces and we are making sources links, treat it as * zero-length. - FM */ if (clickable_images) { LYTrimHead(alt_string); LYTrimTail(alt_string); if (*alt_string == '\0') { StrAllocCopy(alt_string, "[APPLET]"); } } } else { if (clickable_images) StrAllocCopy(alt_string, "[APPLET]"); else StrAllocCopy(alt_string, ""); } /* * If we're making all sources links, get the source. - FM */ if (clickable_images && present && present[HTML_APPLET_CODE] && non_empty(value[HTML_APPLET_CODE])) { char *base = NULL; Base = (me->inBASE) ? me->base_href : me->node_anchor->address; /* * Check for a CODEBASE attribute. - FM */ if (present[HTML_APPLET_CODEBASE] && non_empty(value[HTML_APPLET_CODEBASE])) { StrAllocCopy(base, value[HTML_APPLET_CODEBASE]); LYRemoveBlanks(base); TRANSLATE_AND_UNESCAPE_TO_STD(&base); /* * Force it to be a directory. - FM */ if (*base == '\0') StrAllocCopy(base, "/"); LYAddHtmlSep(&base); LYLegitimizeHREF(me, &base, TRUE, FALSE); HTParseALL(&base, Base); } StrAllocCopy(href, value[HTML_APPLET_CODE]); LYLegitimizeHREF(me, &href, TRUE, FALSE); HTParseALL(&href, (base ? base : Base)); FREE(base); if (*href) { if (me->inA) { if (me->inBoldA == TRUE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); HTML_put_character(me, '-'); } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, alt_string); if (me->inA == FALSE) { if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; } HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } FREE(href); } else if (*alt_string) { /* * Just put up the ALT string, if non-zero. - FM */ HTML_put_string(me, alt_string); HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } FREE(alt_string); FREE(id_string); break; case HTML_BGSOUND: /* * If we're making all sources links, get the source. - FM */ if (clickable_images && present && present[HTML_BGSOUND_SRC] && non_empty(value[HTML_BGSOUND_SRC])) { StrAllocCopy(href, value[HTML_BGSOUND_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (*href == '\0') { FREE(href); break; } if (me->inA) { if (me->inBoldA == TRUE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); HTML_put_character(me, '-'); } else { HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, "[BGSOUND]"); if (me->inA == FALSE) { if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; } HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; FREE(href); } break; case HTML_EMBED: if (pseudo_inline_alts || clickable_images) HTML_put_character(me, ' '); /* space char may be ignored */ /* * Load id_string if we have an ID or NAME. - FM */ if (present && present[HTML_EMBED_ID] && non_empty(value[HTML_EMBED_ID])) { StrAllocCopy(id_string, value[HTML_EMBED_ID]); } else if (present && present[HTML_EMBED_NAME] && non_empty(value[HTML_EMBED_NAME])) { StrAllocCopy(id_string, value[HTML_EMBED_NAME]); } if (id_string) { TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); LYHandleID(me, id_string); FREE(id_string); } if (pseudo_inline_alts || clickable_images) me->in_word = NO; /* * If there's an ALT string, use it, unless the ALT string is * zero-length and we are making all sources links. - FM */ if (present && present[HTML_EMBED_ALT] && value[HTML_EMBED_ALT] && (!clickable_images || (clickable_images && *value[HTML_EMBED_ALT] != '\0'))) { StrAllocCopy(alt_string, value[HTML_EMBED_ALT]); TRANSLATE_AND_UNESCAPE_ENTITIES(&alt_string, me->UsePlainSpace, me->HiddenValue); /* * If it's all spaces and we are making sources links, treat it as * zero-length. - FM */ if (clickable_images) { LYTrimHead(alt_string); LYTrimTail(alt_string); if (*alt_string == '\0') { StrAllocCopy(alt_string, "[EMBED]"); } } } else { if (pseudo_inline_alts || clickable_images) StrAllocCopy(alt_string, "[EMBED]"); else StrAllocCopy(alt_string, ""); } /* * If we're making all sources links, get the source. - FM */ if (clickable_images && present && present[HTML_EMBED_SRC] && non_empty(value[HTML_EMBED_SRC])) { StrAllocCopy(href, value[HTML_EMBED_SRC]); LYLegitimizeHREF(me, &href, TRUE, TRUE); if (*href) { if (me->inA) { if (me->inBoldA == TRUE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); HTML_put_character(me, '-'); } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ me->CurrentANum = HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, alt_string); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); if (me->inA == FALSE) { if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; } HTML_put_character(me, ' '); me->in_word = NO; } FREE(href); } else if (*alt_string) { /* * Just put up the ALT string, if non-zero. - FM */ HTML_put_string(me, alt_string); HTML_put_character(me, ' '); /* space char may be ignored */ me->in_word = NO; } FREE(alt_string); FREE(id_string); break; case HTML_CREDIT: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); me->inCREDIT = TRUE; CHECK_ID(HTML_GEN_ID); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "CREDIT:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); CAN_JUSTIFY_START; if (me->inFIG) /* * Assume all text in the FIG container is intended to be * paragraphed. - FM */ me->inFIGwithP = TRUE; if (me->inAPPLET) /* * Assume all text in the APPLET container is intended to be * paragraphed. - FM */ me->inAPPLETwithP = TRUE; me->inLABEL = TRUE; me->in_word = NO; me->inP = FALSE; break; case HTML_CAPTION: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); me->inCAPTION = TRUE; CHECK_ID(HTML_CAPTION_ID); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, "CAPTION:"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); CAN_JUSTIFY_START; if (me->inFIG) /* * Assume all text in the FIG container is intended to be * paragraphed. - FM */ me->inFIGwithP = TRUE; if (me->inAPPLET) /* * Assume all text in the APPLET container is intended to be * paragraphed. - FM */ me->inAPPLETwithP = TRUE; me->inLABEL = TRUE; me->in_word = NO; me->inP = FALSE; break; case HTML_FORM: { char *action = NULL; char *method = NULL; char *enctype = NULL; const char *accept_cs = NULL; HTChildAnchor *source; HTAnchor *link_dest; /* * FORM may have been declared SGML_EMPTY in HTMLDTD.c, and * SGML_character() in SGML.c may check for a FORM end tag to call * HTML_end_element() directly (with a check in that to bypass * decrementing of the HTML parser's stack), so if we have an open * FORM, close that one now. - FM */ if (me->inFORM) { CTRACE((tfp, "HTML: Missing FORM end tag. Faking it!\n")); SET_SKIP_STACK(HTML_FORM); HTML_end_element(me, HTML_FORM, include); } /* * Set to know we are in a new form. */ me->inFORM = TRUE; EMIT_IFDEF_USE_JUSTIFY_ELTS(form_in_htext = TRUE); if (present && present[HTML_FORM_ACCEPT_CHARSET]) { accept_cs = (value[HTML_FORM_ACCEPT_CHARSET] ? value[HTML_FORM_ACCEPT_CHARSET] : "UNKNOWN"); } Base = (me->inBASE) ? me->base_href : me->node_anchor->address; if (present && present[HTML_FORM_ACTION] && value[HTML_FORM_ACTION]) { StrAllocCopy(action, value[HTML_FORM_ACTION]); LYLegitimizeHREF(me, &action, TRUE, TRUE); /* * Check whether a base tag is in effect. Note that actions * always are resolved w.r.t. to the base, even if the action * is empty. - FM */ HTParseALL(&action, Base); } else { StrAllocCopy(action, Base); } source = HTAnchor_findChildAndLink(me->node_anchor, NULL, action, (HTLinkType *) 0); if ((link_dest = HTAnchor_followLink(source)) != NULL) { /* * Memory leak fixed. 05-28-94 Lynx 2-3-1 Garrett Arch Blythe */ char *cp_freeme = HTAnchor_address(link_dest); if (cp_freeme != NULL) { StrAllocCopy(action, cp_freeme); FREE(cp_freeme); } else { StrAllocCopy(action, ""); } } if (present && present[HTML_FORM_METHOD]) StrAllocCopy(method, (value[HTML_FORM_METHOD] ? value[HTML_FORM_METHOD] : "GET")); if (present && present[HTML_FORM_ENCTYPE] && non_empty(value[HTML_FORM_ENCTYPE])) { StrAllocCopy(enctype, value[HTML_FORM_ENCTYPE]); LYLowerCase(enctype); } if (present) { /* * Check for a TITLE attribute, and if none is present, check * for a SUBJECT attribute as a synonym. - FM */ if (present[HTML_FORM_TITLE] && non_empty(value[HTML_FORM_TITLE])) { StrAllocCopy(title, value[HTML_FORM_TITLE]); } else if (present[HTML_FORM_SUBJECT] && non_empty(value[HTML_FORM_SUBJECT])) { StrAllocCopy(title, value[HTML_FORM_SUBJECT]); } if (non_empty(title)) { TRANSLATE_AND_UNESCAPE_ENTITIES(&title, TRUE, FALSE); LYTrimHead(title); LYTrimTail(title); if (*title == '\0') { FREE(title); } } } HText_beginForm(action, method, enctype, title, accept_cs); FREE(action); FREE(method); FREE(enctype); FREE(title); } CHECK_ID(HTML_FORM_ID); break; case HTML_FIELDSET: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); CHECK_ID(HTML_GEN_ID); break; case HTML_LEGEND: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); CHECK_ID(HTML_CAPTION_ID); break; case HTML_LABEL: CHECK_ID(HTML_LABEL_ID); break; case HTML_KEYGEN: CHECK_ID(HTML_KEYGEN_ID); break; case HTML_BUTTON: { InputFieldData I; int chars; BOOL faked_button = FALSE; /* init */ memset(&I, 0, sizeof(I)); I.name_cs = ATTR_CS_IN; I.value_cs = ATTR_CS_IN; UPDATE_STYLE; if (present && present[HTML_BUTTON_TYPE] && value[HTML_BUTTON_TYPE]) { if (!strcasecomp(value[HTML_BUTTON_TYPE], "submit") || !strcasecomp(value[HTML_BUTTON_TYPE], "reset")) { /* * It's a button for submitting or resetting a form. - FM */ I.type = value[HTML_BUTTON_TYPE]; } else { /* * Ugh, it's a button for a script. - FM */ I.type = value[HTML_BUTTON_TYPE]; CTRACE((tfp, "found button for a script\n")); } } else { /* default, if no type given, is a submit button */ I.type = "submit"; } /* * Before any input field, add a collapsible space if we're not in * a PRE block, to promote a wrap there for any long values that * would extend past the right margin from our current position in * the line. If we are in a PRE block, start a new line if the * last line already is within 6 characters of the wrap point for * PRE blocks. - FM */ if (me->sp[0].tag_number != HTML_PRE && !me->inPRE && me->sp->style->freeFormat) { HTML_put_character(me, ' '); me->in_word = NO; } else if (HText_LastLineSize(me->text, FALSE) > (LYcolLimit - 6)) { HTML_put_character(me, '\n'); me->in_word = NO; } HTML_put_character(me, '('); if (!(present && present[HTML_BUTTON_NAME] && value[HTML_BUTTON_NAME])) { I.name = ""; } else if (StrChr(value[HTML_BUTTON_NAME], '&') == NULL) { I.name = value[HTML_BUTTON_NAME]; } else { StrAllocCopy(I_name, value[HTML_BUTTON_NAME]); UNESCAPE_FIELDNAME_TO_STD(&I_name); I.name = I_name; } if (present && present[HTML_BUTTON_VALUE] && non_empty(value[HTML_BUTTON_VALUE])) { /* * Convert any HTML entities or decimal escaping. - FM */ StrAllocCopy(I.value, value[HTML_BUTTON_VALUE]); me->UsePlainSpace = TRUE; TRANSLATE_AND_UNESCAPE_ENTITIES(&I.value, TRUE, me->HiddenValue); me->UsePlainSpace = FALSE; /* * Convert any newlines or tabs to spaces, and trim any lead or * trailing spaces. - FM */ LYReduceBlanks(I.value); } else if (!strcasecomp(I.type, "button")) { if (non_empty(I.name)) { StrAllocCopy(I.value, I.name); } else { StrAllocCopy(I.value, "BUTTON"); faked_button = TRUE; } } else if (I.value == 0) { StrAllocCopy(I.value, "BUTTON"); } if (present && present[HTML_BUTTON_READONLY]) I.readonly = YES; if (present && present[HTML_BUTTON_DISABLED]) I.disabled = YES; if (present && present[HTML_BUTTON_CLASS] && /* Not yet used. */ non_empty(value[HTML_BUTTON_CLASS])) I.iclass = value[HTML_BUTTON_CLASS]; if (present && present[HTML_BUTTON_ID] && non_empty(value[HTML_BUTTON_ID])) { I.id = value[HTML_BUTTON_ID]; CHECK_ID(HTML_BUTTON_ID); } if (present && present[HTML_BUTTON_LANG] && /* Not yet used. */ non_empty(value[HTML_BUTTON_LANG])) I.lang = value[HTML_BUTTON_LANG]; chars = HText_beginInput(me->text, me->inUnderline, &I); /* * Submit and reset buttons have values which don't change, so * HText_beginInput() sets I.value to the string which should be * displayed, and we'll enter that instead of underscore * placeholders into the HText structure to see it instead of * underscores when dumping or printing. We also won't worry about * a wrap in PRE blocks, because the line editor never is invoked * for submit or reset buttons. - LE & FM */ if (me->sp[0].tag_number == HTML_PRE || !me->sp->style->freeFormat) { /* * We have a submit or reset button in a PRE block, so output * the entire value from the markup. If it extends to the * right margin, it will wrap there, and only the portion * before that wrap will be highlighted on screen display * (Yuk!) but we may as well show the rest of the full value on * the next or more lines. - FM */ while (I.value[i]) HTML_put_character(me, I.value[i++]); } else { /* * The submit or reset button is not in a PRE block. Note that * if a wrap occurs before outputting the entire value, the * wrapped portion will not be highlighted or clearly indicated * as part of the link for submission or reset (Yuk!). We'll * replace any spaces in the submit or reset button value with * nbsp, to promote a wrap at the space we ensured would be * present before the start of the string, as when we use all * underscores instead of the INPUT's actual value, but we * could still get a wrap at the right margin, instead, if the * value is greater than a line width for the current style. * Also, if chars somehow ended up longer than the length of * the actual value (shouldn't have), we'll continue padding * with nbsp up to the length of chars. - FM */ for (i = 0; I.value[i]; i++) { HTML_put_character(me, (char) ((I.value[i] == ' ') ? HT_NON_BREAK_SPACE : I.value[i])); } while (i++ < chars) { HTML_put_character(me, HT_NON_BREAK_SPACE); } } HTML_put_character(me, ')'); if (me->sp[0].tag_number != HTML_PRE && me->sp->style->freeFormat) { HTML_put_character(me, ' '); me->in_word = NO; } if (faked_button) FREE(I.value); FREE(I_name); } break; case HTML_INPUT: { InputFieldData I; int chars; BOOL UseALTasVALUE = FALSE; BOOL HaveSRClink = FALSE; char *ImageSrc = NULL; BOOL IsSubmitOrReset = FALSE; HTkcode kcode = NOKANJI; HTkcode specified_kcode = NOKANJI; /* init */ memset(&I, 0, sizeof(I)); I.name_cs = ATTR_CS_IN; I.value_cs = ATTR_CS_IN; UPDATE_STYLE; /* * Before any input field, add a collapsible space if we're not in * a PRE block, to promote a wrap there for any long values that * would extend past the right margin from our current position in * the line. If we are in a PRE block, start a new line if the * last line already is within 6 characters of the wrap point for * PRE blocks. - FM */ if (me->sp[0].tag_number != HTML_PRE && !me->inPRE && me->sp->style->freeFormat) { HTML_put_character(me, ' '); me->in_word = NO; } else if (HText_LastLineSize(me->text, FALSE) > (LYcolLimit - 6)) { HTML_put_character(me, '\n'); me->in_word = NO; } /* * Get the TYPE and make sure we can handle it. - FM */ if (present && present[HTML_INPUT_TYPE] && non_empty(value[HTML_INPUT_TYPE])) { const char *not_impl = NULL; char *usingval = NULL; I.type = value[HTML_INPUT_TYPE]; if (!strcasecomp(I.type, "range")) { if (present[HTML_INPUT_MIN] && non_empty(value[HTML_INPUT_MIN])) I.min = value[HTML_INPUT_MIN]; if (present[HTML_INPUT_MAX] && non_empty(value[HTML_INPUT_MAX])) I.max = value[HTML_INPUT_MAX]; /* * Not yet implemented. */ #ifdef NOTDEFINED not_impl = "[RANGE Input]"; if (me->inFORM) HText_DisableCurrentForm(); #endif /* NOTDEFINED */ CTRACE((tfp, "HTML: Ignoring TYPE=\"range\"\n")); break; } else if (!strcasecomp(I.type, "file")) { if (present[HTML_INPUT_ACCEPT] && non_empty(value[HTML_INPUT_ACCEPT])) I.accept = value[HTML_INPUT_ACCEPT]; #ifndef USE_FILE_UPLOAD not_impl = "[FILE Input]"; CTRACE((tfp, "Attempting to fake as: %s\n", I.type)); #ifdef NOTDEFINED if (me->inFORM) HText_DisableCurrentForm(); #endif /* NOTDEFINED */ CTRACE((tfp, "HTML: Ignoring TYPE=\"file\"\n")); #endif /* USE_FILE_UPLOAD */ } else if (!strcasecomp(I.type, "button")) { /* * Ugh, a button for a script. */ not_impl = "[BUTTON Input]"; } if (not_impl != NULL) { if (me->inUnderline == FALSE) { HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); } HTML_put_string(me, not_impl); if (usingval != NULL) { HTML_put_string(me, usingval); FREE(usingval); } else { HTML_put_string(me, " (not implemented)"); } if (me->inUnderline == FALSE) { HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); } } } CTRACE((tfp, "Ok, we're trying type=[%s]\n", NONNULL(I.type))); /* * Check for an unclosed TEXTAREA. */ if (me->inTEXTAREA) { if (LYBadHTML(me)) { LYShowBadHTML("Bad HTML: Missing TEXTAREA end tag.\n"); } } /* * Check for an unclosed SELECT, try to close it if found. */ if (me->inSELECT) { CTRACE((tfp, "HTML: Missing SELECT end tag, faking it...\n")); if (me->sp->tag_number != HTML_SELECT) { SET_SKIP_STACK(HTML_SELECT); } HTML_end_element(me, HTML_SELECT, include); } /* * Handle the INPUT as for a FORM. - FM */ if (!(present && present[HTML_INPUT_NAME] && non_empty(value[HTML_INPUT_NAME]))) { I.name = ""; } else if (StrChr(value[HTML_INPUT_NAME], '&') == NULL) { I.name = value[HTML_INPUT_NAME]; } else { StrAllocCopy(I_name, value[HTML_INPUT_NAME]); UNESCAPE_FIELDNAME_TO_STD(&I_name); I.name = I_name; } if ((present && present[HTML_INPUT_ALT] && non_empty(value[HTML_INPUT_ALT]) && I.type && !strcasecomp(I.type, "image")) && !(present && present[HTML_INPUT_VALUE] && non_empty(value[HTML_INPUT_VALUE]))) { /* * This is a TYPE="image" using an ALT rather than VALUE * attribute to indicate the link string for text clients or * GUIs with image loading off, so set the flag to use that as * if it were a VALUE attribute. - FM */ UseALTasVALUE = TRUE; } if (verbose_img && !clickable_images && present && present[HTML_INPUT_SRC] && non_empty(value[HTML_INPUT_SRC]) && I.type && !strcasecomp(I.type, "image")) { ImageSrc = MakeNewImageValue(value); } else if (clickable_images == TRUE && present && present[HTML_INPUT_SRC] && non_empty(value[HTML_INPUT_SRC]) && I.type && !strcasecomp(I.type, "image")) { StrAllocCopy(href, value[HTML_INPUT_SRC]); /* * We have a TYPE="image" with a non-zero-length SRC attribute * and want clickable images. Make the SRC's value a link if * it's still not zero-length legitimizing it. - FM */ LYLegitimizeHREF(me, &href, TRUE, TRUE); if (*href) { if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } me->CurrentA = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ NULL, /* Tag */ href, /* Addresss */ (HTLinkType *) 0); /* Type */ HText_beginAnchor(me->text, me->inUnderline, me->CurrentA); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_START_CHAR); HTML_put_string(me, VERBOSE_IMG(value, HTML_INPUT_SRC, "[IMAGE]")); FREE(newtitle); if (me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, 0); HTML_put_character(me, '-'); HaveSRClink = TRUE; } FREE(href); } CTRACE((tfp, "2.Ok, we're trying type=[%s] (present=%p)\n", NONNULL(I.type), (const void *) present)); /* text+file don't go in here */ if ((UseALTasVALUE == TRUE) || (present && present[HTML_INPUT_VALUE] && value[HTML_INPUT_VALUE] && (*value[HTML_INPUT_VALUE] || (I.type && (!strcasecomp(I.type, "checkbox") || !strcasecomp(I.type, "radio")))))) { /* * Convert any HTML entities or decimal escaping. - FM */ int CurrentCharSet = current_char_set; BOOL CurrentEightBitRaw = HTPassEightBitRaw; BOOLEAN CurrentUseDefaultRawMode = LYUseDefaultRawMode; HTCJKlang CurrentHTCJK = HTCJK; if (I.type && !strcasecomp(I.type, "hidden")) { me->HiddenValue = TRUE; current_char_set = LATIN1; /* Default ISO-Latin1 */ LYUseDefaultRawMode = TRUE; HTMLSetCharacterHandling(current_char_set); } CTRACE((tfp, "3.Ok, we're trying type=[%s]\n", NONNULL(I.type))); if (!I.type) me->UsePlainSpace = TRUE; else if (!strcasecomp(I.type, "text") || #ifdef USE_FILE_UPLOAD !strcasecomp(I.type, "file") || #endif !strcasecomp(I.type, "submit") || !strcasecomp(I.type, "image") || !strcasecomp(I.type, "reset")) { CTRACE((tfp, "normal field type: %s\n", NONNULL(I.type))); me->UsePlainSpace = TRUE; } StrAllocCopy(I_value, ((UseALTasVALUE == TRUE) ? value[HTML_INPUT_ALT] : value[HTML_INPUT_VALUE])); if (me->UsePlainSpace && !me->HiddenValue) { I.value_cs = current_char_set; } CTRACE((tfp, "4.Ok, we're trying type=[%s]\n", NONNULL(I.type))); TRANSLATE_AND_UNESCAPE_ENTITIES6(&I_value, ATTR_CS_IN, I.value_cs, (BOOL) (me->UsePlainSpace && !me->HiddenValue), me->UsePlainSpace, me->HiddenValue); I.value = I_value; if (me->UsePlainSpace == TRUE) { /* * Convert any newlines or tabs to spaces, and trim any * lead or trailing spaces. - FM */ LYReduceBlanks(I.value); } me->UsePlainSpace = FALSE; if (I.type && !strcasecomp(I.type, "hidden")) { me->HiddenValue = FALSE; current_char_set = CurrentCharSet; LYUseDefaultRawMode = CurrentUseDefaultRawMode; HTMLSetCharacterHandling(current_char_set); HTPassEightBitRaw = CurrentEightBitRaw; HTCJK = CurrentHTCJK; } } else if (HaveSRClink == TRUE) { /* * We put up an [IMAGE] link and '-' for a TYPE="image" and * didn't get a VALUE or ALT string, so fake a "Submit" value. * If we didn't put up a link, then HText_beginInput() will use * "[IMAGE]-Submit". - FM */ StrAllocCopy(I_value, "Submit"); I.value = I_value; } else if (ImageSrc) { /* [IMAGE]-Submit with verbose images and not clickable images. * Use ImageSrc if no other alt or value is supplied. --LE */ I.value = ImageSrc; } if (present && present[HTML_INPUT_READONLY]) I.readonly = YES; if (present && present[HTML_INPUT_CHECKED]) I.checked = YES; if (present && present[HTML_INPUT_SIZE] && non_empty(value[HTML_INPUT_SIZE])) I.size = atoi(value[HTML_INPUT_SIZE]); LimitValue(I.size, MAX_LINE); if (present && present[HTML_INPUT_MAXLENGTH] && non_empty(value[HTML_INPUT_MAXLENGTH])) I.maxlength = value[HTML_INPUT_MAXLENGTH]; if (present && present[HTML_INPUT_DISABLED]) I.disabled = YES; if (present && present[HTML_INPUT_ACCEPT_CHARSET]) { /* Not yet used. */ I.accept_cs = (value[HTML_INPUT_ACCEPT_CHARSET] ? value[HTML_INPUT_ACCEPT_CHARSET] : "UNKNOWN"); } if (present && present[HTML_INPUT_ALIGN] && /* Not yet used. */ non_empty(value[HTML_INPUT_ALIGN])) I.align = value[HTML_INPUT_ALIGN]; if (present && present[HTML_INPUT_CLASS] && /* Not yet used. */ non_empty(value[HTML_INPUT_CLASS])) I.iclass = value[HTML_INPUT_CLASS]; if (present && present[HTML_INPUT_ERROR] && /* Not yet used. */ non_empty(value[HTML_INPUT_ERROR])) I.error = value[HTML_INPUT_ERROR]; if (present && present[HTML_INPUT_HEIGHT] && /* Not yet used. */ non_empty(value[HTML_INPUT_HEIGHT])) I.height = value[HTML_INPUT_HEIGHT]; if (present && present[HTML_INPUT_WIDTH] && /* Not yet used. */ non_empty(value[HTML_INPUT_WIDTH])) I.width = value[HTML_INPUT_WIDTH]; if (present && present[HTML_INPUT_ID] && non_empty(value[HTML_INPUT_ID])) { I.id = value[HTML_INPUT_ID]; CHECK_ID(HTML_INPUT_ID); } if (present && present[HTML_INPUT_LANG] && /* Not yet used. */ non_empty(value[HTML_INPUT_LANG])) I.lang = value[HTML_INPUT_LANG]; if (present && present[HTML_INPUT_MD] && /* Not yet used. */ non_empty(value[HTML_INPUT_MD])) I.md = value[HTML_INPUT_MD]; chars = HText_beginInput(me->text, me->inUnderline, &I); CTRACE((tfp, "I.%s have %d chars, or something\n", NONNULL(I.type), chars)); /* * Submit and reset buttons have values which don't change, so * HText_beginInput() sets I.value to the string which should be * displayed, and we'll enter that instead of underscore * placeholders into the HText structure to see it instead of * underscores when dumping or printing. We also won't worry about * a wrap in PRE blocks, because the line editor never is invoked * for submit or reset buttons. - LE & FM */ if (I.type && (!strcasecomp(I.type, "submit") || !strcasecomp(I.type, "reset") || !strcasecomp(I.type, "image"))) IsSubmitOrReset = TRUE; if (I.type && chars == 3 && !strcasecomp(I.type, "radio")) { /* * Put a (_) placeholder, and one space (collapsible) before * the label that is expected to follow. - FM */ HTML_put_string(me, "(_)"); HText_endInput(me->text); chars = 0; me->in_word = YES; if (me->sp[0].tag_number != HTML_PRE && me->sp->style->freeFormat) { HTML_put_character(me, ' '); me->in_word = NO; } } else if (I.type && chars == 3 && !strcasecomp(I.type, "checkbox")) { /* * Put a [_] placeholder, and one space (collapsible) before * the label that is expected to follow. - FM */ HTML_put_string(me, "[_]"); HText_endInput(me->text); chars = 0; me->in_word = YES; if (me->sp[0].tag_number != HTML_PRE && me->sp->style->freeFormat) { HTML_put_character(me, ' '); me->in_word = NO; } } else if ((me->sp[0].tag_number == HTML_PRE || !me->sp->style->freeFormat) && chars > 6 && IsSubmitOrReset == FALSE) { /* * This is not a submit or reset button, and we are in a PRE * block with a field intended to exceed 6 character widths. * The code inadequately handles INPUT fields in PRE tags if * wraps occur (at the right margin) for the underscore * placeholders. We'll put up a minimum of 6 underscores, * since we should have wrapped artificially, above, if the * INPUT begins within 6 columns of the right margin, and if * any more would exceed the wrap column, we'll ignore them. * Note that if we somehow get tripped up and a wrap still does * occur before all 6 of the underscores are output, the * wrapped ones won't be treated as part of the editing window, * nor be highlighted when not editing (Yuk!). - FM */ for (i = 0; i < 6; i++) { HTML_put_character(me, '_'); chars--; } } CTRACE((tfp, "I.%s, %d\n", NONNULL(I.type), IsSubmitOrReset)); if (IsSubmitOrReset == FALSE) { /* * This is not a submit or reset button, so output the rest of * the underscore placeholders, if any more are needed. - FM */ if (chars > 0) { for (; chars > 0; chars--) HTML_put_character(me, '_'); HText_endInput(me->text); } } else { if (HTCJK == JAPANESE) { kcode = HText_getKcode(me->text); HText_updateKcode(me->text, kanji_code); specified_kcode = HText_getSpecifiedKcode(me->text); HText_updateSpecifiedKcode(me->text, kanji_code); } if (me->sp[0].tag_number == HTML_PRE || !me->sp->style->freeFormat) { /* * We have a submit or reset button in a PRE block, so * output the entire value from the markup. If it extends * to the right margin, it will wrap there, and only the * portion before that wrap will be highlighted on screen * display (Yuk!) but we may as well show the rest of the * full value on the next or more lines. - FM */ while (I.value[i]) HTML_put_character(me, I.value[i++]); } else { /* * The submit or reset button is not in a PRE block. Note * that if a wrap occurs before outputting the entire * value, the wrapped portion will not be highlighted or * clearly indicated as part of the link for submission or * reset (Yuk!). We'll replace any spaces in the submit or * reset button value with nbsp, to promote a wrap at the * space we ensured would be present before the start of * the string, as when we use all underscores instead of * the INPUT's actual value, but we could still get a wrap * at the right margin, instead, if the value is greater * than a line width for the current style. Also, if chars * somehow ended up longer than the length of the actual * value (shouldn't have), we'll continue padding with nbsp * up to the length of chars. - FM */ for (i = 0; I.value[i]; i++) HTML_put_character(me, (char) (I.value[i] == ' ' ? HT_NON_BREAK_SPACE : I.value[i])); while (i++ < chars) HTML_put_character(me, HT_NON_BREAK_SPACE); } if (HTCJK == JAPANESE) { HText_updateKcode(me->text, kcode); HText_updateSpecifiedKcode(me->text, specified_kcode); } } if (chars != 0) { HText_endInput(me->text); } FREE(ImageSrc); if (strcasecomp(NonNull(I.type), "submit")) FREE(I_value); FREE(I_name); } break; case HTML_TEXTAREA: /* * Set to know we are in a textarea. */ me->inTEXTAREA = TRUE; /* * Get ready for the value. */ HTChunkClear(&me->textarea); if (present && present[HTML_TEXTAREA_NAME] && value[HTML_TEXTAREA_NAME]) { StrAllocCopy(me->textarea_name, value[HTML_TEXTAREA_NAME]); me->textarea_name_cs = ATTR_CS_IN; if (StrChr(value[HTML_TEXTAREA_NAME], '&') != NULL) { UNESCAPE_FIELDNAME_TO_STD(&me->textarea_name); } } else { StrAllocCopy(me->textarea_name, ""); } if (present && present[HTML_TEXTAREA_ACCEPT_CHARSET]) { if (value[HTML_TEXTAREA_ACCEPT_CHARSET]) { StrAllocCopy(me->textarea_accept_cs, value[HTML_TEXTAREA_ACCEPT_CHARSET]); TRANSLATE_AND_UNESCAPE_TO_STD(&me->textarea_accept_cs); } else { StrAllocCopy(me->textarea_accept_cs, "UNKNOWN"); } } else { FREE(me->textarea_accept_cs); } if (present && present[HTML_TEXTAREA_COLS] && value[HTML_TEXTAREA_COLS] && isdigit(UCH(*value[HTML_TEXTAREA_COLS]))) { me->textarea_cols = atoi(value[HTML_TEXTAREA_COLS]); } else { int width; width = LYcolLimit - me->new_style->leftIndent - me->new_style->rightIndent; if (dump_output_immediately) /* don't waste too much for this */ width = HTMIN(width, DFT_TEXTAREA_COLS); if (width > 1 && (width - 1) * 6 < MAX_LINE - 3 - me->new_style->leftIndent - me->new_style->rightIndent) me->textarea_cols = width; else me->textarea_cols = DFT_TEXTAREA_COLS; } LimitValue(me->textarea_cols, MAX_TEXTAREA_COLS); if (present && present[HTML_TEXTAREA_ROWS] && value[HTML_TEXTAREA_ROWS] && isdigit(UCH(*value[HTML_TEXTAREA_ROWS]))) { me->textarea_rows = atoi(value[HTML_TEXTAREA_ROWS]); } else { me->textarea_rows = DFT_TEXTAREA_ROWS; } LimitValue(me->textarea_rows, MAX_TEXTAREA_ROWS); /* * Lynx treats disabled and readonly textarea's the same - * unmodifiable in either case. */ me->textarea_readonly = NO; if (present && present[HTML_TEXTAREA_READONLY]) me->textarea_readonly = YES; me->textarea_disabled = NO; if (present && present[HTML_TEXTAREA_DISABLED]) me->textarea_disabled = YES; if (present && present[HTML_TEXTAREA_ID] && non_empty(value[HTML_TEXTAREA_ID])) { StrAllocCopy(id_string, value[HTML_TEXTAREA_ID]); TRANSLATE_AND_UNESCAPE_TO_STD(&id_string); if ((*id_string != '\0') && (ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ id_string, /* Tag */ NULL, /* Addresss */ (HTLinkType *) 0))) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); StrAllocCopy(me->textarea_id, id_string); } else { FREE(me->textarea_id); } FREE(id_string); } else { FREE(me->textarea_id); } break; case HTML_SELECT: /* * Check for an already open SELECT block. - FM */ if (me->inSELECT) { if (LYBadHTML(me)) { LYShowBadHTML("Bad HTML: SELECT start tag in SELECT element. Faking SELECT end tag. *****\n"); } if (me->sp->tag_number != HTML_SELECT) { SET_SKIP_STACK(HTML_SELECT); } HTML_end_element(me, HTML_SELECT, include); } /* * Start a new SELECT block. - FM */ LYHandleSELECT(me, present, (STRING2PTR) value, include, TRUE); break; case HTML_OPTION: { /* * An option is a special case of an input field. */ InputFieldData I; /* * Make sure we're in a select tag. */ if (!me->inSELECT) { if (LYBadHTML(me)) { LYShowBadHTML("Bad HTML: OPTION tag not within SELECT tag\n"); } /* * Too likely to cause a crash, so we'll ignore it. - FM */ break; } if (!me->first_option) { /* * Finish the data off. */ HTChunkTerminate(&me->option); /* * Finish the previous option @@@@@ */ HText_setLastOptionValue(me->text, me->option.data, me->LastOptionValue, MIDDLE_ORDER, me->LastOptionChecked, me->UCLYhndl, ATTR_CS_IN); } /* * If it's not a multiple option list and select popups are * enabled, then don't use the checkbox/button method, and don't * put anything on the screen yet. */ if (me->first_option || HTCurSelectGroupType == F_CHECKBOX_TYPE || LYSelectPopups == FALSE) { if (HTCurSelectGroupType == F_CHECKBOX_TYPE || LYSelectPopups == FALSE) { /* * Start a newline before each option. */ LYEnsureSingleSpace(me); } else { /* * Add option list designation character. */ HText_appendCharacter(me->text, '['); me->in_word = YES; } /* * Inititialize. */ memset(&I, 0, sizeof(I)); I.name_cs = -1; I.value_cs = current_char_set; I.type = "OPTION"; if ((present && present[HTML_OPTION_SELECTED]) || (me->first_option && LYSelectPopups == FALSE && HTCurSelectGroupType == F_RADIO_TYPE)) I.checked = YES; if (present && present[HTML_OPTION_VALUE] && value[HTML_OPTION_VALUE]) { /* * Convert any HTML entities or decimal escaping. - FM */ StrAllocCopy(I_value, value[HTML_OPTION_VALUE]); me->HiddenValue = TRUE; TRANSLATE_AND_UNESCAPE_ENTITIES6(&I_value, ATTR_CS_IN, ATTR_CS_IN, NO, me->UsePlainSpace, me->HiddenValue); I.value_cs = ATTR_CS_IN; me->HiddenValue = FALSE; I.value = I_value; } if (me->select_disabled || (0 && present && present[HTML_OPTION_DISABLED])) { /* 2009/5/25 - suppress check for "disabled" attribute * for Debian #525934 -TD */ I.disabled = YES; } if (present && present[HTML_OPTION_ID] && non_empty(value[HTML_OPTION_ID])) { if ((ID_A = HTAnchor_findChildAndLink(me->node_anchor, /* Parent */ value[HTML_OPTION_ID], /* Tag */ NULL, /* Addresss */ 0)) != NULL) { /* Type */ HText_beginAnchor(me->text, me->inUnderline, ID_A); HText_endAnchor(me->text, 0); I.id = value[HTML_OPTION_ID]; } } HText_beginInput(me->text, me->inUnderline, &I); if (HTCurSelectGroupType == F_CHECKBOX_TYPE) { /* * Put a "[_]" placeholder, and one space (collapsible) * before the label that is expected to follow. - FM */ HText_appendCharacter(me->text, '['); HText_appendCharacter(me->text, '_'); HText_appendCharacter(me->text, ']'); HText_appendCharacter(me->text, ' '); HText_setLastChar(me->text, ' '); /* absorb white space */ me->in_word = NO; } else if (LYSelectPopups == FALSE) { /* * Put a "(_)" placeholder, and one space (collapsible) * before the label that is expected to follow. - FM */ HText_appendCharacter(me->text, '('); HText_appendCharacter(me->text, '_'); HText_appendCharacter(me->text, ')'); HText_appendCharacter(me->text, ' '); HText_setLastChar(me->text, ' '); /* absorb white space */ me->in_word = NO; } } /* * Get ready for the next value. */ HTChunkClear(&me->option); if ((present && present[HTML_OPTION_SELECTED]) || (me->first_option && LYSelectPopups == FALSE && HTCurSelectGroupType == F_RADIO_TYPE)) me->LastOptionChecked = TRUE; else me->LastOptionChecked = FALSE; me->first_option = FALSE; if (present && present[HTML_OPTION_VALUE] && value[HTML_OPTION_VALUE]) { if (!I_value) { /* * Convert any HTML entities or decimal escaping. - FM */ StrAllocCopy(I_value, value[HTML_OPTION_VALUE]); me->HiddenValue = TRUE; TRANSLATE_AND_UNESCAPE_ENTITIES6(&I_value, ATTR_CS_IN, ATTR_CS_IN, NO, me->UsePlainSpace, me->HiddenValue); me->HiddenValue = FALSE; } StrAllocCopy(me->LastOptionValue, I_value); } else { StrAllocCopy(me->LastOptionValue, me->option.data); } /* * If this is a popup option, print its option for use in selecting * option by number. - LE */ if (HTCurSelectGroupType == F_RADIO_TYPE && LYSelectPopups && fields_are_numbered()) { char marker[8]; int opnum = HText_getOptionNum(me->text); if (opnum > 0 && opnum < 100000) { sprintf(marker, "(%d)", opnum); HTML_put_string(me, marker); for (i = (int) strlen(marker); i < 5; ++i) { HTML_put_character(me, '_'); } } } FREE(I_value); } break; case HTML_TABLE: /* * Not fully implemented. Just treat as a division with respect to any * ALIGN attribute, with a default of HT_LEFT, or leave as a PRE block * if we are presently in one. - FM * * Also notify simple table tracking code unless in a preformatted * section, or (currently) non-left alignment. * * If page author is using a TABLE within PRE, it's probably formatted * specifically to work well for Lynx without simple table tracking * code. Cancel tracking, it would only make things worse. - kw */ #ifdef EXP_NESTED_TABLES if (!nested_tables) #endif { HText_cancelStbl(me->text); } if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } if (me->Underline_Level > 0) { SET_SKIP_STACK(HTML_U); HTML_end_element(me, HTML_U, include); } me->inTABLE = TRUE; if (me->sp->style->id == ST_Preformatted) { UPDATE_STYLE; CHECK_ID(HTML_TABLE_ID); break; } if (me->Division_Level < (MAX_NESTING - 1)) { me->Division_Level++; } else { CTRACE((tfp, "HTML: ****** Maximum nesting of %d divisions/tables exceeded!\n", MAX_NESTING)); } if (present && present[HTML_TABLE_ALIGN] && non_empty(value[HTML_TABLE_ALIGN])) { if (!strcasecomp(value[HTML_TABLE_ALIGN], "center")) { if (no_table_center) { me->DivisionAlignments[me->Division_Level] = HT_LEFT; change_paragraph_style(me, styles[HTML_DLEFT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DLEFT]->alignment; } else { me->DivisionAlignments[me->Division_Level] = HT_CENTER; change_paragraph_style(me, styles[HTML_DCENTER]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DCENTER]->alignment; } stbl_align = HT_CENTER; } else if (!strcasecomp(value[HTML_TABLE_ALIGN], "right")) { me->DivisionAlignments[me->Division_Level] = HT_RIGHT; change_paragraph_style(me, styles[HTML_DRIGHT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DRIGHT]->alignment; stbl_align = HT_RIGHT; } else { me->DivisionAlignments[me->Division_Level] = HT_LEFT; change_paragraph_style(me, styles[HTML_DLEFT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DLEFT]->alignment; if (!strcasecomp(value[HTML_TABLE_ALIGN], "left") || !strcasecomp(value[HTML_TABLE_ALIGN], "justify")) stbl_align = HT_LEFT; } } else { me->DivisionAlignments[me->Division_Level] = HT_LEFT; change_paragraph_style(me, styles[HTML_DLEFT]); UPDATE_STYLE; me->current_default_alignment = styles[HTML_DLEFT]->alignment; /* stbl_align remains HT_ALIGN_NONE */ } CHECK_ID(HTML_TABLE_ID); HText_startStblTABLE(me->text, stbl_align); break; case HTML_TR: /* * Not fully implemented. Just start a new row, if needed, act on an * ALIGN attribute if present, and check for an ID link. - FM * Also notify simple table tracking code. - kw */ if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } if (me->Underline_Level > 0) { SET_SKIP_STACK(HTML_U); HTML_end_element(me, HTML_U, include); } UPDATE_STYLE; if (!HText_LastLineEmpty(me->text, FALSE)) { HText_setLastChar(me->text, ' '); /* absorb white space */ HText_appendCharacter(me->text, '\r'); } me->in_word = NO; if (me->sp->style->id == ST_Preformatted) { CHECK_ID(HTML_TR_ID); me->inP = FALSE; break; } if (LYoverride_default_alignment(me)) { me->sp->style->alignment = styles[me->sp[0].tag_number]->alignment; } else if (me->List_Nesting_Level >= 0 || ((me->Division_Level < 0) && (me->sp->style->id == ST_Normal || me->sp->style->id == ST_Preformatted))) { me->sp->style->alignment = HT_LEFT; } else { me->sp->style->alignment = (short) me->current_default_alignment; } if (present && present[HTML_TR_ALIGN] && value[HTML_TR_ALIGN]) { if (!strcasecomp(value[HTML_TR_ALIGN], "center") && !(me->List_Nesting_Level >= 0 && !me->inP)) { if (no_table_center) me->sp->style->alignment = HT_LEFT; else me->sp->style->alignment = HT_CENTER; stbl_align = HT_CENTER; } else if (!strcasecomp(value[HTML_TR_ALIGN], "right") && !(me->List_Nesting_Level >= 0 && !me->inP)) { me->sp->style->alignment = HT_RIGHT; stbl_align = HT_RIGHT; } else if (!strcasecomp(value[HTML_TR_ALIGN], "left") || !strcasecomp(value[HTML_TR_ALIGN], "justify")) { me->sp->style->alignment = HT_LEFT; stbl_align = HT_LEFT; } } CHECK_ID(HTML_TR_ID); me->inP = FALSE; HText_startStblTR(me->text, stbl_align); break; case HTML_THEAD: case HTML_TFOOT: case HTML_TBODY: HText_endStblTR(me->text); /* * Not fully implemented. Just check for an ID link. - FM */ if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } if (me->Underline_Level > 0) { SET_SKIP_STACK(HTML_U); HTML_end_element(me, HTML_U, include); } UPDATE_STYLE; if (me->inTABLE) { if (present && present[HTML_TR_ALIGN] && value[HTML_TR_ALIGN]) { if (!strcasecomp(value[HTML_TR_ALIGN], "center")) { stbl_align = HT_CENTER; } else if (!strcasecomp(value[HTML_TR_ALIGN], "right")) { stbl_align = HT_RIGHT; } else if (!strcasecomp(value[HTML_TR_ALIGN], "left") || !strcasecomp(value[HTML_TR_ALIGN], "justify")) { stbl_align = HT_LEFT; } } HText_startStblRowGroup(me->text, stbl_align); } CHECK_ID(HTML_TR_ID); break; case HTML_COL: case HTML_COLGROUP: /* * Not fully implemented. Just check for an ID link. - FM */ if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } if (me->Underline_Level > 0) { SET_SKIP_STACK(HTML_U); HTML_end_element(me, HTML_U, include); } UPDATE_STYLE; if (me->inTABLE) { int span = 1; if (present && present[HTML_COL_SPAN] && value[HTML_COL_SPAN] && isdigit(UCH(*value[HTML_COL_SPAN]))) span = atoi(value[HTML_COL_SPAN]); if (present && present[HTML_COL_ALIGN] && value[HTML_COL_ALIGN]) { if (!strcasecomp(value[HTML_COL_ALIGN], "center")) { stbl_align = HT_CENTER; } else if (!strcasecomp(value[HTML_COL_ALIGN], "right")) { stbl_align = HT_RIGHT; } else if (!strcasecomp(value[HTML_COL_ALIGN], "left") || !strcasecomp(value[HTML_COL_ALIGN], "justify")) { stbl_align = HT_LEFT; } } HText_startStblCOL(me->text, span, stbl_align, (BOOL) (ElementNumber == HTML_COLGROUP)); } CHECK_ID(HTML_COL_ID); break; case HTML_TH: case HTML_TD: if (me->inA) { SET_SKIP_STACK(HTML_A); HTML_end_element(me, HTML_A, include); } if (me->Underline_Level > 0) { SET_SKIP_STACK(HTML_U); HTML_end_element(me, HTML_U, include); } UPDATE_STYLE; CHECK_ID(HTML_TD_ID); /* * Not fully implemented. Just add a collapsible space and break - FM * Also notify simple table tracking code. - kw */ HTML_put_character(me, ' '); { int colspan = 1, rowspan = 1; if (present && present[HTML_TD_COLSPAN] && value[HTML_TD_COLSPAN] && isdigit(UCH(*value[HTML_TD_COLSPAN]))) colspan = atoi(value[HTML_TD_COLSPAN]); if (present && present[HTML_TD_ROWSPAN] && value[HTML_TD_ROWSPAN] && isdigit(UCH(*value[HTML_TD_ROWSPAN]))) rowspan = atoi(value[HTML_TD_ROWSPAN]); if (present && present[HTML_TD_ALIGN] && value[HTML_TD_ALIGN]) { if (!strcasecomp(value[HTML_TD_ALIGN], "center")) { stbl_align = HT_CENTER; } else if (!strcasecomp(value[HTML_TD_ALIGN], "right")) { stbl_align = HT_RIGHT; } else if (!strcasecomp(value[HTML_TD_ALIGN], "left") || !strcasecomp(value[HTML_TD_ALIGN], "justify")) { stbl_align = HT_LEFT; } } HText_startStblTD(me->text, colspan, rowspan, stbl_align, (BOOL) (ElementNumber == HTML_TH)); } me->in_word = NO; break; case HTML_MATH: /* * We're getting it as Literal text, which, until we can process it, * we'll display as is, within brackets to alert the user. - FM */ HTChunkClear(&me->math); CHECK_ID(HTML_GEN_ID); break; default: break; } /* end switch */ if (ElementNumber >= HTML_ELEMENTS || HTML_dtd.tags[ElementNumber].contents != SGML_EMPTY) { if (me->skip_stack > 0) { CTRACE((tfp, "HTML:begin_element: internal call (level %d), leaving on stack - `%s'\n", me->skip_stack, NONNULL(GetHTStyleName(me->sp->style)))); me->skip_stack--; return status; } if (me->sp == me->stack) { if (me->stack_overrun == FALSE) { HTAlert(HTML_STACK_OVERRUN); CTRACE((tfp, "HTML: ****** Maximum nesting of %d tags exceeded!\n", MAX_NESTING)); me->stack_overrun = TRUE; } return HT_ERROR; } CTRACE((tfp, "HTML:begin_element[%d]: adding style to stack - %s (%s)\n", (int) STACKLEVEL(me), NONNULL(GetHTStyleName(me->new_style)), HTML_dtd.tags[ElementNumber].name)); (me->sp)--; me->sp[0].style = me->new_style; /* Stack new style */ me->sp[0].tag_number = ElementNumber; #ifdef USE_JUSTIFY_ELTS if (wait_for_this_stacked_elt < 0 && HTML_dtd.tags[ElementNumber].can_justify == FALSE) wait_for_this_stacked_elt = (int) (me->stack - me->sp) + MAX_NESTING; #endif } #ifdef USE_JUSTIFY_ELTS if (in_DT && ElementNumber == HTML_DD) in_DT = FALSE; else if (ElementNumber == HTML_DT) in_DT = TRUE; #endif #if defined(USE_COLOR_STYLE) /* end really empty tags straight away */ if (ReallyEmptyTagNum(element_number)) { CTRACE2(TRACE_STYLE, (tfp, "STYLE.begin_element:ending \"EMPTY\" element style\n")); HText_characterStyle(me->text, hcode, STACK_OFF); FastTrimColorClass(HTML_dtd.tags[element_number].name, HTML_dtd.tags[element_number].name_len, Style_className, &Style_className_end, &hcode); } #endif /* USE_COLOR_STYLE */ return status; } /* End Element * ----------- * * When we end an element, the style must be returned to that * in effect before that element. Note that anchors (etc?) * don't have an associated style, so that we must scan down the * stack for an element with a defined style. (In fact, the styles * should be linked to the whole stack not just the top one.) * TBL 921119 */ static int HTML_end_element(HTStructured * me, int element_number, char **include) { static char empty[1]; int i = 0; int status = HT_OK; char *temp = NULL, *cp = NULL; BOOL BreakFlag = FALSE; BOOL intern_flag = FALSE; #ifdef USE_COLOR_STYLE BOOL skip_stack_requested = FALSE; #endif EMIT_IFDEF_USE_JUSTIFY_ELTS(BOOL reached_awaited_stacked_elt = FALSE); if ((me->sp >= (me->stack + MAX_NESTING - 1) || element_number != me->sp[0].tag_number) && HTML_dtd.tags[element_number].contents != SGML_EMPTY) { CTRACE((tfp, "HTML: end of element %s when expecting end of %s\n", HTML_dtd.tags[element_number].name, (me->sp == me->stack + MAX_NESTING - 1) ? "none" : (me->sp->tag_number < 0) ? "*invalid tag*" : (me->sp->tag_number >= HTML_ELEMENTS) ? "special tag" : HTML_dtd.tags[me->sp->tag_number].name)); } /* * If we're seeking MAPs, skip everything that's not a MAP or AREA tag. - * FM */ if (LYMapsOnly) { if (!(element_number == HTML_MAP || element_number == HTML_AREA || element_number == HTML_OBJECT)) { return HT_OK; } } /* * Pop state off stack if we didn't declare the element SGML_EMPTY in * HTMLDTD.c. - FM & KW */ if (HTML_dtd.tags[element_number].contents != SGML_EMPTY) { #ifdef USE_COLOR_STYLE skip_stack_requested = (BOOL) (me->skip_stack > 0); #endif if ((element_number != me->sp[0].tag_number) && me->skip_stack <= 0 && HTML_dtd.tags[HTML_LH].contents != SGML_EMPTY && (me->sp[0].tag_number == HTML_UL || me->sp[0].tag_number == HTML_OL || me->sp[0].tag_number == HTML_MENU || me->sp[0].tag_number == HTML_DIR || me->sp[0].tag_number == HTML_LI) && (element_number == HTML_H1 || element_number == HTML_H2 || element_number == HTML_H3 || element_number == HTML_H4 || element_number == HTML_H5 || element_number == HTML_H6)) { /* * Set the break flag if we're popping a dummy HTML_LH substituted * for an HTML_H# encountered in a list. */ BreakFlag = TRUE; } if (me->skip_stack == 0 && element_number == HTML_OBJECT && me->sp[0].tag_number == HTML_OBJECT_M && (me->sp < (me->stack + MAX_NESTING - 1))) me->sp[0].tag_number = HTML_OBJECT; if (me->skip_stack > 0) { CTRACE2(TRACE_STYLE, (tfp, "HTML:end_element: Internal call (level %d), leaving on stack - %s\n", me->skip_stack, NONNULL(GetHTStyleName(me->sp->style)))); me->skip_stack--; } else if (element_number == HTML_OBJECT && me->sp[0].tag_number != HTML_OBJECT && me->sp[0].tag_number != HTML_OBJECT_M && me->objects_mixed_open > 0 && !(me->objects_figged_open > 0 && me->sp[0].tag_number == HTML_FIG)) { /* * Ignore non-corresponding OBJECT tags that we didn't push because * the SGML parser was supposed to go on parsing the contents * non-literally. - kw */ CTRACE2(TRACE_STYLE, (tfp, "HTML:end_element[%d]: %s (level %d), %s - %s\n", (int) STACKLEVEL(me), "Special OBJECT handling", me->objects_mixed_open, "leaving on stack", NONNULL(GetHTStyleName(me->sp->style)))); me->objects_mixed_open--; } else if (me->stack_overrun == TRUE && element_number != me->sp[0].tag_number) { /* * Ignore non-corresponding tags if we had a stack overrun. This * is not a completely fail-safe strategy for protection against * any seriously adverse consequences of a stack overrun, and the * rendering of the document will not be as intended, but we expect * overruns to be rare, and this should offer reasonable protection * against crashes if an overrun does occur. - FM */ return HT_OK; /* let's pretend... */ } else if (element_number == HTML_SELECT && me->sp[0].tag_number != HTML_SELECT) { /* * Ignore non-corresponding SELECT tags, since we probably popped * it and closed the SELECT block to deal with markup which amounts * to a nested SELECT, or an out of order FORM end tag. - FM */ return HT_OK; } else if ((element_number != me->sp[0].tag_number) && HTML_dtd.tags[HTML_LH].contents == SGML_EMPTY && (me->sp[0].tag_number == HTML_UL || me->sp[0].tag_number == HTML_OL || me->sp[0].tag_number == HTML_MENU || me->sp[0].tag_number == HTML_DIR || me->sp[0].tag_number == HTML_LI) && (element_number == HTML_H1 || element_number == HTML_H2 || element_number == HTML_H3 || element_number == HTML_H4 || element_number == HTML_H5 || element_number == HTML_H6)) { /* * It's an H# for which we substituted an HTML_LH, which we've * declared as SGML_EMPTY, so just return. - FM */ return HT_OK; } else if (me->sp < (me->stack + MAX_NESTING - 1)) { #ifdef USE_JUSTIFY_ELTS if (wait_for_this_stacked_elt == me->stack - me->sp + MAX_NESTING) reached_awaited_stacked_elt = TRUE; #endif if (element_number == HTML_OBJECT) { if (me->sp[0].tag_number == HTML_FIG && me->objects_figged_open > 0) { /* * It's an OBJECT for which we substituted a FIG, so pop * the FIG and pretend that's what we are being called for. * - kw */ CTRACE2(TRACE_STYLE, (tfp, "HTML:end_element[%d]: %s (level %d), %s - %s\n", (int) STACKLEVEL(me), "Special OBJECT->FIG handling", me->objects_figged_open, "treating as end FIG", NONNULL(GetHTStyleName(me->sp->style)))); me->objects_figged_open--; element_number = HTML_FIG; } } (me->sp)++; CTRACE2(TRACE_STYLE, (tfp, "HTML:end_element[%d]: Popped style off stack - %s\n", (int) STACKLEVEL(me), NONNULL(GetHTStyleName(me->sp->style)))); } else { CTRACE2(TRACE_STYLE, (tfp, "Stack underflow error! Tried to pop off more styles than exist in stack\n")); } } if (BreakFlag == TRUE) { #ifdef USE_JUSTIFY_ELTS if (reached_awaited_stacked_elt) wait_for_this_stacked_elt = -1; #endif return HT_OK; /* let's pretend... */ } /* * Check for unclosed TEXTAREA. - FM */ if (me->inTEXTAREA && element_number != HTML_TEXTAREA) { if (LYBadHTML(me)) { LYShowBadHTML("Bad HTML: Missing TEXTAREA end tag\n"); } } if (!me->text && !LYMapsOnly) { UPDATE_STYLE; } /* * Handle the end tag. - FM */ switch (element_number) { case HTML_HTML: if (me->inA || me->inSELECT || me->inTEXTAREA) { if (LYBadHTML(me)) { char *msg = NULL; HTSprintf0(&msg, "Bad HTML: %s%s%s%s%s not closed before HTML end tag *****\n", me->inSELECT ? "SELECT" : "", (me->inSELECT && me->inTEXTAREA) ? ", " : "", me->inTEXTAREA ? "TEXTAREA" : "", (((me->inSELECT || me->inTEXTAREA) && me->inA) ? ", " : ""), me->inA ? "A" : ""); LYShowBadHTML(msg); FREE(msg); } } break; case HTML_HEAD: if (me->inBASE && (LYIsUIPage3(me->node_anchor->address, UIP_LIST_PAGE, 0) || LYIsUIPage3(me->node_anchor->address, UIP_ADDRLIST_PAGE, 0))) { /* If we are parsing the List Page, and have a BASE after we are * done with the HEAD element, propagate it back to the node_anchor * object. The base should have been inserted by showlist() to * record what document the List Page is about, and other functions * may later look for it in the anchor. - kw */ StrAllocCopy(me->node_anchor->content_base, me->base_href); } if (HText_hasToolbar(me->text)) HText_appendParagraph(me->text); break; case HTML_TITLE: HTChunkTerminate(&me->title); HTAnchor_setTitle(me->node_anchor, me->title.data); HTChunkClear(&me->title); /* * Check if it's a bookmark file, and if so, and multiple bookmark * support is on, or it's off but this isn't the default bookmark file * (e.g., because it was on before, and this is another bookmark file * that has been retrieved as a previous document), insert the current * description string and filepath for it. We pass the strings back to * the SGML parser so that any 8 bit or multibyte/CJK characters will * be handled by the parser's state and charset routines. - FM */ if (non_empty(me->node_anchor->bookmark)) { if ((LYMultiBookmarks != MBM_OFF) || (non_empty(bookmark_page) && strcmp(me->node_anchor->bookmark, bookmark_page))) { if (!include) include = &me->xinclude; for (i = 0; i <= MBM_V_MAXFILES; i++) { if (MBM_A_subbookmark[i] && !strcmp(MBM_A_subbookmark[i], me->node_anchor->bookmark)) { StrAllocCat(*include, "

"); StrAllocCat(*include, gettext("Description:")); StrAllocCat(*include, " "); StrAllocCopy(temp, ((MBM_A_subdescript[i] && *MBM_A_subdescript[i]) ? MBM_A_subdescript[i] : gettext("(none)"))); LYEntify(&temp, TRUE); StrAllocCat(*include, temp); StrAllocCat(*include, "
   "); StrAllocCat(*include, gettext("Filepath:")); StrAllocCat(*include, " "); StrAllocCopy(temp, ((MBM_A_subbookmark[i] && *MBM_A_subbookmark[i]) ? MBM_A_subbookmark[i] : gettext("(unknown)"))); LYEntify(&temp, TRUE); StrAllocCat(*include, temp); FREE(temp); StrAllocCat(*include, "

"); break; } } } } break; case HTML_STYLE: /* * We're getting it as Literal text, which, for now, we'll just ignore. * - FM */ HTChunkTerminate(&me->style_block); CTRACE2(TRACE_STYLE, (tfp, "HTML: STYLE content =\n%s\n", me->style_block.data)); HTChunkClear(&me->style_block); break; case HTML_SCRIPT: /* * We're getting it as Literal text, which, for now, we'll just ignore. * - FM */ HTChunkTerminate(&me->script); CTRACE((tfp, "HTML: SCRIPT content =\n%s\n", me->script.data)); HTChunkClear(&me->script); break; case HTML_BODY: if (me->inA || me->inSELECT || me->inTEXTAREA) { if (LYBadHTML(me)) { char *msg = NULL; HTSprintf0(&msg, "Bad HTML: %s%s%s%s%s not closed before BODY end tag *****\n", me->inSELECT ? "SELECT" : "", (me->inSELECT && me->inTEXTAREA) ? ", " : "", me->inTEXTAREA ? "TEXTAREA" : "", (((me->inSELECT || me->inTEXTAREA) && me->inA) ? ", " : ""), me->inA ? "A" : ""); LYShowBadHTML(msg); FREE(msg); } } break; case HTML_FRAMESET: change_paragraph_style(me, me->sp->style); /* Often won't really change */ break; case HTML_NOFRAMES: case HTML_IFRAME: LYEnsureDoubleSpace(me); LYResetParagraphAlignment(me); change_paragraph_style(me, me->sp->style); /* Often won't really change */ break; case HTML_BANNER: case HTML_MARQUEE: case HTML_BLOCKQUOTE: case HTML_BQ: case HTML_ADDRESS: /* * Set flag to know that style has ended. Fall through. i_prior_style = -1; */ change_paragraph_style(me, me->sp->style); UPDATE_STYLE; if (me->sp->tag_number == element_number) LYEnsureDoubleSpace(me); if (me->List_Nesting_Level >= 0) HText_NegateLineOne(me->text); break; case HTML_CENTER: case HTML_DIV: if (me->Division_Level >= 0) me->Division_Level--; if (me->Division_Level >= 0) { if (me->sp->style->alignment != me->DivisionAlignments[me->Division_Level]) { if (me->inP) LYEnsureSingleSpace(me); me->sp->style->alignment = me->DivisionAlignments[me->Division_Level]; } } change_paragraph_style(me, me->sp->style); if (me->style_change) { actually_set_style(me); if (me->List_Nesting_Level >= 0) HText_NegateLineOne(me->text); } else if (me->inP) LYEnsureSingleSpace(me); me->current_default_alignment = me->sp->style->alignment; break; case HTML_H1: /* header styles */ case HTML_H2: case HTML_H3: case HTML_H4: case HTML_H5: case HTML_H6: if (me->Division_Level >= 0) { me->sp->style->alignment = me->DivisionAlignments[me->Division_Level]; } else if (me->sp->style->id == ST_HeadingCenter || me->sp->style->id == ST_Heading1) { me->sp->style->alignment = HT_CENTER; } else if (me->sp->style->id == ST_HeadingRight) { me->sp->style->alignment = HT_RIGHT; } else { me->sp->style->alignment = HT_LEFT; } change_paragraph_style(me, me->sp->style); UPDATE_STYLE; if (styles[element_number]->font & HT_BOLD) { if (me->inBoldA == FALSE && me->inBoldH == TRUE) { HText_appendCharacter(me->text, LY_BOLD_END_CHAR); } me->inBoldH = FALSE; } if (me->List_Nesting_Level >= 0) HText_NegateLineOne(me->text); if (me->Underline_Level > 0 && me->inUnderline == FALSE) { HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); me->inUnderline = TRUE; } break; case HTML_P: LYHandlePlike(me, (const BOOL *) 0, (STRING2PTR) 0, include, 0, FALSE); break; case HTML_FONT: me->inFONT = FALSE; break; case HTML_B: /* Physical character highlighting */ case HTML_BLINK: case HTML_I: case HTML_U: case HTML_CITE: /* Logical character highlighting */ case HTML_EM: case HTML_STRONG: /* * Ignore any emphasis end tags if the Underline_Level is not set. - * FM */ if (me->Underline_Level <= 0) break; /* * Adjust the Underline level counter, and turn off underlining if * appropriate. - FM */ me->Underline_Level--; if (me->inUnderline && me->Underline_Level < 1) { HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); me->inUnderline = FALSE; CTRACE((tfp, "Ending underline\n")); } else { CTRACE((tfp, "Underline Level is %d\n", me->Underline_Level)); } break; case HTML_ABBR: /* Miscellaneous character containers */ case HTML_ACRONYM: case HTML_AU: case HTML_AUTHOR: case HTML_BIG: case HTML_CODE: case HTML_DFN: case HTML_KBD: case HTML_SAMP: case HTML_SMALL: case HTML_SUP: case HTML_TT: case HTML_VAR: break; case HTML_SUB: HText_appendCharacter(me->text, ']'); break; case HTML_DEL: case HTML_S: case HTML_STRIKE: HTML_put_character(me, ' '); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, ":DEL]"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; break; case HTML_INS: HTML_put_character(me, ' '); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); HTML_put_string(me, ":INS]"); if (me->inUnderline == FALSE) HText_appendCharacter(me->text, LY_UNDERLINE_END_CHAR); HTML_put_character(me, ' '); me->in_word = NO; break; case HTML_Q: if (me->Quote_Level > 0) me->Quote_Level--; /* * Should check LANG and/or DIR attributes, and the * me->node_anchor->charset and/or yet to be added structure elements, * to determine whether we should use chevrons, but for now we'll * always use double- or single-quotes. - FM */ if (!(me->Quote_Level & 1)) HTML_put_character(me, '"'); else HTML_put_character(me, '\''); break; case HTML_PRE: /* Formatted text */ /* * Set to know that we are no longer in a PRE block. */ HText_appendCharacter(me->text, '\n'); me->inPRE = FALSE; /* FALLTHRU */ case HTML_LISTING: /* Literal text */ /* FALLTHRU */ case HTML_XMP: /* FALLTHRU */ case HTML_PLAINTEXT: if (me->comment_start) HText_appendText(me->text, me->comment_start); change_paragraph_style(me, me->sp->style); /* Often won't really change */ if (me->List_Nesting_Level >= 0) { UPDATE_STYLE; HText_NegateLineOne(me->text); } break; case HTML_NOTE: case HTML_FN: change_paragraph_style(me, me->sp->style); /* Often won't really change */ UPDATE_STYLE; if (me->sp->tag_number == element_number) LYEnsureDoubleSpace(me); if (me->List_Nesting_Level >= 0) HText_NegateLineOne(me->text); me->inLABEL = FALSE; break; case HTML_OL: me->OL_Counter[me->List_Nesting_Level < 11 ? me->List_Nesting_Level : 11] = OL_VOID; /* FALLTHRU */ case HTML_DL: /* FALLTHRU */ case HTML_UL: /* FALLTHRU */ case HTML_MENU: /* FALLTHRU */ case HTML_DIR: me->List_Nesting_Level--; CTRACE((tfp, "HTML_end_element: Reducing List Nesting Level to %d\n", me->List_Nesting_Level)); #ifdef USE_JUSTIFY_ELTS if (element_number == HTML_DL) in_DT = FALSE; /*close the term that was without definition. */ #endif change_paragraph_style(me, me->sp->style); /* Often won't really change */ UPDATE_STYLE; if (me->List_Nesting_Level >= 0) LYEnsureSingleSpace(me); break; case HTML_SPAN: /* * Should undo anything we did based on LANG and/or DIR attributes, and * the me->node_anchor->charset and/or yet to be added structure * elements. - FM */ break; case HTML_BDO: /* * Should undo anything we did based on DIR (and/or LANG) attributes, * and the me->node_anchor->charset and/or yet to be added structure * elements. - FM */ break; case HTML_A: /* * Ignore any spurious A end tags. - FM */ if (me->inA == FALSE) break; /* * Set to know that we are no longer in an anchor. */ me->inA = FALSE; #ifdef MARK_HIDDEN_LINKS if (non_empty(hidden_link_marker) && HText_isAnchorBlank(me->text, me->CurrentANum)) { HText_appendText(me->text, hidden_link_marker); } #endif UPDATE_STYLE; if (me->inBoldA == TRUE && me->inBoldH == FALSE) HText_appendCharacter(me->text, LY_BOLD_END_CHAR); HText_endAnchor(me->text, me->CurrentANum); me->CurrentANum = 0; me->inBoldA = FALSE; if (me->Underline_Level > 0 && me->inUnderline == FALSE) { HText_appendCharacter(me->text, LY_UNDERLINE_START_CHAR); me->inUnderline = TRUE; } break; case HTML_MAP: FREE(me->map_address); break; case HTML_BODYTEXT: /* * We may need to look at this someday to deal with OBJECTs optimally, * but just ignore it for now. - FM */ change_paragraph_style(me, me->sp->style); /* Often won't really change */ break; case HTML_TEXTFLOW: /* * We may need to look at this someday to deal with APPLETs optimally, * but just ignore it for now. - FM */ change_paragraph_style(me, me->sp->style); /* Often won't really change */ break; case HTML_FIG: LYHandleFIG(me, NULL, NULL, 0, 0, NULL, NULL, NO, FALSE, &intern_flag); break; case HTML_OBJECT: /* * Finish the data off. */ { int s = 0, e = 0; char *start = NULL, *first_end = NULL, *last_end = NULL; char *first_map = NULL, *last_map = NULL; BOOL have_param = FALSE; char *data = NULL; HTChunkTerminate(&me->object); data = me->object.data; while ((cp = StrChr(data, '<')) != NULL) { /* * Look for nested OBJECTs. This procedure could get tripped * up if invalid comments are present in the content, or if an * OBJECT end tag is present in a quoted attribute. - FM */ if (!StrNCmp(cp, "