#include <HTUtils.h>
#include <HTTP.h>
#include <HTAnchor.h> /* Anchor class */
#include <HTAccess.h>
#include <HTParse.h>
#include <LYCurses.h>
#include <GridText.h>
#include <LYGlobalDefs.h>
#include <LYUtils.h>
#include <LYCharSets.h>
#include <LYCharUtils.h>
#include <HTAlert.h>
#include <LYSignal.h>
#include <LYGetFile.h>
#include <LYPrint.h>
#include <LYOptions.h>
#include <LYHistory.h>
#include <LYStrings.h>
#include <LYClean.h>
#include <LYDownload.h>
#include <LYNews.h>
#include <LYMail.h>
#include <LYKeymap.h>
#include <LYBookmark.h>
#include <LYMap.h>
#include <LYList.h>
#ifdef DIRED_SUPPORT
#include <LYLocal.h>
#endif /* DIRED_SUPPORT */
#include <LYReadCFG.h>
#include <LYexit.h>
#include <LYLeaks.h>
#ifndef VMS
#ifdef SYSLOG_REQUESTED_URLS
#include <syslog.h>
#endif /* SYSLOG_REQUESTED_URLS */
#endif /* !VMS */
PRIVATE int fix_httplike_urls PARAMS((document *doc, UrlTypes type));
extern char * WWW_Download_File;
#ifdef VMS
extern BOOLEAN LYDidRename;
#endif /* VMS */
#ifdef VMS
#define STRNADDRCOMP strncasecomp
#else
#define STRNADDRCOMP strncmp
#endif /* !VMS */
PUBLIC int HTNoDataOK = 0;
/*
* getfile is the main mechanism to load a new document (or a previously
* laoded one whose rendering is cached in a HText structure) from
* mainloop, nearly everything goes through it.
* It should return one of the values
* NORMAL - requested document loaded successfully, usually [always?]
* its rendering is available as HTMainText. It can be an
* HTTP error message page or similar, we make no
* distinction here.
* NOT_FOUND - requested document cannot be accessed, and the reason
* is a real error (as may be caused by an invalid link),
* not just that lynx disallows access because of some
* permission restrictions, and we have no error page
* to show for it either.
* NULLFILE - requested document not loaded into HTMainText, either
* some interactive protocol was requested (like telnet),
* or lynx does not allow access,
* The distinction between NOT_FOUND and NULLFILE is not very crucial,
* but getting it right prevents mainloop from exiting with the wrong
* message if it happens for the first file, and from logging (or not
* logging) errors inappropriately with -traversal, and from sending
* bogus error mail with MAIL_SYSTEM_ERROR_LOGGING:TRUE. - kw
*/
PUBLIC BOOLEAN getfile ARGS1(
document *, doc)
{
int url_type = 0;
char *cp = NULL;
char *temp = NULL;
DocAddress WWWDoc; /* a WWW absolute doc address struct */
/*
* Reset LYCancelDownload to prevent unwanted delayed effect. - KW
*/
if (LYCancelDownload) {
CTRACE(tfp, "getfile: resetting LYCancelDownload to FALSE\n");
LYCancelDownload = FALSE;
}
/*
* Reset fake 'Z' to prevent unwanted delayed effect. - kw
*/
LYFakeZap(NO);
/*
* Reset redirection counter to prevent bogus TOO_MANY_REDIRECTIONS
* in rare situations if the previous cycle got to the limit, but
* did not fail for that reason because the URL of the final location
* was handled specially, not via HTLoadAbsolute. - kw
*/
redirection_attempts = 0;
Try_Redirected_URL:
/*
* Load the WWWDoc struct in case we need to use it.
*/
WWWDoc.address = doc->address;
WWWDoc.post_data = doc->post_data;
WWWDoc.post_content_type = doc->post_content_type;
WWWDoc.bookmark = doc->bookmark;
WWWDoc.isHEAD = doc->isHEAD;
WWWDoc.safe = doc->safe;
/*
* Reset HTPermitRedir, it has done its job if it was set. - kw
*/
HTPermitRedir = FALSE;
/*
* Reset WWW_Download_File just in case.
*/
FREE(WWW_Download_File);
/*
* Reset redirect_post_content just in case.
*/
redirect_post_content = FALSE;
/*
* This flag is a hack to allow us to pass on the fact
* that 'no data' may not really be an error although
* HTLoadAbsolute returned NO. There should be a better
* way... HT_NO_DATA should always mean 'not data but
* not an error', and be passed on to us as that, but
* current usage if HT_NO_DATA vs HT_NOT_LOADED has
* to be reviewed everywhere.
* Anyway, some protocol module can set it to say
* 'I really mean it', we have to reset it here. - kw
*/
HTNoDataOK = 0;
CTRACE(tfp,"getfile: getting %s\n\n",doc->address);
/*
* Protect against denial of service attacks
* via the port 19 CHARGEN service, and block
* connections to the port 25 ESMTP service.
* Also reject any likely spoof attempts via
* wrap arounds at 65536. - FM
*/
if ((temp = HTParse(doc->address, "", PARSE_HOST)) != NULL &&
strlen(temp) > 3) {
char *cp1;
if ((cp1 = strchr(temp, '@')) == NULL)
cp1 = temp;
if ((cp = strrchr(cp1, ':')) != NULL) {
long int value;
cp++;
if (sscanf(cp, "%ld", &value) == 1) {
if (value == 19 || value == 65555) {
HTAlert(PORT_NINETEEN_INVALID);
FREE(temp);
return(NULLFILE);
}
if (value == 25 || value == 65561) {
HTAlert(PORT_TWENTYFIVE_INVALID);
FREE(temp);
return(NULLFILE);
}
if (value > 65535 || value < 0) {
char *msg = 0;
HTSprintf0(&msg, PORT_INVALID, (unsigned long)value);
HTAlert(msg);
FREE(msg);
FREE(temp);
return(NULLFILE);
}
} else if (isdigit((unsigned char)*cp)) {
HTAlert(URL_PORT_BAD);
FREE(temp);
return(NULLFILE);
}
}
}
cp = NULL;
FREE(temp);
/*
* Check to see if this is a universal document ID
* that lib WWW wants to handle.
*
* Some special URL's we handle ourselves. :)
*/
if ((url_type = is_url(doc->address)) != 0) {
if (LYValidate && !LYPermitURL) {
if (!(url_type == HTTP_URL_TYPE ||
url_type == HTTPS_URL_TYPE ||
url_type == LYNXHIST_URL_TYPE ||
url_type == LYNXKEYMAP_URL_TYPE ||
url_type == LYNXIMGMAP_URL_TYPE ||
url_type == LYNXCOOKIE_URL_TYPE ||
url_type == LYNXMESSAGES_URL_TYPE ||
(url_type == LYNXOPTIONS_URL_TYPE &&
WWWDoc.post_data) ||
0==STRNADDRCOMP(WWWDoc.address, helpfilepath,
strlen(helpfilepath)) ||
(lynxlistfile != NULL &&
0==STRNADDRCOMP(WWWDoc.address, lynxlistfile,
strlen(lynxlistfile))) ||
(lynxlinksfile != NULL &&
0==STRNADDRCOMP(WWWDoc.address, lynxlinksfile,
strlen(lynxlinksfile))) ||
(lynxjumpfile != NULL &&
0==STRNADDRCOMP(WWWDoc.address, lynxjumpfile,
strlen(lynxjumpfile))))) {
HTUserMsg(NOT_HTTP_URL_OR_ACTION);
return(NULLFILE);
}
}
if (traversal) {
/*
* Only traverse http URLs.
*/
if (url_type != HTTP_URL_TYPE &&
url_type != LYNXIMGMAP_URL_TYPE)
return(NULLFILE);
} else if (check_realm && !LYPermitURL && !LYJumpFileURL) {
if (!(0==strncmp(startrealm, WWWDoc.address,
strlen(startrealm)) ||
url_type == LYNXHIST_URL_TYPE ||
url_type == LYNXKEYMAP_URL_TYPE ||
url_type == LYNXIMGMAP_URL_TYPE ||
url_type == LYNXCOOKIE_URL_TYPE ||
url_type == LYNXPRINT_URL_TYPE ||
url_type == LYNXOPTIONS_URL_TYPE ||
url_type == LYNXCFG_URL_TYPE ||
url_type == LYNXCOMPILE_OPTS_URL_TYPE ||
url_type == LYNXMESSAGES_URL_TYPE ||
url_type == LYNXDOWNLOAD_URL_TYPE ||
url_type == MAILTO_URL_TYPE ||
url_type == NEWSPOST_URL_TYPE ||
url_type == NEWSREPLY_URL_TYPE ||
url_type == SNEWSPOST_URL_TYPE ||
url_type == SNEWSREPLY_URL_TYPE ||
(!LYUserSpecifiedURL &&
(url_type == LYNXEXEC_URL_TYPE ||
url_type == LYNXPROG_URL_TYPE ||
url_type == LYNXCGI_URL_TYPE)) ||
(WWWDoc.bookmark != NULL &&
*WWWDoc.bookmark != '\0') ||
0==STRNADDRCOMP(WWWDoc.address, helpfilepath,
strlen(helpfilepath)) ||
(lynxlistfile != NULL &&
0==STRNADDRCOMP(WWWDoc.address, lynxlistfile,
strlen(lynxlistfile))) ||
(lynxjumpfile != NULL &&
0==STRNADDRCOMP(WWWDoc.address, lynxjumpfile,
strlen(lynxjumpfile))))) {
HTUserMsg(NOT_IN_STARTING_REALM);
return(NULLFILE);
}
}
if (WWWDoc.post_data &&
url_type != HTTP_URL_TYPE &&
url_type != HTTPS_URL_TYPE &&
url_type != LYNXCGI_URL_TYPE &&
url_type != LYNXIMGMAP_URL_TYPE &&
url_type != GOPHER_URL_TYPE &&
url_type != CSO_URL_TYPE &&
url_type != PROXY_URL_TYPE &&
url_type != LYNXOPTIONS_URL_TYPE &&
!(url_type == FILE_URL_TYPE &&
*(LYlist_temp_url()) &&
!strncmp(WWWDoc.address, LYlist_temp_url(),
strlen(LYlist_temp_url())))) {
CTRACE(tfp, "getfile: dropping post_data!\n");
HTAlert(IGNORED_POST);
FREE(doc->post_data);
FREE(doc->post_content_type);
WWWDoc.post_data = NULL;
WWWDoc.post_content_type = NULL;
}
#ifndef VMS
#ifdef SYSLOG_REQUESTED_URLS
syslog(LOG_INFO|LOG_LOCAL5, "%s", doc->address);
#endif /* SYSLOG_REQUESTED_URLS */
#endif /* !VMS */
if (url_type == UNKNOWN_URL_TYPE ||
url_type == AFS_URL_TYPE ||
url_type == PROSPERO_URL_TYPE) {
HTAlert(UNSUPPORTED_URL_SCHEME);
return(NULLFILE);
} else if (url_type == DATA_URL_TYPE) {
HTAlert(UNSUPPORTED_DATA_URL);
return(NULLFILE);
} else if (url_type == LYNXPRINT_URL_TYPE) {
return(printfile(doc));
#ifndef NO_OPTION_FORMS
} else if (url_type == LYNXOPTIONS_URL_TYPE) {
/* proceed forms-based options menu */
return(postoptions(doc));
#endif
} else if (url_type == LYNXCFG_URL_TYPE &&
!no_lynxcfg_info) {
/* @@@ maybe we should generate a specific error message
if attempted but restricted. - kw */
/* show/change/reload lynx.cfg settings */
return(lynx_cfg_infopage(doc));
#if defined(HAVE_CONFIG_H) && !defined(NO_CONFIG_INFO)
} else if (url_type == LYNXCOMPILE_OPTS_URL_TYPE &&
!no_compileopts_info) {
/* @@@ maybe we should generate a specific error message
if attempted but restricted or not supported. - kw */
/* show compile-time settings */
return(lynx_compile_opts(doc));
#endif
#ifndef DISABLE_NEWS
} else if (url_type == NEWSPOST_URL_TYPE ||
url_type == NEWSREPLY_URL_TYPE ||
url_type == SNEWSPOST_URL_TYPE ||
url_type == SNEWSREPLY_URL_TYPE) {
if (no_newspost) {
HTUserMsg(NEWSPOSTING_DISABLED);
return(NULLFILE);
} else if (!news_ok && (
url_type == NEWSPOST_URL_TYPE ||
url_type == NEWSREPLY_URL_TYPE)) {
HTUserMsg(NEWS_DISABLED);
return(NULLFILE);
} else {
HTLoadAbsolute(&WWWDoc);
return(NULLFILE);
}
#endif
} else if (url_type == LYNXDOWNLOAD_URL_TYPE) {
LYDownload(doc->address);
#ifdef VMS
if (LYDidRename) {
/*
* The temporary file was saved to disk via a
* rename(), so we can't access the temporary
* file again via the download menu. Clear the
* flag, and return NULLFILE to pop. - FM
*/
LYDidRename = FALSE;
return(NULLFILE);
} else {
return(NORMAL);
}
#else
return(NORMAL);
#endif /* VMS */
} else if (url_type == LYNXDIRED_URL_TYPE) {
#ifdef DIRED_SUPPORT
if (no_dired_support) {
HTUserMsg(DIRED_DISABLED);
return(NULLFILE);
} else {
local_dired(doc);
WWWDoc.address = doc->address;
WWWDoc.post_data = doc->post_data;
WWWDoc.post_content_type = doc->post_content_type;
WWWDoc.bookmark = doc->bookmark;
WWWDoc.isHEAD = doc->isHEAD;
WWWDoc.safe = doc->safe;
if (!HTLoadAbsolute(&WWWDoc))
return(NOT_FOUND);
return(NORMAL);
}
#else
HTUserMsg(DIRED_DISABLED);
return(NULLFILE);
#endif /* DIRED_SUPPORT */
}
if (LYNoRefererHeader == FALSE &&
LYNoRefererForThis == FALSE) {
if (no_filereferer == TRUE &&
!strncmp(HTLoadedDocumentURL(), "file:", 5)) {
LYNoRefererForThis = TRUE;
}
if (LYNoRefererForThis == FALSE &&
(cp = strchr(HTLoadedDocumentURL(), '?')) != NULL &&
strchr(cp, '=') != NULL) {
/*
* Don't send a Referer header if the URL is
* the reply from a form with method GET, in
* case the content has personal data (e.g.,
* a password or credit card number) which
* would become visible in logs. - FM
*/
LYNoRefererForThis = TRUE;
cp = NULL;
}
}
if (url_type == LYNXHIST_URL_TYPE) {
/*
* 'doc' will change to the new file
* if we had a successful LYpop_num(),
* and the return value will be FALSE
* if we had a cancel. - FM
*/
if ((historytarget(doc) == FALSE) ||
!doc || !doc->address) {
return(NOT_FOUND);
}
/*
* We changed it so reload.
*/
WWWDoc.address = doc->address;
WWWDoc.post_data = doc->post_data;
WWWDoc.post_content_type = doc->post_content_type;
WWWDoc.bookmark = doc->bookmark;
WWWDoc.isHEAD = doc->isHEAD;
WWWDoc.safe = doc->safe;
#ifndef DONT_TRACK_INTERNAL_LINKS
if (doc->internal_link && !reloading) {
LYinternal_flag = TRUE;
}
#endif
if (!HTLoadAbsolute(&WWWDoc)) {
return(NOT_FOUND);
}
return(NORMAL);
} else if (url_type == LYNXEXEC_URL_TYPE ||
url_type == LYNXPROG_URL_TYPE) {
#ifdef EXEC_LINKS
if (no_exec &&
!exec_ok(HTLoadedDocumentURL(),
doc->address+9, ALWAYS_EXEC_PATH)) {
HTUserMsg(EXECUTION_DISABLED);
} else if (no_bookmark_exec &&
HTLoadedDocumentBookmark()) {
HTUserMsg(BOOKMARK_EXEC_DISABLED);
} else if (local_exec || (local_exec_on_local_files &&
exec_ok(HTLoadedDocumentURL(),
doc->address+9, EXEC_PATH))) {
char *p, addressbuf[1024];
/*
* Bug puts slash on end if none is in the string.
*/
char *last_slash = strrchr(doc->address,'/');
if (last_slash - doc->address
== (int)strlen(doc->address) - 1)
doc->address[strlen(doc->address)-1] = '\0';
p = doc->address;
/*
* Convert '~' to $HOME.
*/
if ((cp = strchr(doc->address, '~'))) {
strncpy(addressbuf, doc->address, cp-doc->address);
addressbuf[cp - doc->address] = '\0';
p = wwwName(Home_Dir());
strcat(addressbuf, p);
strcat(addressbuf, cp+1);
p = addressbuf;
}
/*
* Show URL before executing it.
*/
HTInfoMsg(doc->address);
stop_curses();
/*
* Run the command.
*/
if (strstr(p,"//") == p+9)
LYSystem(p+11);
else
LYSystem(p+9);
if (url_type != LYNXPROG_URL_TYPE) {
/*
* Make sure user gets to see screen output.
*/
#ifndef VMS
signal(SIGINT, SIG_IGN);
#endif /* !VMS */
printf("\n%s", RETURN_TO_LYNX);
fflush(stdout);
LYgetch();
#ifdef VMS
HadVMSInterrupt = FALSE;
#endif /* VMS */
}
if (!dump_output_immediately) {
start_curses();
LYAddVisitedLink(doc);
}
} else {
char *buf = 0;
HTSprintf0(&buf,
EXECUTION_DISABLED_FOR_FILE,
key_for_func(LYK_OPTIONS));
HTAlert(buf);
FREE(buf);
}
#else /* no exec_links */
HTUserMsg(EXECUTION_NOT_COMPILED);
#endif /* EXEC_LINKS */
return(NULLFILE);
} else if (url_type == MAILTO_URL_TYPE) {
if (no_mail) {
HTUserMsg(MAIL_DISABLED);
} else {
HTParentAnchor *tmpanchor;
CONST char *title;
char *tmptitle = NULL;
title = "";
if ((tmpanchor = HTAnchor_parent(
HTAnchor_findAddress(&WWWDoc)
)) != NULL &&
HTAnchor_title(tmpanchor)) {
title = HTAnchor_title(tmpanchor);
} else if (HTMainAnchor && !LYUserSpecifiedURL) {
title = HTAnchor_subject(HTMainAnchor);
if (title && *title) {
if (strncasecomp(title, "Re:", 3)) {
StrAllocCopy(tmptitle, "Re: ");
StrAllocCat(tmptitle, title);
title = tmptitle;
}
} else {
title = "";
}
}
cp = (char *)strchr(doc->address,':')+1;
reply_by_mail(cp,
((HTMainAnchor && !LYUserSpecifiedURL) ?
(char *)HTMainAnchor->address :
(char *)doc->address),
title,
(HTMainAnchor && !LYUserSpecifiedURL) ?
HTMainAnchor->message_id : NULL);
FREE(tmptitle);
}
return(NULLFILE);
/*
* From here on we could have a remote host,
* so check if that's allowed.
*/
} else if (local_host_only &&
url_type != LYNXKEYMAP_URL_TYPE &&
url_type != LYNXIMGMAP_URL_TYPE &&
url_type != LYNXCOOKIE_URL_TYPE &&
url_type != LYNXMESSAGES_URL_TYPE &&
url_type != LYNXCGI_URL_TYPE &&
!(url_type == NEWS_URL_TYPE &&
strncmp(doc->address, "news://", 7)) &&
!(LYisLocalHost(doc->address) ||
LYisLocalAlias(doc->address))) {
HTUserMsg(ACCESS_ONLY_LOCALHOST);
return(NULLFILE);
/*
* Disable www telnet access if not telnet_ok.
*/
} else if (url_type == TELNET_URL_TYPE ||
url_type == TN3270_URL_TYPE ||
url_type == TELNET_GOPHER_URL_TYPE) {
char * proxy;
if (!telnet_ok) {
HTUserMsg(TELNET_DISABLED);
return(NULLFILE);
} else if (no_telnet_port && strchr(doc->address+7, ':')) {
HTUserMsg(TELNET_PORT_SPECS_DISABLED);
return(NULLFILE);
/*
* Detect weird case where interactive protocol would
* be proxied, and to a non-interactive protocol at that.
*/
} else if ((proxy = (char *)getenv(
(url_type==TN3270_URL_TYPE) ? "tn3270_proxy" :
(url_type==TELNET_GOPHER_URL_TYPE) ? "gopher_proxy" :
"telnet_proxy")) != NULL &&
*proxy != '\0' &&
!override_proxy(doc->address) &&
(strncmp(proxy, "telnet:", 7) &&
strncmp(proxy, "tn3270:", 7) &&
strncmp(proxy, "rlogin:", 7))) {
/* Do nothing, fall through to generic code - kw */
} else {
stop_curses();
HTLoadAbsolute(&WWWDoc);
if (!dump_output_immediately) {
start_curses();
fflush(stdout);
LYAddVisitedLink(doc);
}
return(NULLFILE);
}
/*
* Disable www news access if not news_ok.
*/
#ifndef DISABLE_NEWS
} else if (!news_ok && (
url_type == NEWS_URL_TYPE ||
url_type == NNTP_URL_TYPE)) {
HTUserMsg(NEWS_DISABLED);
return(NULLFILE);
#endif
} else if (url_type == RLOGIN_URL_TYPE) {
char * proxy;
if (!rlogin_ok) {
HTUserMsg(RLOGIN_DISABLED);
return(NULLFILE);
/*
* Detect weird case where interactive protocol would
* be proxied, and to a non-interactive protocol at that.
*/
} else if ((proxy = (char *)getenv(
"rlogin_proxy")) != NULL &&
*proxy != '\0' &&
!override_proxy(doc->address) &&
(strncmp(proxy, "telnet:", 7) &&
strncmp(proxy, "tn3270:", 7) &&
strncmp(proxy, "rlogin:", 7))) {
/* Do nothing, fall through to generic code - kw */
} else {
stop_curses();
HTLoadAbsolute(&WWWDoc);
fflush(stdout);
if (!dump_output_immediately) {
start_curses();
LYAddVisitedLink(doc);
}
return(NULLFILE);
}
/*
* If its a gopher index type and there isn't a search
* term already attached then do this. Otherwise
* just load it!
*/
} else if (url_type == INDEX_GOPHER_URL_TYPE &&
strchr(doc->address,'?') == NULL) {
int status;
/*
* Make sure we don't have a gopher+ escaped tab
* instead of a gopher0 question mark delimiting
* the search term. - FM
*/
if ((cp = strstr(doc->address, "%09")) != NULL) {
*cp = '\0';
StrAllocCopy(temp, doc->address);
cp += 3;
if (*cp && strncmp(cp, "%09", 3)) {
StrAllocCat(temp, "?");
StrAllocCat(temp, cp);
if ((cp = strstr(temp, "%09")) != NULL) {
*cp = '\0';
}
}
StrAllocCopy(doc->address, temp);
FREE(temp);
goto Try_Redirected_URL;
}
/*
* Load it because the do_www_search routine
* uses the base url of the currently loaded
* document :(
*/
if (!HTLoadAbsolute(&WWWDoc))
return(NOT_FOUND);
status = do_www_search(doc);
if (status == NULLFILE) {
LYpop(doc);
WWWDoc.address = doc->address;
WWWDoc.post_data = doc->post_data;
WWWDoc.post_content_type = doc->post_content_type;
WWWDoc.bookmark = doc->bookmark;
WWWDoc.isHEAD = doc->isHEAD;
WWWDoc.safe = doc->safe;
status = HTLoadAbsolute(&WWWDoc);
}
return(status);
}
{
if (url_type == FTP_URL_TYPE && !ftp_ok) {
HTUserMsg(FTP_DISABLED);
return(NULLFILE);
}
if (url_type == HTML_GOPHER_URL_TYPE) {
char *tmp=NULL;
/*
* If tuple's Path=GET%20/... convert to an http URL.
*/
if ((cp=strchr(doc->address+9, '/')) != NULL &&
0==strncmp(++cp, "hGET%20/", 8)) {
StrAllocCopy(tmp, "http://");
CTRACE(tfp, "getfile: URL '%s'\n",
doc->address);
*cp = '\0';
StrAllocCat(tmp, doc->address+9);
/*
* If the port is defaulted, it should stay 70.
*/
if (strchr(tmp+6, ':') == NULL) {
StrAllocCat(tmp, "70/");
tmp[strlen(tmp)-4] = ':';
}
if (strlen(cp+7) > 1)
StrAllocCat(tmp, cp+8);
StrAllocCopy(doc->address, tmp);
CTRACE(tfp, " changed to '%s'\n",
doc->address);
FREE(tmp);
url_type = HTTP_URL_TYPE;
}
}
if (url_type == HTTP_URL_TYPE ||
url_type == HTTPS_URL_TYPE ||
url_type == FTP_URL_TYPE ||
url_type == CSO_URL_TYPE)
fix_httplike_urls(doc, url_type);
WWWDoc.address = doc->address; /* possible reload */
#ifdef DIRED_SUPPORT
lynx_edit_mode = FALSE;
#endif /* DIRED_SUPPORT */
if (url_type == FILE_URL_TYPE) {
/*
* If a file URL has a '~' as the lead character
* of its first symbolic element, convert the '~'
* to Home_Dir(), then append the rest of of path,
* if present, skipping "user" if "~user" was
* entered, simplifying, and eliminating any
* residual relative elements. - FM
*/
if (((cp = HTParse(doc->address, "",
PARSE_PATH+PARSE_ANCHOR+PARSE_PUNCTUATION))
!= NULL) &&
!strncmp(cp, "/~", 2)) {
char *cp1 = strstr(doc->address, "/~");
char *cp2;
CTRACE(tfp, "getfile: URL '%s'\n",
doc->address);
*cp1 = '\0';
cp1 += 2;
StrAllocCopy(temp, doc->address);
StrAllocCopy(cp, wwwName(Home_Dir()));
if (!LYIsHtmlSep(*cp))
LYAddHtmlSep(&temp);
StrAllocCat(temp, cp);
if ((cp2 = strchr(cp1, '/')) != NULL) {
LYTrimRelFromAbsPath(cp2);
StrAllocCat(temp, cp2);
}
StrAllocCopy(doc->address, temp);
FREE(temp);
CTRACE(tfp, " changed to '%s'\n",
doc->address);
WWWDoc.address = doc->address;
}
FREE(cp);
}
if (url_type == LYNXMESSAGES_URL_TYPE) {
int rv;
/* show list of recent statusline messages */
if ((rv = LYshow_statusline_messages(doc)) != NORMAL) {
return rv;
}
WWWDoc.address = doc->address;
WWWDoc.post_data = doc->post_data;
WWWDoc.post_content_type = doc->post_content_type;
WWWDoc.bookmark = doc->bookmark;
WWWDoc.isHEAD = doc->isHEAD;
WWWDoc.safe = doc->safe;
} else {
CTRACE_SLEEP(MessageSecs);
user_message(WWW_WAIT_MESSAGE, doc->address);
}
if (TRACE) {
#ifdef USE_SLANG
if (LYCursesON) {
addstr("*\n");
refresh();
}
#endif /* USE_SLANG */
fprintf(tfp,"\n");
}
if (!HTLoadAbsolute(&WWWDoc)) {
/*
* Check for redirection.
*/
if (use_this_url_instead != NULL) {
char *pound;
if (!is_url(use_this_url_instead)) {
/*
* The server did not return a complete
* URL in its Location: header, probably
* due to a FORM or other CGI script written
* by someone who doesn't know that the http
* protocol requires that it be a complete
* URL, or using a server which does not treat
* such a redirect string from the script as
* an instruction to resolve it versus the
* initial request, check authentication with
* that URL, and then act on it without
* returning redirection to us. We'll
* violate the http protocol and resolve it
* ourselves using the URL of the original
* request as the BASE, rather than doing
* the RIGHT thing and returning an invalid
* address message. - FM
*/
HTUserMsg(LOCATION_NOT_ABSOLUTE);
temp = HTParse(use_this_url_instead,
WWWDoc.address,
PARSE_ALL);
if (temp && *temp) {
StrAllocCopy(use_this_url_instead, temp);
}
FREE(temp);
}
url_type = is_url(use_this_url_instead);
if (!HTPermitRedir &&
(url_type == LYNXDOWNLOAD_URL_TYPE ||
url_type == LYNXEXEC_URL_TYPE ||
url_type == LYNXPROG_URL_TYPE ||
#ifdef DIRED_SUPPORT
url_type == LYNXDIRED_URL_TYPE ||
#endif /* DIRED_SUPPORT */
url_type == LYNXPRINT_URL_TYPE ||
url_type == LYNXOPTIONS_URL_TYPE ||
url_type == LYNXCFG_URL_TYPE ||
url_type == LYNXCOMPILE_OPTS_URL_TYPE ||
url_type == LYNXHIST_URL_TYPE ||
url_type == LYNXCOOKIE_URL_TYPE ||
(LYValidate &&
url_type != HTTP_URL_TYPE &&
url_type != HTTPS_URL_TYPE) ||
((no_file_url || no_goto_file) &&
url_type == FILE_URL_TYPE) ||
(no_goto_lynxcgi &&
url_type == LYNXCGI_URL_TYPE) ||
(no_goto_cso &&
url_type == CSO_URL_TYPE) ||
(no_goto_finger &&
url_type == FINGER_URL_TYPE) ||
(no_goto_ftp &&
url_type == FTP_URL_TYPE) ||
(no_goto_gopher &&
url_type == GOPHER_URL_TYPE) ||
(no_goto_http &&
url_type == HTTP_URL_TYPE) ||
(no_goto_https &&
url_type == HTTPS_URL_TYPE) ||
(no_goto_mailto &&
url_type == MAILTO_URL_TYPE) ||
#ifndef DISABLE_NEWS
(no_goto_news &&
url_type == NEWS_URL_TYPE) ||
(no_goto_nntp &&
url_type == NNTP_URL_TYPE) ||
#endif
(no_goto_rlogin &&
url_type == RLOGIN_URL_TYPE) ||
#ifndef DISABLE_NEWS
(no_goto_snews &&
url_type == SNEWS_URL_TYPE) ||
#endif
(no_goto_telnet &&
url_type == TELNET_URL_TYPE) ||
(no_goto_tn3270 &&
url_type == TN3270_URL_TYPE) ||
(no_goto_wais &&
url_type == WAIS_URL_TYPE))) {
/*
* Some schemes are not acceptable from
* server redirections. - KW & FM
*/
HTAlert(ILLEGAL_REDIRECTION_URL);
if (LYCursesON) {
_user_message(WWW_ILLEGAL_URL_MESSAGE,
use_this_url_instead);
sleep(AlertSecs);
} else {
fprintf(stderr,
WWW_ILLEGAL_URL_MESSAGE,
use_this_url_instead);
}
FREE(use_this_url_instead);
return(NULLFILE);
}
if ((pound = strchr(doc->address, '#')) != NULL &&
strchr(use_this_url_instead, '#') == NULL) {
/*
* Our requested URL had a fragment
* associated with it, and the redirection
* URL doesn't, so we'll append the fragment
* associated with the original request. If
* it's bogus for the redirection URL, we'll
* be positioned at the top of that document,
* so there's no harm done. - FM
*/
CTRACE(tfp,
"getfile: Adding fragment '%s' to redirection URL.\n",
pound);
StrAllocCat(use_this_url_instead, pound);
}
CTRACE_SLEEP(MessageSecs);
_user_message(WWW_USING_MESSAGE,
use_this_url_instead);
sleep(InfoSecs);
CTRACE(tfp, "\n");
StrAllocCopy(doc->address,
use_this_url_instead);
FREE(use_this_url_instead);
if (redirect_post_content == FALSE) {
/*
* Freeing the content also yields
* a GET request. - FM
*/
FREE(doc->post_data);
FREE(doc->post_content_type);
}
/*
* Go to top to check for URL's which get
* special handling and/or security checks
* in Lynx. - FM
*/
goto Try_Redirected_URL;
}
if (HTNoDataOK)
return(NULLFILE);
return(NOT_FOUND);
}
lynx_mode = NORMAL_LYNX_MODE;
/*
* Some URL's don't actually return a document;
* compare doc->address with the document that is
* actually loaded and return NULLFILE if not
* loaded. If www_search_result is not -1
* then this is a reference to a named anchor
* within the same document; do NOT return
* NULLFILE in that case.
*/
{
char *pound;
/*
* Check for a #fragment selector.
*/
pound = (char *)strchr(doc->address, '#');
/*
* Check to see if there is a temp
* file waiting for us to download.
*/
if (WWW_Download_File) {
HTParentAnchor *tmpanchor;
char *fname = NULL;
/*
* Check for a suggested filename from
* the Content-Disposition header. - FM
*/
if (((tmpanchor = HTAnchor_parent(
HTAnchor_findAddress(&WWWDoc)
)) != NULL) &&
HTAnchor_SugFname(tmpanchor) != NULL) {
StrAllocCopy(fname,
HTAnchor_SugFname(tmpanchor));
} else {
StrAllocCopy(fname, doc->address);
}
/*
* Check whether this is a compressed file,
* which we don't uncompress for downloads,
* and adjust any suffix appropriately. - FM
*/
if (tmpanchor != NULL) {
HTCheckFnameForCompression(&fname, tmpanchor,
FALSE);
}
if (LYdownload_options(&fname,
WWW_Download_File) < 0) {
FREE(fname);
return(NOT_FOUND);
}
LYAddVisitedLink(doc);
StrAllocCopy(doc->address, fname);
FREE(fname);
doc->internal_link = FALSE;
WWWDoc.address = doc->address;
FREE(doc->post_data);
WWWDoc.post_data = NULL;
FREE(doc->post_content_type);
WWWDoc.post_content_type = NULL;
WWWDoc.bookmark = doc->bookmark = FALSE;
WWWDoc.isHEAD = doc->isHEAD = FALSE;
WWWDoc.safe = doc->safe = FALSE;
HTOutputFormat = WWW_PRESENT;
if (!HTLoadAbsolute(&WWWDoc))
return(NOT_FOUND);
else
return(NORMAL);
} else if (pound == NULL &&
/*
* HTAnchor hash-table searches are now
* case-sensitive (hopefully, without
* anchor deletion problems), so this
* is too. - FM
*/
(strcmp(doc->address,
HTLoadedDocumentURL()) ||
/*
* Also check the post_data elements. - FM
*/
strcmp((doc->post_data ?
doc->post_data : ""),
HTLoadedDocumentPost_data()) ||
/*
* Also check the isHEAD element. - FM
*/
doc->isHEAD != HTLoadedDocumentIsHEAD())) {
/*
* Nothing needed to be shown.
*/
LYAddVisitedLink(doc);
return(NULLFILE);
} else {
/*
* May set www_search_result.
*/
if (pound != NULL)
HTFindPoundSelector(pound+1);
return(NORMAL);
}
}
}
} else {
CTRACE_SLEEP(MessageSecs);
HTUserMsg2(WWW_BAD_ADDR_MESSAGE, doc->address);
CTRACE(tfp,"\n");
return(NULLFILE);
}
}
/*
* The user wants to select a link or page by number.
* If follow_link_number returns DO_LINK_STUFF do_link
* will be run immediately following its execution.
* If follow_link_number returns DO_GOTOLINK_STUFF
* it has updated the passed in doc for positioning on a link.
* If follow_link_number returns DO_GOTOPAGE_STUFF
* it has set doc->line to the top line of the desired page
* for displaying that page.
* If follow_link_number returns PRINT_ERROR an error message
* will be given to the user.
* If follow_link_number returns DO_FORMS_STUFF some forms stuff
* will be done. (Not yet implemented.)
* If follow_link_number returns DO_NOTHING nothing special
* will run after it.
*/
PUBLIC int follow_link_number ARGS4(
int, c,
int, cur,
document *, doc,
int *, num)
{
char temp[120];
char *p = temp;
int rel = 0;
int new_top, new_link;
BOOL want_go;
int curline = *num; /* passed in from mainloop() */
CTRACE(tfp,"follow_link_number(%d,%d,...)\n",c,cur);
temp[0] = c;
temp[1] = '\0';
*num = -1;
_statusline(FOLLOW_LINK_NUMBER);
/*
* Get the number, possibly with a letter suffix, from the user.
*/
if (LYgetstr(temp, VISIBLE, sizeof(temp), NORECALL) < 0 || *temp == 0) {
HTInfoMsg(CANCELLED);
return(DO_NOTHING);
}
*num = atoi(p);
while ( isdigit(*p) )
++p;
c = *p; /* reuse c; 0 or g or p or + or - */
switch ( c ) {
case '+': case '-':
/* 123+ or 123- */
rel = c; c = *++p;
break;
default:
rel = *++p;
case 0:
break;
}
/* don't currently check for errors typing suffix */
CTRACE(tfp," temp=%s, *num=%d, rel='%c'\n",temp,*num,rel);
/*
* Check if we had a 'p' or 'P' following the number as
* a flag for displaying the page with that number. - FM
*/
if (( c == 'p' || c == 'P') && display_lines == 0) {
CTRACE(tfp," curline=%d, LYlines=%d, display too small!\n",
curline,LYlines);
return(PRINT_ERROR);
} else if ( c == 'p' || c == 'P' ) {
int nlines = HText_getNumOfLines();
int npages = ((nlines + 1) > display_lines) ?
(((nlines + 1) + (display_lines - 1))/(display_lines))
: 1;
int curpage = ((curline + 1) > display_lines) ?
(((curline + 1) + (display_lines - 1))/(display_lines))
: 1;
CTRACE(tfp," nlines=%d, npages=%d, curline=%d, curpage=%d\n",
nlines,npages,curline,curpage);
if (*num < 1)
*num = rel ? 0 : 1;
if ( rel == '+' )
*num = curpage + *num;
else if ( rel == '-' )
*num = curpage - *num;
doc->line = (npages <= 1) ?
1 :
((*num <= npages) ? (((*num - 1) * display_lines) + 1)
: (((npages - 1) * display_lines) + 1));
return(DO_GOTOPAGE_STUFF);
}
/*
* Check if we want to make the link corresponding to the
* number the current link, rather than ACTIVATE-ing it.
*/
want_go = ( c == 'g' || c == 'G' );
/* If rel, add or subtract num from current link, or
* nearest previous/subsequent link if current link is not on screen.
*/
if ( rel )
*num = HTGetRelLinkNum( *num, rel, cur );
/*
* If we have a valid number, act on it.
*/
if (*num > 0) {
int info;
/*
* Get the lname, and hightext, directly from www
* structures and add it to the cur link so that
* we can pass it transparently on to getfile(),
* and load new_top and new_link if we instead want
* to make the link number current. These things
* are done so that a link can be selected anywhere
* in the current document, whether it is displayed
* on the screen or not!
*/
if ((info = HTGetLinkInfo(*num,
want_go,
&new_top,
&new_link,
&links[cur].hightext,
&links[cur].lname)) == WWW_INTERN_LINK_TYPE) {
links[cur].type = WWW_INTERN_LINK_TYPE;
return(DO_LINK_STUFF);
} else if (info == LINK_LINE_FOUND) {
doc->line = new_top + 1;
doc->link = new_link;
return(DO_GOTOLINK_STUFF);
} else if (info) {
links[cur].type = WWW_LINK_TYPE;
return(DO_LINK_STUFF);
} else {
return(PRINT_ERROR);
}
} else {
return(PRINT_ERROR);
}
}
#if defined(EXEC_LINKS) || defined(LYNXCGI_LINKS)
struct trust {
char *src;
char *path;
int type;
struct trust *next;
};
static struct trust trusted_exec_default = {
"file://localhost/", "", EXEC_PATH, NULL
};
static struct trust always_trusted_exec_default = {
"none", "", ALWAYS_EXEC_PATH, NULL
};
static struct trust trusted_cgi_default = {
"", "", CGI_PATH, NULL
};
static struct trust *trusted_exec = &trusted_exec_default;
static struct trust *always_trusted_exec = &always_trusted_exec_default;
static struct trust *trusted_cgi = &trusted_cgi_default;
#ifdef LY_FIND_LEAKS
PRIVATE void LYTrusted_free NOARGS
{
struct trust *cur;
struct trust *next;
if (trusted_exec != &trusted_exec_default) {
cur = trusted_exec;
while (cur) {
FREE(cur->src);
FREE(cur->path);
next = cur->next;
FREE(cur);
cur = next;
}
}
if (always_trusted_exec != &always_trusted_exec_default) {
cur = always_trusted_exec;
while (cur) {
FREE(cur->src);
FREE(cur->path);
next = cur->next;
FREE(cur);
cur = next;
}
}
if (trusted_cgi != &trusted_cgi_default) {
cur = trusted_cgi;
while (cur) {
FREE(cur->src);
FREE(cur->path);
next = cur->next;
FREE(cur);
cur = next;
}
}
return;
}
#endif /* LY_FIND_LEAKS */
PUBLIC void add_trusted ARGS2(
char *, str,
int, type)
{
struct trust *tp;
char *path;
char *src = str;
int Type = type;
static BOOLEAN first = TRUE;
if (!src)
return;
if (first) {
#ifdef LY_FIND_LEAKS
atexit(LYTrusted_free);
#endif
first = FALSE;
}
path = strchr(src, '\t');
if (path)
*path++ = '\0';
else
path = "";
tp = (struct trust *)malloc(sizeof(*tp));
if (tp == NULL)
outofmem(__FILE__, "add_trusted");
tp->src = NULL;
tp->path = NULL;
tp->type = Type;
StrAllocCopy(tp->src, src);
StrAllocCopy(tp->path, path);
if (Type == EXEC_PATH) {
if (trusted_exec == &trusted_exec_default)
tp->next = NULL;
else
tp->next = trusted_exec;
trusted_exec = tp;
} else if (Type == ALWAYS_EXEC_PATH) {
if (always_trusted_exec == &always_trusted_exec_default)
tp->next = NULL;
else
tp->next = always_trusted_exec;
always_trusted_exec = tp;
} else if (Type == CGI_PATH) {
if (trusted_cgi == &trusted_cgi_default)
tp->next = NULL;
else
tp->next = trusted_cgi;
trusted_cgi = tp;
}
}
/*
* Check to see if the supplied paths is allowed to be executed.
*/
PUBLIC BOOLEAN exec_ok ARGS3(
CONST char *, source,
CONST char *, linktext,
int, type)
{
struct trust *tp;
CONST char *cp;
CONST char *allowed_extra_chars;
int Type = type;
/*
* Always OK if it is a jump file shortcut.
*/
if (LYJumpFileURL)
return TRUE;
/*
* Choose the trust structure based on the type.
*/
if (Type == EXEC_PATH) {
tp = trusted_exec;
} else if (Type == ALWAYS_EXEC_PATH) {
tp = always_trusted_exec;
} else if (Type == CGI_PATH) {
tp = trusted_cgi;
} else {
HTAlert(MALFORMED_EXEC_REQUEST);
return FALSE;
}
#ifdef VMS
/*
* Security: reject on relative path.
*/
if ((cp = strchr(linktext, '[')) != NULL) {
char *cp1;
if (((cp1 = strchr(cp, '-')) != NULL) &&
strchr(cp1, ']') != NULL) {
while (cp1[1] == '-')
cp1++;
if (cp1[1] == ']' ||
cp1[1] == '.') {
HTAlert(RELPATH_IN_EXEC_LINK);
return FALSE;
}
}
}
#else
/*
* Security: reject on relative path.
*/
if (strstr(linktext, "../") != NULL) {
HTAlert(RELPATH_IN_EXEC_LINK);
return FALSE;
}
/*
* Security: reject on strange character.
*/
if (Type == CGI_PATH)
allowed_extra_chars = " _-:./@~$&+=\t";
else
allowed_extra_chars = " _-:./@~$+=\t";
for (cp = linktext; *cp != '\0'; cp++) {
if (!isalnum(*cp) && !strchr(allowed_extra_chars, *cp)) {
char *buf = 0;
HTSprintf0(&buf,
BADCHAR_IN_EXEC_LINK,
*cp);
HTAlert(buf);
FREE(buf);
return FALSE;
}
}
#endif /* VMS */
check_tp_for_entry:
while (tp) {
if (tp->type == Type) {
char CONST *command = linktext;
if (strstr(command,"//") == linktext) {
command += 2;
}
if (STRNADDRCOMP(source, tp->src, strlen(tp->src)) == 0 &&
STRNADDRCOMP(command, tp->path, strlen(tp->path)) == 0)
return TRUE;
}
tp = tp->next;
}
if (Type == EXEC_PATH &&
always_trusted_exec != &always_trusted_exec_default) {
Type = ALWAYS_EXEC_PATH;
tp = always_trusted_exec;
goto check_tp_for_entry;
}
if (!(no_exec && type == ALWAYS_EXEC_PATH))
HTAlert(BADLOCPATH_IN_EXEC_LINK);
return FALSE;
}
#endif /* EXEC_LINKS || LYNXCGI_LINKS */
PRIVATE int fix_httplike_urls ARGS2(
document *, doc,
UrlTypes, type)
{
char *slash;
/*
* If there's a fragment present, our simplistic methods won't
* work. - kw
*/
if (strchr(doc->address, '#'))
return 0;
#ifndef DISABLE_FTP
/*
* If it's an ftp URL with a trailing slash, trim it off.
*/
if (type == FTP_URL_TYPE &&
LYIsHtmlSep(doc->address[strlen(doc->address)-1])) {
char * proxy;
char *path = HTParse(doc->address, "", PARSE_PATH|PARSE_PUNCTUATION);
/*
* If the path is a lone slash, we're done. - FM
*/
if (path) {
if (LYIsHtmlSep(path[0]) && path[1] == '\0') {
FREE(path);
return 0;
}
FREE(path);
}
/*
* If we're proxying ftp, don't trim anything. - KW
*/
if (((proxy = (char *)getenv("ftp_proxy")) != NULL) &&
*proxy != '\0' && !override_proxy(doc->address))
return 0;
/*
* If we get to here, trim the trailing slash. - FM
*/
CTRACE(tfp, "fix_httplike_urls: URL '%s'\n", doc->address);
LYTrimHtmlSep(doc->address);
CTRACE(tfp, " changed to '%s'\n", doc->address);
CTRACE_SLEEP(MessageSecs);
}
#endif /* DISABLE_FTP */
/*
* If there isn't a slash besides the two at the beginning, append one.
*/
if ((slash = strrchr(doc->address, '/')) != NULL) {
if (!LYIsHtmlSep(*(slash-1)) || *(slash-2) != ':') {
return(0);
}
if ((type == HTTP_URL_TYPE ||
type == HTTPS_URL_TYPE) &&
((slash-2) - strchr(doc->address, ':'))) {
/*
* Turns out we were not looking at the right slash after all,
* there must have been more than one "://" which is valid
* at least for http URLs (later occurrences can be part of
* a query string, for example), so leave this alone, too. - kw
*/
return(0);
}
}
CTRACE(tfp, "fix_httplike_urls: URL '%s'\n", doc->address);
LYAddHtmlSep(&(doc->address));
CTRACE(tfp, " changed to '%s'\n", doc->address);
CTRACE_SLEEP(MessageSecs);
return(1);
}