/* WorldWideWeb - Wide Area Information Server Access HTWAIS.c
** ==================================================
**
** This module allows a WWW server or client to read data from a
** remote WAIS
** server, and provide that data to a WWW client in hypertext form.
** Source files, once retrieved, are stored and used to provide
** information about the index when that is accessed.
**
** Authors
** BK Brewster Kahle, Thinking Machines, <Brewster@think.com>
** TBL Tim Berners-Lee, CERN <timbl@info.cern.ch>
** FM Foteos Macrides, WFEB <macrides@sci.wfeb.edu>
**
** History
** Sep 91 TBL adapted shell-ui.c (BK) with HTRetrieve.c from WWW.
** Feb 91 TBL Generated HTML cleaned up a bit (quotes, escaping)
** Refers to lists of sources.
** Mar 93 TBL Lib 2.0 compatible module made.
** May 94 FM Added DIRECT_WAIS support for VMS.
**
** Bugs
** Uses C stream i/o to read and write sockets, which won't work
** on VMS TCP systems.
**
** Should cache connections.
**
** ANSI C only as written
**
** Bugs fixed
** NT Nathan Torkington (Nathan.Torkington@vuw.ac.nz)
**
** WAIS comments:
**
** 1. Separate directories for different system's .o would help
** 2. Document ids are rather long!
**
** WWW Address mapping convention:
**
** /servername/database/type/length/document-id
**
** /servername/database?word+word+word
*/
/* WIDE AREA INFORMATION SERVER SOFTWARE:
No guarantees or restrictions. See the readme file for the full standard
disclaimer.
Brewster@think.com
*/
#include "HTUtils.h"
#include "tcp.h"
#include "HTParse.h"
#include "HTAccess.h" /* We implement a protocol */
#include "HTML.h" /* The object we will generate */
#include "HTFormat.h"
#include "HTTCP.h"
#include "HTCJK.h"
#include "HTAlert.h"
/* #include "HTWSRC.h" */ /* Need some bits from here */
/* #include "ParseWSRC.h" */
/* From WAIS
** ---------
*/
#ifdef VMS
#include "HTVMS_WaisUI.h"
#include "HTVMS_WaisProt.h"
#else
#include <ui.h>
#endif /* VMS */
/* Size in bytes of each of the request and response message buffers
** allocated by HTLoadWAIS. */
#define MAX_MESSAGE_LEN 100000
#define CHARS_PER_PAGE 10000 /* number of chars retrieved in each request */
/* NOTE(review): WAISSEARCH_DATE is not referenced in the visible part of
** this file. */
#define WAISSEARCH_DATE "Fri Jul 19 1991"
/* FROM WWW
** --------
*/
#include "LYLeaks.h"
/* Free x if it is non-null, then reset it to NULL.  This expands to a bare
** `if` statement, so it must not be used as the unbraced body of an
** if/else. */
#define FREE(x) if (x) {free(x); x = NULL;}
extern int HTCheckForInterrupt NOPARAMS;
/* NOTE(review): DIRECTORY is not referenced in the visible part of this
** file. */
#define DIRECTORY "/cnidr.org:210/directory-of-servers"
/* #define DIRECTORY "/quake.think.com:210/directory-of-servers" */
#define BIG 1024 /* identifier size limit @@@@@ */
#define BUFFER_SIZE 4096 /* Arbitrary size for efficiency */
#define HEX_ESCAPE '%'
extern HTCJKlang HTCJK;
extern int WWW_TraceFlag; /* Control diagnostic output */
extern FILE * logfile; /* Log file output */
PRIVATE BOOL as_gate; /* Client is using us as gateway */
PRIVATE char line[2048]; /* For building strings to display */
/* Must be able to take id */
/* Output helpers.  Each one expects a variable named `target` in scope
** whose `isa` member points at the class table with the method called. */
#define PUTC(c) (*target->isa->put_character)(target, c)
#define PUTS(s) (*target->isa->put_string)(target, s)
#define START(e) (*target->isa->start_element)(target, e, 0, 0, 0)
#define END(e) (*target->isa->end_element)(target, e, 0)
/* Emit the end tag only for elements whose DTD content model is not
** SGML_EMPTY. */
#define MAYBE_END(e) if (HTML_dtd.tags[e].contents != SGML_EMPTY) \
(*target->isa->end_element)(target, e, 0)
#define FREE_TARGET (*target->isa->_free)(target)
/* Local view of the structured-stream object.  Only the leading class
** pointer is declared here; it is the one member the START/END/PUTS/PUTC
** macros in this file dereference. */
struct _HTStructured {
CONST HTStructuredClass * isa;
/* ... */
};
/* Local view of the plain stream object; again only the class pointer
** is declared. */
struct _HTStream {
CONST HTStreamClass * isa;
/* ... */
};
/* ------------------------------------------------------------------------ */
/* ---------------- Local copy of connect_to_server calls ----------------- */
/* ------------------------------------------------------------------------ */
/*	Open a socket to a WAIS server		fd_mosaic_connect_to_server()
**	------------------------------
**
**	Builds a "wais://host:port/" URL and hands it to HTDoConnect,
**	passing 210 as the default-port argument.
**
** On entry,
**	host_name	name of the server host
**	port		TCP port number
**	fd		where to store the connected socket descriptor
**
** On exit,
**	returns 1 on success (*fd is set), 0 on failure, -1 on interrupt.
**	*fd is only written on success.
*/
PRIVATE int fd_mosaic_connect_to_server ARGS3(
	char *,		host_name,
	long,		port,
	long *,		fd)
{
    char dummy[256];
    int sock = -1;	/* HTDoConnect wants an int, not a long */
    int status;

    /*
    **	"%.200s" bounds the host so the URL always fits in dummy[];
    **	port is a long and therefore needs "%ld".
    */
    sprintf(dummy, "wais://%.200s:%ld/", host_name, port);

    /*
    **	Pass a real int rather than casting the caller's long pointer:
    **	writing an int through a (long *) leaves part of the long
    **	undefined on platforms where the two sizes differ.
    */
    status = HTDoConnect(dummy, "WAIS", 210, &sock);
    if (status == HT_INTERRUPTED)
	return -1;
    if (status < 0)
	return 0;

    *fd = sock;
    return 1;
}
/*	Connect to a WAIS server		mosaic_connect_to_server()
**	------------------------
**
**	Wraps fd_mosaic_connect_to_server() and reports problems to the
**	user with HTAlert.  On VMS the raw socket descriptor is handed back;
**	elsewhere the socket is wrapped in a read/write stdio stream.
**
** On entry,
**	host_name	name of the server host
**	port		TCP port number
**	fdp / fp	where to store the descriptor (VMS) or stream
**
** On exit,
**	returns 1 on success, 0 on fail, -1 on interrupt.
*/
#ifdef VMS
PRIVATE int mosaic_connect_to_server ARGS3(
	char *,		host_name,
	long,		port,
	long *,		fdp)
#else
PRIVATE int mosaic_connect_to_server ARGS3(
	char *,		host_name,
	long,		port,
	FILE **,	fp)
#endif /* VMS */
{
#ifndef VMS
    FILE *file;
#endif /* VMS */
    long fd = 0;	/* Fully initialised before the callee fills it in */
    int rv;

    rv = fd_mosaic_connect_to_server(host_name, port, &fd);
    if (rv == 0) {
	HTAlert("Could not connect to WAIS server.");
	return 0;
    }
    if (rv == -1) {
	HTAlert("Connection interrupted.");
	return -1;
    }

#ifndef VMS
    file = fdopen((int)fd, "r+");
    if (file == NULL) {
	HTAlert("Could not open WAIS connection for reading.");
	/* The socket is ours and nobody else will close it. */
	NETCLOSE((int)fd);
	return 0;
    }
    *fp = file;
#else
    *fdp = fd;
#endif /* VMS */
    return 1;
}
/* ------------------------------------------------------------------------ */
/* ------------------------------------------------------------------------ */
/*	Print WAIS diagnostic records			showDiags()
**	-----------------------------
**
**	(Modified from Jonny G's version in ui/question.c.)
**
**	Walks the NULL-terminated array d and, for every record that
**	carries additional information, writes its diagnostic code and
**	that information to target on one line.
*/
PRIVATE void showDiags ARGS2(
	HTStream *,		target,
	diagnosticRecord **,	d)
{
    diagnosticRecord **rec;

    for (rec = d; *rec != NULL; rec++) {
	if ((*rec)->ADDINFO == NULL)
	    continue;		/* Nothing extra to report for this one */
	PUTS("Diagnostic code is ");
	PUTS((*rec)->DIAG);
	PUTC(' ');
	PUTS((*rec)->ADDINFO);
	PUTC('\n');
    }
}
/*	Table of characters allowed unescaped in identifiers
**	----------------------------------------------------
**
**	acceptable[c] is YES for letters, digits and the characters
**	". / - _ $"; everything else is NO.  init_acceptable() fills the
**	table and sets acceptable_inited.
*/
PRIVATE BOOL acceptable[256];
PRIVATE BOOL acceptable_inited = NO;

PRIVATE void init_acceptable NOARGS
{
    CONST char * cp;
    int slot;

    /* Start with every character rejected ... */
    for (slot = 255; slot >= 0; slot--)
	acceptable[slot] = NO;

    /* ... then switch on the ones that are safe. */
    for (cp = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789./-_$";
	 *cp != '\0';
	 cp++) {
	acceptable[(unsigned int)*cp] = YES;
    }

    acceptable_inited = YES;
}
/*	Turn an archie file identifier into a WWW address
**	-------------------------------------------------
**
**	The identifier is taken to run up to the first character that is
**	not greater than a space (ASCII assumed).  It is prefixed with
**	"file://" and the first colon found after that prefix (expected
**	to follow the host name) is removed.
**
** On exit,
**	returns nil if the allocation failed,
**	otherwise a pointer to a malloced string which must be freed.
*/
PRIVATE char * WWW_from_archie ARGS1(
	char *,		file)
{
    char * stop = file;
    char * url;
    char * sep;
    size_t name_len;

    while (*stop > ' ')		/* assumes ASCII encoding */
	stop++;
    name_len = (size_t)(stop - file);

    url = (char *)malloc(10 + name_len);
    if (url == NULL)
	return NULL;		/* Malloc error */

    strcpy(url, "file://");
    strncat(url, file, name_len);

    sep = strchr(url + 7, ':');	/* Expect colon after host */
    if (sep != NULL) {
	/* Close the gap by shifting the tail down one place. */
	do {
	    sep[0] = sep[1];
	    sep++;
	} while (sep[0] != '\0');
    }
    return url;
} /* WWW_from_archie */
/*	Transform document identifier into URL
**	--------------------------------------
**
**	A WAIS document id is a sequence of records, each made of a type
**	byte, a length byte and that many data bytes.  Every record is
**	written as
**
**		<decimal type> '=' <data> ';'
**
**	where data bytes that are not in acceptable[] are written as
**	HEX_ESCAPE followed by two upper-case hex digits.
**
**	The string is assembled in a static buffer of BIG bytes.  An id
**	which does not fit, or whose records are truncated or carry a
**	type above 10, is rejected rather than overrunning the buffer or
**	the input.  Bytes are handled as unsigned so that values above
**	127 index acceptable[] and hex[] correctly.
**
**	acceptable[] must have been set up with init_acceptable().
**
** On exit,
**	returns nil if error
**	pointer to malloced string (must be freed) if ok
*/
PRIVATE char hex [17] = "0123456789ABCDEF";
extern char from_hex PARAMS((char a));	/* In HTWSRC @@ */

PRIVATE char * WWW_from_WAIS ARGS1(
	any *,		docid)
{
    static char buf[BIG];
    char * q = buf;
    char * limit = buf + BIG - 1;	/* Last slot is kept for the NUL */
    unsigned char * p;
    unsigned char * end;
    unsigned int type, len, i;

    if (!docid || !docid->bytes)
	return 0;
    p = (unsigned char *)docid->bytes;
    end = p + docid->size;

    if (TRACE) {
	unsigned char *t;
	fprintf(stderr, "WAIS id (%d bytes) is ", (int)docid->size);
	for (t = p; t < end; t++) {
	    if ((*t >= ' ') && (*t <= '~'))	/* Assume ASCII! */
		fprintf(stderr, "%c", *t);
	    else
		fprintf(stderr, "<%x>", (unsigned)*t);
	}
	fprintf(stderr, "\n");
    }

    while (p < end) {
	if (end - p < 2)		/* No room for type + length */
	    goto bad_id;
	type = p[0];
	len = p[1];
	if (TRACE)
	    fprintf(stderr, "  Record type %u, length %u\n", type, len);
	if (type > 10) {
	    if (TRACE)
		fprintf(stderr, "Eh? DOCID record type of %d!\n", (int)type);
	    return 0;
	}
	p += 2;
	if ((unsigned long)(end - p) < (unsigned long)len)
	    goto bad_id;		/* Record runs off the end of the id */

	if (limit - q < 3)		/* Up to two digits plus '=' */
	    goto bad_id;
	if (type > 9)
	    *q++ = (char)('0' + type / 10);
	*q++ = (char)('0' + type % 10);	/* Record type */
	*q++ = '=';			/* Separate */

	for (i = 0; i < len; i++, p++) {
	    if (acceptable[*p]) {
		if (limit - q < 1)
		    goto bad_id;
		*q++ = (char)*p;
	    } else {
		if (limit - q < 3)
		    goto bad_id;
		*q++ = HEX_ESCAPE;	/* Means hex coming */
		*q++ = hex[(*p) >> 4];
		*q++ = hex[(*p) & 15];
	    }
	}
	if (limit - q < 1)
	    goto bad_id;
	*q++ = ';';			/* Terminate field */
    }
    *q = 0;				/* Terminate string */

    if (TRACE)
	fprintf(stderr, "WWW form of id: %s\n", buf);
    {
	char * result = (char *)malloc(strlen(buf) + 1);
	if (!result)
	    outofmem(__FILE__, "WWW_from_WAIS");
	strcpy(result, buf);
	return result;
    }

bad_id:
    if (TRACE)
	fprintf(stderr, "HTWAIS: malformed or over-long WAIS document id\n");
    return 0;
} /* WWW_from_WAIS */
/* Transform URL into WAIS document identifier
** -------------------------------------------
**
** On entry,
** docname points to valid name produced originally by
** WWW_from_WAIS
** On exit,
** docid->size is valid
** docid->bytes is malloced and must later be freed.
*/
PRIVATE any * WAIS_from_WWW ARGS2(
any *, docid,
char *, docname)
{
char *z; /* Output pointer */
char *sor; /* Start of record - points to size field. */
char *p; /* Input pointer */
char *q; /* Poisition of "=" */
char *s; /* Position of semicolon */
int n; /* size */
if (TRACE)
fprintf(stderr, "WWW id (to become WAIS id): %s\n", docname);
for (n = 0, p = docname; *p; p++) { /* Count sizes of strings */
n++;
if (*p == ';')
n--; /* Not converted */
else if (*p == HEX_ESCAPE)
n = n-2; /* Save two bytes */
docid->size = n;
}
if (!(docid->bytes = (char *) malloc(docid->size))) /* result record */
outofmem(__FILE__, "WAIS_from_WWW");
z = docid->bytes;
for (p = docname; *p; ) { /* Convert of strings */
/* Record type */
*z = 0; /* Initialize record type */
while (*p >= '0' && *p <= '9') {
*z = *z*10 + (*p++ - '0'); /* Decode decimal record type */
}
z++;
if (*p != '=')
return 0;
q = p;
/* *z++ = *p++ - '0';
q = strchr(p , '=');
if (!q) return 0;
*/
s = strchr(q, ';'); /* (Check only) */
if (!s)
return 0; /* Bad! No ';'; */
sor = z; /* Remember where the size field was */
z++; /* Skip record size for now */
for (p = q+1; *p != ';';) {
if (*p == HEX_ESCAPE) {
char c;
unsigned int b;
p++;
c = *p++;
b = from_hex(c);
c = *p++;
if (!c)
break; /* Odd number of chars! */
*z++ = (b<<4) + from_hex(c);
} else {
*z++ = *p++; /* Record */
}
}
*sor = (z-sor-1); /* Fill in size -- not counting size itself */
p++; /* After semicolon: start of next record */
}
if (TRACE) {
char *p;
fprintf(stderr, "WAIS id (%d bytes) is ", (int)docid->size);
for (p = docid->bytes; p < docid->bytes+docid->size; p++) {
if ((*p >= ' ') && (*p<= '~')) /* Assume ASCII! */
fprintf(stderr, "%c", *p);
else
fprintf(stderr, "<%x>", (unsigned)*p);
}
fprintf(stderr, "\n");
}
return docid; /* Ok */
} /* WAIS_from_WWW */
/*	Send a plain text record to the client		output_text_record()
**	--------------------------------------
**
**	In binary mode the whole text is passed to the stream's put_block
**	unchanged.  Otherwise it is copied a character at a time:
**
**	- ESC (27) introduces a marker which is skipped: one further
**	  character if it is followed by '(' or ')' (term marker), four
**	  otherwise (paragraph marker);
**	- CR and LF are both written as '\n';
**	- TAB and printable characters are copied; when a CJK mode is
**	  active every remaining character is copied;
**	- anything else is dropped.
**
** On entry,
**	target			stream to write to
**	record			text record to send; nil is ignored
**	quote_string_quotes	not used
**	binary			send the bytes untouched
*/
PRIVATE void output_text_record ARGS4(
	HTStream *,		target,
	WAISDocumentText *,	record,
	boolean,		quote_string_quotes,
	boolean,		binary)
{
    long count;
    long size;

    if (!record || !record->DocumentText)
	return;

    if (binary) {
	(*target->isa->put_block)(target,
				  record->DocumentText->bytes,
				  record->DocumentText->size);
	return;
    }

    size = (long)record->DocumentText->size;
    for (count = 0; count < size; count++) {
	long ch = (unsigned char)record->DocumentText->bytes[count];

	if (ch == 27) {		/* What is this in for?  Tim */
	    /*
	    **	Escape code.  Only look at the following character if
	    **	there is one: an ESC in the last position used to read
	    **	one byte past the end of the text.
	    */
	    char next = (count + 1 < size)
			? record->DocumentText->bytes[count + 1] : '\0';
	    if (next == '(' || next == ')')
		count += 1;	/* it is a term marker */
	    else
		count += 4;	/* it is a paragraph marker */
	} else if (ch == '\n' || ch == '\r') {
	    PUTC('\n');
	} else if (HTCJK != NOCJK || ch == '\t' || isprint(ch)) {
	    PUTC(ch);
	}
    }
} /* output text record */
/*	Format A Search response for the client	display_search_response
**	---------------------------------------
**
**	(Modified from tracy shen's version in wutil.c.)
**
**	Writes an introductory sentence followed by an ordered list with
**	one item per document header in the response.  Each item is an
**	anchor on the headline followed by the score and line count.
**
**	- For databases whose name contains "archie" the headline itself
**	  is turned into a file: URL with WWW_from_archie().
**	- Otherwise the anchor is /database/type/length/docid built with
**	  WWW_from_WAIS(), unless the first type is "URL", in which case
**	  the headline is used as the address.  An address that would not
**	  fit in line[] is reported as a bad doc id instead of overflowing.
**
**	Text records are written with output_text_record(); the other
**	record kinds only produce a "can't display" notice.  Each of those
**	loops advances its index: they used to test the same element
**	for ever as soon as one such record was present.
**
** On entry,
**	target		structured stream to write to
**	response	parsed search response
**	database	name of the database searched
**	keywords	the search words, for display
*/
PRIVATE void display_search_response ARGS4(
	HTStructured *,		target,
	SearchResponseAPDU *,	response,
	char *,			database,
	char *,			keywords)
{
    WAISSearchResponse *info;
    long i, k;
    BOOL archie = strstr(database, "archie") != 0;	/* Special handling */

    if (TRACE)
	fprintf(stderr, "HTWAIS: Displaying search response\n");

    PUTS("Index ");
    START(HTML_EM);
    PUTS(database);
    END(HTML_EM);
    sprintf(line, " contains the following %d item%s relevant to \"",
	    (int)(response->NumberOfRecordsReturned),
	    response->NumberOfRecordsReturned == 1 ? "" : "s");
    PUTS(line);
    START(HTML_EM);
    PUTS(keywords);
    END(HTML_EM);
    PUTS("\".\n");
    PUTS("The first figure after each entry is its relative score, ");
    PUTS("the second is the number of lines in the item.");
    START(HTML_BR);
    START(HTML_BR);
    PUTS("\n");
    START(HTML_OL);

    if (response->DatabaseDiagnosticRecords != 0) {
	info = (WAISSearchResponse *)response->DatabaseDiagnosticRecords;
	i = 0;

	if (info->Diagnostics != NULL)
	    showDiags((HTStream*)target, info->Diagnostics);

	if (info->DocHeaders != 0) {
	    for (k = 0; info->DocHeaders[k] != 0; k++) {
		WAISDocumentHeader* head = info->DocHeaders[k];
		char * headline = trim_junk(head->Headline);
		any * docid = head->DocumentID;
		char * docname;		/* printable version of docid */

		i++;
		if (TRACE)
		    fprintf(stderr,
			    "HTWAIS:  %2ld: Score: %4ld, lines:%4ld '%s'\n",
			    i,
			    (long int)(info->DocHeaders[k]->Score),
			    (long int)(info->DocHeaders[k]->Lines),
			    headline);

		START(HTML_LI);

		if (archie) {
		    char * www_name = WWW_from_archie(headline);
		    if (www_name) {
			HTStartAnchor(target, NULL, www_name);
			PUTS(headline);
			END(HTML_A);
			FREE(www_name);
		    } else {
			PUTS(headline);
			PUTS(" (bad file name)");
		    }
		} else {		/* Not archie */
		    /*
		    **	Make a printable string out of the document id.
		    */
		    docname = WWW_from_WAIS(docid);
		    if (docname) {
			char * dbname = HTEscape(database, URL_XPALPHAS);
			/* An empty type list is treated like a missing one */
			char * type = (head->Types && head->Types[0])
				      ? head->Types[0] : "TEXT";

			/*
			**  32 covers the three '/' characters, the
			**  decimal length and the terminating NUL.
			*/
			if (dbname &&
			    strlen(dbname) + strlen(type) + strlen(docname)
				+ 32 < sizeof(line)) {
			    sprintf(line,
				    "/%s/%s/%d/%s",	/* W3 address */
				    dbname,
				    type,
				    (int)(head->DocumentLength),
				    docname);
			    HTStartAnchor(target, NULL,
					  !strcmp(type, "URL")
					  ? headline : line);	/* NT, Sep 93 */
			    PUTS(headline);
			    END(HTML_A);
			} else {
			    PUTS("(bad doc id)");
			}
			FREE(dbname);
			FREE(docname);
		    } else {
			PUTS("(bad doc id)");
		    }
		}

		sprintf(line, "%5ld  %5ld  ",
			(long int)head->Score,
			(long int)head->Lines);
		PUTS(line);
		MAYBE_END(HTML_LI);
	    } /* next document header */
	} /* if there were any document headers */

	if (info->ShortHeaders != 0) {
	    for (k = 0; info->ShortHeaders[k] != 0; k++) {
		i++;
		PUTS("(Short Header record, can't display)");
	    }
	}
	if (info->LongHeaders != 0) {
	    for (k = 0; info->LongHeaders[k] != 0; k++) {
		i++;
		PUTS("\nLong Header record, can't display\n");
	    }
	}
	if (info->Text != 0) {
	    for (k = 0; info->Text[k] != 0; k++) {
		i++;
		PUTS("\nText record\n");
		output_text_record((HTStream*)target,
				   info->Text[k], false, false);
	    }
	}
	if (info->Headlines != 0) {
	    for (k = 0; info->Headlines[k] != 0; k++) {
		i++;
		PUTS("\nHeadline record, can't display\n");
		/* dsply_headline_record( info->Headlines[k]); */
	    }
	}
	if (info->Codes != 0) {
	    for (k = 0; info->Codes[k] != 0; k++) {
		i++;
		PUTS("\nCode record, can't display\n");
		/* dsply_code_record( info->Codes[k]); */
	    }
	}
    } /* Loop: display user info */

    END(HTML_OL);
    PUTC('\n');
}
/*	Load by name					HTLoadWAIS
**	============
**
**	This renders any object or search as required.
**
**	The address is one of
**
**		/servername/database			index cover page
**		/servername/database?word+word+word	search
**		/servername/database/type/length/document-id
**							document fetch
**
**	(a leading double slash is also accepted and sets as_gate).
**
** On entry,
**	arg		the address to load
**	anAnchor	anchor the result belongs to
**	format_out	format wanted by the caller
**	sink		stream the result is written to
**
** On exit,
**	returns HT_LOADED on success, HT_INTERRUPTED if the user
**	interrupted a transfer, HT_NOT_LOADED on connection or protocol
**	failure, or whatever HTLoadError() returns for a bad address or an
**	impossible format conversion.
**
**	Everything allocated here (the parsed address, the message
**	buffers, the connection, the decoded document id and the parsed
**	responses) is released on every return path.
*/
#define MAX_KEYWORDS_LENGTH 1000
#define MAX_SERVER_LENGTH 1000
#define MAX_DATABASE_LENGTH 1000
#define MAX_SERVICE_LENGTH 1000
#define MAXDOCS 200

PUBLIC int HTLoadWAIS ARGS4(
	CONST char *,		arg,
	HTParentAnchor *,	anAnchor,
	HTFormat,		format_out,
	HTStream*,		sink)
{
    char * key;			  /* pointer to keywords in URL */
    char* request_message = NULL; /* arbitrary message limit */
    char* response_message = NULL; /* arbitrary message limit */
    long request_buffer_length;	/* how much of the request is left */
    SearchResponseAPDU *retrieval_response = 0;
    char keywords[MAX_KEYWORDS_LENGTH + 1];
    char *server_name = NULL;
    char *wais_database = NULL;		/* name of current database */
    char *www_database = NULL;		/* Same name escaped */
    char *service;
    char *doctype = NULL;
    char *doclength = NULL;
    long document_length = 0;
    char *docname = NULL;
#ifdef VMS
    long connection = 0;
#else
    FILE *connection = NULL;
#endif /* VMS */
    char * names;		/* Copy of arg to be hacked up */
    BOOL ok = NO;
    int return_status = HT_LOADED;
    int rv;

    if (!acceptable_inited)
	init_acceptable();

    /*	Decipher and check syntax of WWW address:
    **	----------------------------------------
    **
    **	First we remove the "wais:" if it was specified.  920110
    */
    names = HTParse(arg, "", PARSE_HOST | PARSE_PATH | PARSE_PUNCTUATION);
    key = strchr(names, '?');

    if (key) {
	char * p;
	*key++ = 0;	/* Split off keywords */
	for (p = key; *p; p++)
	    if (*p == '+')
		*p = ' ';
	HTUnEscape(key);
    }
    if (names[0] == '/') {
	server_name = names+1;
	as_gate = (*server_name == '/');
	if (as_gate)
	    server_name++;	/* Accept one or two */
	www_database = strchr(server_name, '/');
	if (www_database) {
	    *www_database++ = 0;		/* Separate database name */
	    doctype = strchr(www_database, '/');
	    if (key) {
		ok = YES;	/* Don't need doc details */
	    } else if (doctype) { /* If not search parse doc details */
		*doctype++ = 0; /* Separate rest of doc address */
		doclength = strchr(doctype, '/');
		if (doclength) {
		    *doclength++ = 0;
		    document_length = atol(doclength);
		    /* A negative length is as useless as a zero one */
		    if (document_length > 0) {
			docname = strchr(doclength, '/');
			if (docname) {
			    *docname++ = 0;
			    ok = YES;	/* To avoid a goto! */
			} /* if docname */
		    } /* if document_length valid */
		} /* if doclength */
	    } else { /* no doctype?  Assume index required */
		if (!key)
		    key = "";
		ok = YES;
	    } /* if doctype */
	} /* if database */
    }

    if (!ok) {
	FREE(names);	/* Used to leak on this path */
	return HTLoadError(sink, 500, "Syntax error in WAIS URL");
    }

    if (TRACE)
	fprintf(stderr, "HTWAIS: Parsed OK\n");

    service = strchr(names, ':');
    if (service)
	*service++ = 0;
    else
	service = "210";

    if (server_name[0] == 0) {
#ifdef VMS
	connection = 0;
#else
	connection = NULL;
#endif /* VMS */
    } else if (!(key && !*key)) {
	int status;
	if (TRACE)
	    fprintf (stderr, "===WAIS=== calling mosaic_connect_to_server\n");
	status = mosaic_connect_to_server(server_name,
					  atoi(service),
					  &connection);
	if (status == 0) {
	    if (TRACE)
		fprintf (stderr, "===WAIS=== connection failed\n");
	    FREE(names);
	    return HT_NOT_LOADED;
	} else if (status == -1) {
	    if (TRACE)
		fprintf (stderr, "===WAIS=== connection interrupted\n");
	    FREE(names);
	    return HT_NOT_LOADED;
	}
    }

    StrAllocCopy(wais_database, www_database);
    HTUnEscape(wais_database);

    /*
    **	This below fixed size stuff is terrible.
    */
#ifdef VMS
    if (!(request_message =
	  (char*)calloc((size_t)MAX_MESSAGE_LEN*sizeof(char),1)))
	outofmem(__FILE__, "HTLoadWAIS");
    if (!(response_message =
	  (char*)calloc((size_t)MAX_MESSAGE_LEN*sizeof(char),1)))
	outofmem(__FILE__, "HTLoadWAIS");
#else
    request_message = (char*)s_malloc((size_t)MAX_MESSAGE_LEN * sizeof(char));
    response_message = (char*)s_malloc((size_t)MAX_MESSAGE_LEN * sizeof(char));
#endif /* VMS */

    /*
    **	If keyword search is performed but there are no keywords,
    **	the user has followed a link to the index itself.  It would be
    **	appropriate at this point to send him the .SRC file - how?
    */
    if (key && !*key) {				/* I N D E X */
#ifdef CACHE_FILE_PREFIX
	char filename[512];
	FILE * fp;
#endif
	HTStructured * target = HTML_new(anAnchor, format_out, sink);

	START(HTML_HEAD);
	PUTS("\n");
	HTStartIsIndex(target, "Enter WAIS query: ", NULL);
	PUTS("\n");

	START(HTML_TITLE);
	PUTS(wais_database);
	PUTS(" (WAIS Index)");
	END(HTML_TITLE);
	PUTS("\n");
	END(HTML_HEAD);
	PUTS("\n");

	START(HTML_H1);
	PUTS("WAIS Index: ");
	START(HTML_EM);
	PUTS(wais_database);
	END(HTML_EM);
	END(HTML_H1);
	PUTS("\n");
	PUTS("This is a link for searching the ");
	START(HTML_EM);
	PUTS(wais_database);
	END(HTML_EM);
	PUTS(" WAIS Index.\n");

	/*
	**	If we have seen a source file for this database, use that.
	*/
#ifdef CACHE_FILE_PREFIX
	/* Every field is bounded so the name always fits in filename[] */
	sprintf(filename, "%.200sWSRC-%.100s:%.20s:%.100s.txt",
		CACHE_FILE_PREFIX,
		server_name, service, www_database);

	fp = fopen(filename, "r");	/* Have we found this already? */
	if (TRACE) fprintf(stderr,
		"HTWAIS: Description of server %s %s.\n",
		filename,
		fp ? "exists already" : "does NOT exist!");

	if (fp) {
	    int c;	/* int, so that EOF is distinct from every char */
	    START(HTML_PRE);		/* Preformatted description */
	    PUTS("\n");
	    while ((c = getc(fp)) != EOF)
		PUTC(c);		/* Transfer file */
	    END(HTML_PRE);
	    fclose(fp);
	}
#endif
	START(HTML_P);
	PUTS("\nEnter the 's'earch command and then specify search words.\n");

	FREE_TARGET;

    } else if (key) {				/* S E A R C H */
	char *p;
	HTStructured * target;

	/* strncpy does not terminate when the source is too long */
	strncpy(keywords, key, MAX_KEYWORDS_LENGTH);
	keywords[MAX_KEYWORDS_LENGTH] = '\0';
	while ((p = strchr(keywords, '+')) != NULL)
	    *p = ' ';

	/*
	**	Send advance title to get something fast to the other end.
	*/
	target = HTML_new(anAnchor, format_out, sink);

	START(HTML_HEAD);
	PUTS("\n");
	HTStartIsIndex(target, "Enter WAIS query: ", NULL);
	PUTS("\n");
	START(HTML_TITLE);
	PUTS(keywords);
	PUTS(" (in ");
	PUTS(wais_database);
	PUTS(")");
	END(HTML_TITLE);
	PUTS("\n");
	END(HTML_HEAD);
	PUTS("\n");

	START(HTML_H1);
	PUTS("WAIS Search of \"");
	START(HTML_EM);
	PUTS(keywords);
	END(HTML_EM);
	PUTS("\" in: ");
	START(HTML_EM);
	PUTS(wais_database);
	END(HTML_EM);
	END(HTML_H1);
	PUTS("\n");

	request_buffer_length = MAX_MESSAGE_LEN; /* Amount left */
	if (TRACE) fprintf(stderr, "HTWAIS: Search for `%s' in `%s'\n",
		keywords, wais_database);
	if (NULL ==
	    generate_search_apdu(request_message + HEADER_LENGTH,
				 &request_buffer_length,
				 keywords, wais_database, NULL, MAXDOCS)) {
#ifdef VMS
	    HTAlert ("HTWAIS: Request too large.");
	    return_status = HT_NOT_LOADED;
	    FREE_TARGET;
	    goto CleanUp;
#else
	    panic("request too large");
#endif /* VMS */
	}

	HTProgress("Searching WAIS database...");
	rv = interpret_message (request_message,
				MAX_MESSAGE_LEN - request_buffer_length,
				response_message,
				MAX_MESSAGE_LEN,
				connection,
				false	/* true verbose */
			       );

	if (rv == HT_INTERRUPTED) {
	    HTAlert ("Search interrupted.");
	    return_status = HT_INTERRUPTED;
	    FREE_TARGET;
	    goto CleanUp;
	} else if (!rv) {
#ifdef VMS
	    HTAlert ("HTWAIS: Return message too large.");
	    return_status = HT_NOT_LOADED;
	    FREE_TARGET;
	    goto CleanUp;
#else
	    panic("returned message too large");
#endif /* VMS */
	} else {	/* returned message ok */
	    SearchResponseAPDU *query_response = 0;
	    readSearchResponseAPDU(&query_response,
				   response_message + HEADER_LENGTH);
	    if (query_response) {
		display_search_response(target,
			query_response, wais_database, keywords);
		if (query_response->DatabaseDiagnosticRecords)
		    freeWAISSearchResponse(
			query_response->DatabaseDiagnosticRecords);
		freeSearchResponseAPDU(query_response);
	    }
	}	/* returned message not too large */
	FREE_TARGET;

    } else {			/* D O C U M E N T    F E T C H */
	HTFormat format_in;
	boolean binary;	/* how to transfer stuff coming over */
	HTStream * target;
	long count;
	any doc_chunk;
	any * docid = &doc_chunk;

	doc_chunk.size = 0;
	doc_chunk.bytes = NULL;

	if (TRACE) fprintf(stderr,
		"HTWAIS: Retrieve document id `%s' type `%s' length %ld\n",
		docname, doctype, document_length);

	format_in =
	  !strcmp(doctype, "WSRC") ? HTAtom_for("application/x-wais-source") :
	  !strcmp(doctype, "TEXT") ? HTAtom_for("text/plain") :
	  !strcmp(doctype, "HTML") ? HTAtom_for("text/html") :
	  !strcmp(doctype, "GIF")  ? HTAtom_for("image/gif") :
				     HTAtom_for("application/octet-stream");
	binary =
	  0 != strcmp(doctype, "WSRC") &&
	  0 != strcmp(doctype, "TEXT") &&
	  0 != strcmp(doctype, "HTML") ;

	target = HTStreamStack(format_in, format_out, sink, anAnchor);
	if (!target) {
	    /* Go through CleanUp: buffers and connection are live here */
	    return_status = HTLoadError(sink, 500,
				"Can't convert format of WAIS document");
	    goto CleanUp;
	}

	/*
	**	Decode hex or literal format for document ID.
	*/
	if (!WAIS_from_WWW(docid, docname)) {
	    HTAlert ("HTWAIS: Bad document identifier.");
	    (*target->isa->_abort)(target, NULL);
	    FREE(docid->bytes);
	    return_status = HT_NOT_LOADED;
	    goto CleanUp;
	}

	/*
	**	Loop over slices of the document.
	*/
	for (count = 0;
	     count * CHARS_PER_PAGE < document_length;
	     count++) {
#ifdef VMS
	    char *type = NULL;

	    StrAllocCopy(type, doctype);
#else
	    /* NOTE(review): only freed on some paths outside VMS; who
	    ** owns this copy needs confirming against the WAIS library. */
	    char *type = s_strdup(doctype);	/* Gets freed I guess */
#endif /* VMS */
	    request_buffer_length = MAX_MESSAGE_LEN; /* Amount left */
	    if (TRACE)
		fprintf(stderr, "HTWAIS: Slice number %ld\n", count);

	    if (HTCheckForInterrupt()) {
		HTAlert ("Data transfer interrupted.");
		(*target->isa->_abort)(target, NULL);
#ifdef VMS
		FREE(type);
#endif /* VMS */
		FREE(docid->bytes);
		return_status = HT_NOT_LOADED;
		goto CleanUp;
	    }

	    if (0 ==
		generate_retrieval_apdu(request_message + HEADER_LENGTH,
			&request_buffer_length,
			docid,
			CT_byte,
			count * CHARS_PER_PAGE,
			((count + 1) * CHARS_PER_PAGE <= document_length ?
			 (count + 1) * CHARS_PER_PAGE :
			 document_length),
			type,
			wais_database)) {
#ifdef VMS
		HTAlert ("HTWAIS: Request too long.");
		return_status = HT_NOT_LOADED;
		FREE_TARGET;
		FREE(type);
		FREE(docid->bytes);
		goto CleanUp;
#else
		panic("request too long");
#endif /* VMS */
	    }

	    /*
	    **	Actually do the transaction given by request_message.
	    */
	    HTProgress("Fetching WAIS document...");
	    rv = interpret_message(request_message,
				   MAX_MESSAGE_LEN - request_buffer_length,
				   response_message,
				   MAX_MESSAGE_LEN,
				   connection,
				   false /* true verbose */
				  );
	    if (rv == HT_INTERRUPTED) {
		HTAlert ("Data transfer interrupted.");
		return_status = HT_INTERRUPTED;
		FREE_TARGET;
		FREE(type);
		FREE(docid->bytes);
		goto CleanUp;
	    } else if (!rv) {
#ifdef VMS
		HTAlert ("HTWAIS: Return message too large.");
		return_status = HT_NOT_LOADED;
		FREE_TARGET;
		FREE(type);
		FREE(docid->bytes);
		goto CleanUp;
#else
		panic("Returned message too large");
#endif /* VMS */
	    }

	    /*
	    **	Parse the result which came back into memory.
	    */
	    readSearchResponseAPDU(&retrieval_response,
				   response_message + HEADER_LENGTH);

	    if (!retrieval_response ||
		!retrieval_response->DatabaseDiagnosticRecords ||
		NULL ==
		((WAISSearchResponse *)
		 retrieval_response->DatabaseDiagnosticRecords)->Text) {
		/* display_search_response(target, retrieval_response,
					wais_database, keywords); */
		PUTS("No text was returned!\n");
		/* panic("No text was returned"); */
	    } else {
		output_text_record(target,
		   ((WAISSearchResponse *)
		    retrieval_response->DatabaseDiagnosticRecords)->Text[0],
		   false, binary);
	    } /* If text existed */

	    /*
	    **	Release this slice's response before the next one is
	    **	read; only the last one used to be freed.
	    */
	    if (retrieval_response) {
		if (retrieval_response->DatabaseDiagnosticRecords)
		    freeWAISSearchResponse(
			retrieval_response->DatabaseDiagnosticRecords);
		freeSearchResponseAPDU(retrieval_response);
		retrieval_response = 0;
	    }

#ifdef VMS
	    FREE(type);
#endif /* VMS */
	}	/* Loop over slices */

	FREE_TARGET;
	FREE(docid->bytes);

    } /* If document rather than search */

CleanUp:
    /*
    **	(This postponed until later, after a timeout:)
    */
#ifdef VMS
    if (connection)
	NETCLOSE((int)connection);
#else
    if (connection)
	fclose(connection);
#endif /* VMS */
    FREE(wais_database);
#ifdef VMS
    FREE(request_message);
    FREE(response_message);
#else
    s_free(request_message);
    s_free(response_message);
#endif /* VMS */
    FREE(names);
    return (return_status);
}
/* Protocol descriptor that names HTLoadWAIS as the handler for "wais".
** Two spellings are needed because GLOBALDEF is a function-like macro on
** some platforms and a plain storage-class keyword on others.
** NOTE(review): the meaning of the third (NULL) initializer is defined by
** HTProtocol, which is not visible in this file. */
#ifdef GLOBALDEF_IS_MACRO
#define _HTWAIS_C_1_INIT { "wais", HTLoadWAIS, NULL }
GLOBALDEF(HTProtocol, HTWAIS, _HTWAIS_C_1_INIT);
#else
GLOBALDEF PUBLIC HTProtocol HTWAIS = { "wais", HTLoadWAIS, NULL };
#endif /* GLOBALDEF_IS_MACRO */