/*      WorldWideWeb - Wide Area Information Server Access      HTWAIS.c
**      ==================================================
**
**      This module allows a WWW server or client to read data from a
**      remote WAIS server, and provide that data to a WWW client in
**      hypertext form.  Source files, once retrieved, are stored and used
**      to provide information about the index when that is accessed.
**
**      Authors
**              BK      Brewster Kahle, Thinking Machines
**              TBL     Tim Berners-Lee, CERN
**              FM      Foteos Macrides, WFEB
**
**      History
**         Sep 91   TBL adapted shell-ui.c (BK) with HTRetrieve.c from WWW.
**         Feb 91   TBL Generated HTML cleaned up a bit (quotes, escaping)
**                      Refers to lists of sources.
**         Mar 93   TBL Lib 2.0 compatible module made.
**         May 94   FM  Added DIRECT_WAIS support for VMS.
**
**      Bugs
**              Uses C stream i/o to read and write sockets, which won't work
**              on VMS TCP systems.
**
**              Should cache connections.
**
**              ANSI C only as written
**
**      Bugs fixed
**              NT      Nathan Torkington (Nathan.Torkington@vuw.ac.nz)
**
**      WAIS comments:
**
**      1.      Separate directories for different system's .o would help
**      2.      Document ids are rather long!
**
**      WWW Address mapping convention:
**
**              /servername/database/type/length/document-id
**
**              /servername/database?word+word+word
*/
/* WIDE AREA INFORMATION SERVER SOFTWARE:
   No guarantees or restrictions.  See the readme file for the full standard
   disclaimer.

   Brewster@think.com
*/

#include "HTUtils.h"
#include "tcp.h"
#include "HTParse.h"
#include "HTAccess.h"           /* We implement a protocol */
#include "HTML.h"               /* The object we will generate */
#include "HTFormat.h"
#include "HTTCP.h"
#include "HTCJK.h"
#include "HTAlert.h"
/* #include "HTWSRC.h" */       /* Need some bits from here */
/* #include "ParseWSRC.h" */

/*                      From WAIS
**                      ---------
*/
#ifdef VMS
#include "HTVMS_WaisUI.h"
#include "HTVMS_WaisProt.h"
#else
/* NOTE(review): the header name was missing from this directive in the copy
** under review (angle-bracket text lost); <ui.h> is presumably the WAIS
** client header that declares the APDU helpers used below -- confirm.
*/
#include <ui.h>
#endif /* VMS */

#define MAX_MESSAGE_LEN 100000
#define CHARS_PER_PAGE 10000    /* number of chars retrieved in each request */

#define WAISSEARCH_DATE "Fri Jul 19 1991"

/*                      FROM WWW
**                      --------
*/
#include "LYLeaks.h"

#define FREE(x) if (x) {free(x); x = NULL;}

extern int HTCheckForInterrupt NOPARAMS;

#define DIRECTORY "/cnidr.org:210/directory-of-servers"
/* #define DIRECTORY "/quake.think.com:210/directory-of-servers" */

#define BIG 1024                /* identifier size limit  @@@@@ */

#define BUFFER_SIZE 4096        /* Arbitrary size for efficiency */

#define HEX_ESCAPE '%'

extern HTCJKlang HTCJK;

extern int WWW_TraceFlag;       /* Control diagnostic output */
extern FILE * logfile;          /* Log file output */

PRIVATE BOOL    as_gate;        /* Client is using us as gateway */

PRIVATE char    line[2048];     /* For building strings to display */
                                /* Must be able to take id */

#define PUTC(c) (*target->isa->put_character)(target, c)
#define PUTS(s) (*target->isa->put_string)(target, s)
#define START(e) (*target->isa->start_element)(target, e, 0, 0, 0)
#define END(e) (*target->isa->end_element)(target, e, 0)
#define MAYBE_END(e) if (HTML_dtd.tags[e].contents != SGML_EMPTY) \
                        (*target->isa->end_element)(target, e, 0)
#define FREE_TARGET (*target->isa->_free)(target)

struct _HTStructured {
    CONST HTStructuredClass *   isa;
    /* ... */
};

struct _HTStream {
    CONST HTStreamClass *       isa;
    /* ... */
};

/* ------------------------------------------------------------------------ */
/* ---------------- Local copy of connect_to_server calls ----------------- */
/* ------------------------------------------------------------------------ */

/*      Open a socket to a WAIS server          fd_mosaic_connect_to_server
**      ------------------------------
**
** On entry,
**      host_name       name of the server host
**      port            port number on that host
**      fd              where to store the connected socket descriptor
**
** On exit,
**      returns 1 on success, 0 on fail, -1 on interrupt.
**      *fd is written only on success.
*/
PRIVATE int fd_mosaic_connect_to_server ARGS3(
        char *,         host_name,
        long,           port,
        long *,         fd)
{
    char url[256];
    int sock = -1;
    int status;

    /*
    ** The host name is clipped to 200 characters so that the prefix (7),
    ** the colon, a long's worth of digits, the slash and the terminator
    ** always fit in url[].  port is a long, hence %ld.
    */
    sprintf(url, "wais://%.200s:%ld/", host_name, port);

    /*
    ** HTDoConnect fills in an int; hand it a real int rather than a cast
    ** long*, which would leave part of the long uninitialised where long
    ** is wider than int.
    */
    status = HTDoConnect(url, "WAIS", 210, &sock);
    if (status == HT_INTERRUPTED)
        return -1;
    if (status < 0)
        return 0;

    *fd = sock;
    return 1;
}

/*      Connect and wrap the socket             mosaic_connect_to_server
**      ---------------------------
**
** On exit,
**      returns 1 on success, 0 on fail, -1 on interrupt.
**      On VMS *fdp receives the socket; elsewhere *fp receives a stdio
**      stream opened "r+" on the socket.
*/
#ifdef VMS
PRIVATE int mosaic_connect_to_server ARGS3(
        char *,         host_name,
        long,           port,
        long *,         fdp)
#else
PRIVATE int mosaic_connect_to_server ARGS3(
        char *,         host_name,
        long,           port,
        FILE **,        fp)
#endif /* VMS */
{
#ifndef VMS
    FILE *file;
#endif /* VMS */
    long fd = -1;
    int rv;

    rv = fd_mosaic_connect_to_server(host_name, port, &fd);
    if (rv == 0) {
        HTAlert("Could not connect to WAIS server.");
        return 0;
    }
    if (rv == -1) {
        HTAlert("Connection interrupted.");
        return -1;
    }

#ifndef VMS
    file = fdopen((int)fd, "r+");
    if (file == NULL) {
        HTAlert("Could not open WAIS connection for reading.");
        NETCLOSE((int)fd);      /* Don't leak the connected socket */
        return 0;
    }
    *fp = file;
#else
    *fdp = fd;
#endif /* VMS */
    return 1;
}
/* ------------------------------------------------------------------------ */
/* ------------------------------------------------------------------------ */

/*      Write diagnostic records to the client          showDiags
**      --------------------------------------
**
**      modified from Jonny G's version in ui/question.c
**
**      d is a NULL-terminated array; only records that carry ADDINFO
**      are printed.
*/
PRIVATE void showDiags ARGS2(
        HTStream *,             target,
        diagnosticRecord **,    d)
{
    diagnosticRecord **rec;

    for (rec = d; *rec != NULL; rec++) {
        if ((*rec)->ADDINFO == NULL)
            continue;
        PUTS("Diagnostic code is ");
        PUTS((*rec)->DIAG);
        PUTC(' ');
        PUTS((*rec)->ADDINFO);
        PUTC('\n');
    }
}

/*      Matrix of allowed characters in filenames
**      -----------------------------------------
*/
PRIVATE BOOL acceptable[256];
PRIVATE BOOL acceptable_inited = NO;

/*      Fill in acceptable[]: YES for the characters that may appear
**      unescaped in a generated document name, NO for everything else.
*/
PRIVATE void init_acceptable NOARGS
{
    unsigned int i;
    CONST char * good =
      "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789./-_$";

    for (i = 0; i < 256; i++)
        acceptable[i] = NO;
    for (; *good; good++)
        acceptable[(unsigned char)*good] = YES;
    acceptable_inited = YES;
}

/*      Transform file identifier into WWW address
**      ------------------------------------------
**
** On entry,
**      file    text whose leading run of characters greater than space
**              is taken as "host:path"
**
** On exit,
**      returns         nil if error
**                      pointer to malloced string (must be freed) if ok
*/
PRIVATE char * WWW_from_archie ARGS1(
        char *,         file)
{
    char * end;
    char * result;
    char * colon;

    for (end = file; *end > ' '; end++)
        ;                                       /* assumes ASCII encoding */

    result = (char *)malloc(10 + (end - file));
    if (!result)
        return result;                          /* Malloc error */

    strcpy(result, "file://");
    strncat(result, file, end - file);

    colon = strchr(result + 7, ':');            /* Expect colon after host */
    if (colon) {
        for (; colon[0]; colon[0] = colon[1], colon++)
            ;                                   /* move down */
    }
    return result;
} /* WWW_from_archie */

/*      Transform document identifier into URL
**      --------------------------------------
**
**      The docid is read as a sequence of records, each being a type byte
**      (at most 10), a length byte, and that many data bytes.  Each record
**      is written as "<type>=<data>;" with bytes not listed in
**      acceptable[] replaced by %XX.
**
**      Bugs:   A static buffer of finite size is used!
**              (An id that does not fit is now rejected, not overrun.)
**
** On exit,
**      returns         nil if error (bad record type, truncated record,
**                      or result too long for the buffer)
**                      pointer to malloced string (must be freed) if ok
*/
PRIVATE char hex [17] = "0123456789ABCDEF";
extern char from_hex PARAMS((char a));          /* In HTWSRC @@ */

PRIVATE char * WWW_from_WAIS ARGS1(
        any *,          docid)
{
    static char buf[BIG];
    char * q = buf;
    char * q_limit = buf + BIG - 1;             /* Room for terminator */
    /* Bytes are handled unsigned so that values above 127 can neither
    ** turn into negative lengths nor negative table indices. */
    unsigned char * p = (unsigned char *)docid->bytes;
    unsigned char * p_end = p + docid->size;

    if (TRACE) {
        unsigned char * t;
        fprintf(stderr, "WAIS id (%d bytes) is ", (int)docid->size);
        for (t = p; t < p_end; t++) {
            if ((*t >= ' ') && (*t <= '~'))     /* Assume ASCII! */
                fprintf(stderr, "%c", *t);
            else
                fprintf(stderr, "<%x>", (unsigned)*t);
        }
        fprintf(stderr, "\n");
    }

    while (p < p_end) {
        unsigned int type;
        unsigned int len;
        unsigned int i;

        if (p_end - p < 2)                      /* No room for type+length */
            return 0;
        if (TRACE)
            fprintf(stderr, " Record type %d, length %d\n", p[0], p[1]);
        if (*p > 10) {
            if (TRACE)
                fprintf(stderr, "Eh? DOCID record type of %d!\n", *p);
            return 0;
        }
        type = *p++;
        len = *p++;

        if (len > (unsigned int)(p_end - p))    /* Record runs off the id */
            return 0;
        /* Worst case: two type digits, '=', every byte escaped, ';' */
        if ((unsigned long)(q_limit - q) < 2 + 1 + 3 * (unsigned long)len + 1)
            return 0;

        if (type > 9)
            *q++ = (char)(type / 10 + '0');
        *q++ = (char)(type % 10 + '0');         /* Record type */
        *q++ = '=';                             /* Separate */

        for (i = 0; i < len; i++, p++) {
            if (!acceptable[*p]) {
                *q++ = HEX_ESCAPE;              /* Means hex coming */
                *q++ = hex[(*p) >> 4];
                *q++ = hex[(*p) & 15];
            } else {
                *q++ = (char)*p;
            }
        }
        *q++ = ';';                             /* Terminate field */
    }
    *q = 0;                                     /* Terminate string */

    if (TRACE)
        fprintf(stderr, "WWW form of id: %s\n", buf);

    {
        char * result = (char *)malloc(strlen(buf) + 1);
        if (!result)
            outofmem(__FILE__, "WWW_from_WAIS");
        strcpy(result, buf);
        return result;
    }
} /* WWW_from_WAIS */

/*      Transform URL into WAIS document identifier
**      -------------------------------------------
**
** On entry,
**      docname         points to valid name produced originally by
**                      WWW_from_WAIS
** On exit,
**      returns docid if ok:
**              docid->size     is the number of bytes produced
**              docid->bytes    is malloced and must later be freed.
**      returns nil if docname is malformed:
**              docid->bytes    is nil and docid->size is 0.
*/
PRIVATE any * WAIS_from_WWW ARGS2(
        any *,          docid,
        char *,         docname)
{
    char *z;            /* Output pointer */
    char *sor;          /* Start of record - points to size field. */
    char *p;            /* Input pointer */
    char *s;            /* Position of semicolon */

    if (TRACE)
        fprintf(stderr, "WWW id (to become WAIS id): %s\n", docname);

    /*
    ** A record "digits=data;" produces one type byte, one size byte and at
    ** most one byte per data character, i.e. never more bytes than it has
    ** characters, so strlen(docname)+1 bounds the output (the +1 also keeps
    ** the request non-zero for an empty name).
    */
    docid->size = 0;
    docid->bytes = (char *)malloc(strlen(docname) + 1);  /* result record */
    if (!docid->bytes)
        outofmem(__FILE__, "WAIS_from_WWW");
    z = docid->bytes;

    for (p = docname; *p; ) {                   /* Convert of strings */
        *z = 0;                                 /* Initialize record type */
        while (*p >= '0' && *p <= '9') {
            *z = *z*10 + (*p++ - '0');          /* Decode decimal record type */
        }
        z++;
        if (*p != '=')
            goto bad;
        s = strchr(p, ';');
        if (!s)
            goto bad;                           /* Bad! No ';'; */
        sor = z;                /* Remember where the size field was */
        z++;                    /* Skip record size for now */

        for (p++; p < s; ) {
            if (*p == HEX_ESCAPE) {
                unsigned int b;
                if (s - p < 3)                  /* Escape cut short */
                    goto bad;
                b = from_hex(p[1]);
                *z++ = (char)((b << 4) + from_hex(p[2]));
                p += 3;
            } else {
                *z++ = *p++;                    /* Record */
            }
        }
        if (z - sor - 1 > 255)                  /* Won't fit the size byte */
            goto bad;
        *sor = (char)(z - sor - 1);  /* Fill in size -- not counting size itself */
        p = s + 1;              /* After semicolon: start of next record */
    }
    docid->size = z - docid->bytes;

    if (TRACE) {
        unsigned char *t = (unsigned char *)docid->bytes;
        unsigned char *t_end = t + docid->size;
        fprintf(stderr, "WAIS id (%d bytes) is ", (int)docid->size);
        for (; t < t_end; t++) {
            if ((*t >= ' ') && (*t <= '~'))     /* Assume ASCII! */
                fprintf(stderr, "%c", *t);
            else
                fprintf(stderr, "<%x>", (unsigned)*t);
        }
        fprintf(stderr, "\n");
    }
    return docid;                               /* Ok */

bad:
    FREE(docid->bytes);
    docid->size = 0;
    return 0;
} /* WAIS_from_WWW */

/*      Send a plain text record to the client          output_text_record()
**      --------------------------------------
**
**      A binary record is passed through as one block.  Otherwise the text
**      is filtered: ESC sequences are skipped, CR and LF both become '\n',
**      and other bytes are passed only if they are TAB, printable, or a
**      CJK mode is active.
*/
PRIVATE void output_text_record ARGS4(
        HTStream *,             target,
        WAISDocumentText *,     record,
        boolean,                quote_string_quotes,
        boolean,                binary)
{
    long count;

    if (binary) {
        (*target->isa->put_block)(target,
                                  record->DocumentText->bytes,
                                  record->DocumentText->size);
        return;
    }

    for (count = 0; count < record->DocumentText->size; count++) {
        long ch = (unsigned char)record->DocumentText->bytes[count];

        if (ch == 27) {         /* What is this in for? Tim */
            /* then we have an escape code */
            /* if the next letter is '(' or ')', then ignore two letters */
            /* (only look at the next byte if there is one) */
            if (count + 1 < record->DocumentText->size &&
                ('(' == record->DocumentText->bytes[count + 1] ||
                 ')' == record->DocumentText->bytes[count + 1]))
                count += 1;             /* it is a term marker */
            else
                count += 4;             /* it is a paragraph marker */
        } else if (ch == '\n' || ch == '\r') {
            PUTC('\n');
        } else if (HTCJK != NOCJK || ch == '\t' || isprint(ch)) {
            PUTC(ch);
        }
    }
} /* output text record */

/*      Format A Search response for the client         display_search_response
**      ---------------------------------------
*/
/* modified from tracy shen's version in wutil.c
 * displays either a text record or a set of headlines.
 *
 * Each document header becomes a list item whose anchor is, for "archie"
 * databases, a file: address made from the headline, and otherwise
 * /database/type/length/docid (or the headline itself for type "URL").
 * Record kinds that cannot be shown are reported once per record.
 */
PRIVATE void display_search_response ARGS4(
        HTStructured *,         target,
        SearchResponseAPDU *,   response,
        char *,                 database,
        char *,                 keywords)
{
    WAISSearchResponse *info;
    long i, k;

    BOOL archie = strstr(database, "archie") != 0;      /* Special handling */

    if (TRACE)
        fprintf(stderr, "HTWAIS: Displaying search response\n");
    PUTS("Index ");
    START(HTML_EM);
    PUTS(database);
    END(HTML_EM);
    sprintf(line, " contains the following %d item%s relevant to \"",
            (int)(response->NumberOfRecordsReturned),
            response->NumberOfRecordsReturned == 1 ? "" : "s");
    PUTS(line);
    START(HTML_EM);
    PUTS(keywords);
    END(HTML_EM);
    PUTS("\".\n");
    PUTS("The first figure after each entry is its relative score, ");
    PUTS("the second is the number of lines in the item.");
    START(HTML_BR);
    START(HTML_BR);
    PUTS("\n");
    START(HTML_OL);

    if (response->DatabaseDiagnosticRecords != 0) {
        info = (WAISSearchResponse *)response->DatabaseDiagnosticRecords;
        i = 0;

        if (info->Diagnostics != NULL)
            showDiags((HTStream*)target, info->Diagnostics);

        if (info->DocHeaders != 0) {
            for (k = 0; info->DocHeaders[k] != 0; k++) {
                WAISDocumentHeader* head = info->DocHeaders[k];
                char * headline = trim_junk(head->Headline);
                any * docid = head->DocumentID;
                char * docname;         /* printable version of docid */

                i++;
                /*
                **  Make a printable string out of the document id.
                */
                if (TRACE)
                    fprintf(stderr,
                            "HTWAIS: %2ld: Score: %4ld, lines:%4ld '%s'\n",
                            i,
                            (long int)(info->DocHeaders[k]->Score),
                            (long int)(info->DocHeaders[k]->Lines),
                            headline);

                START(HTML_LI);

                if (archie) {
                    char * www_name = WWW_from_archie(headline);
                    if (www_name) {
                        HTStartAnchor(target, NULL, www_name);
                        PUTS(headline);
                        END(HTML_A);
                        FREE(www_name);
                    } else {
                        PUTS(headline);
                        PUTS(" (bad file name)");
                    }
                } else {                /* Not archie */
                    docname = WWW_from_WAIS(docid);
                    if (docname) {
                        char * dbname = HTEscape(database, URL_XPALPHAS);
                        char * type = (head->Types && head->Types[0])
                                        ? head->Types[0] : "TEXT";

                        /*
                        ** line[] is a fixed buffer: four slashes, up to
                        ** 20 characters of length and the terminator are
                        ** allowed for besides the three strings.
                        */
                        if (strlen(dbname) + strlen(type) + strlen(docname)
                                + 4 + 20 + 1 <= sizeof(line)) {
                            sprintf(line, "/%s/%s/%d/%s",       /* W3 address */
                                    dbname,
                                    type,
                                    (int)(head->DocumentLength),
                                    docname);
                            HTStartAnchor(target, NULL,
                                          !strcmp(type, "URL")
                                                ? headline : line); /* NT, Sep 93 */
                            PUTS(headline);
                            END(HTML_A);
                        } else {
                            PUTS("(bad doc id)");
                        }
                        FREE(dbname);
                        FREE(docname);
                    } else {
                        PUTS("(bad doc id)");
                    }
                }

                sprintf(line, "%5ld %5ld ",
                        (long)head->Score, (long)head->Lines);
                PUTS(line);
                MAYBE_END(HTML_LI);
            } /* next document header */
        } /* if there were any document headers */

        /*
        ** The loops below report one line per record.  The index must be
        ** advanced in each of them or they never terminate.
        */
        if (info->ShortHeaders != 0) {
            for (k = 0; info->ShortHeaders[k] != 0; k++) {
                i++;
                PUTS("(Short Header record, can't display)");
            }
        }
        if (info->LongHeaders != 0) {
            for (k = 0; info->LongHeaders[k] != 0; k++) {
                i++;
                PUTS("\nLong Header record, can't display\n");
            }
        }
        if (info->Text != 0) {
            for (k = 0; info->Text[k] != 0; k++) {
                i++;
                PUTS("\nText record\n");
                output_text_record((HTStream*)target,
                                   info->Text[k], false, false);
            }
        }
        if (info->Headlines != 0) {
            for (k = 0; info->Headlines[k] != 0; k++) {
                i++;
                PUTS("\nHeadline record, can't display\n");
            }
        }
        if (info->Codes != 0) {
            for (k = 0; info->Codes[k] != 0; k++) {
                i++;
                PUTS("\nCode record, can't display\n");
            }
        }
    } /* Loop: display user info */
    END(HTML_OL);
    PUTC('\n');
}

#define MAX_KEYWORDS_LENGTH 1000
#define MAX_SERVER_LENGTH 1000
#define MAX_DATABASE_LENGTH 1000
#define MAX_SERVICE_LENGTH 1000
#define MAXDOCS 200

/*              Load by name                                    HTLoadWAIS
**              ============
**
**      This renders any object or search as required.
**
**      The address is one of
**              /servername/database                    (index cover page)
**              /servername/database?word+word+word     (search)
**              /servername/database/type/length/id     (document fetch)
**      with an optional second leading slash.
**
** On exit,
**      returns HT_LOADED on success, HT_NOT_LOADED or HT_INTERRUPTED on
**      failure, or whatever HTLoadError returns for a bad address or an
**      unconvertible document format.
*/
PUBLIC int HTLoadWAIS ARGS4(
        CONST char *,           arg,
        HTParentAnchor *,       anAnchor,
        HTFormat,               format_out,
        HTStream*,              sink)
{
    /* NOTE(review): the markup inside this literal was missing from the
    ** copy under review; the tags below are a reconstruction -- confirm.
    ** The string is not referenced in this function. */
    static CONST char * error_header =
"<h1>Access error</h1>\nThe following error occured in accesing a WAIS server:<P>\n";
    char * key;                   /* pointer to keywords in URL */
    char* request_message = NULL; /* arbitrary message limit */
    char* response_message = NULL; /* arbitrary message limit */
    long request_buffer_length;   /* how of the request is left */
    SearchResponseAPDU *retrieval_response = 0;
    char keywords[MAX_KEYWORDS_LENGTH + 1];
    char *server_name = NULL;
    char *wais_database = NULL;   /* name of current database */
    char *www_database = NULL;    /* Same name escaped */
    char *service;
    char *doctype = NULL;
    char *doclength = NULL;
    long document_length = 0;
    char *docname = NULL;
#ifdef VMS
    long connection = 0;
#else
    FILE *connection = NULL;
#endif /* VMS */
    char * names;               /* Copy of arg to be hacked up */
    BOOL ok = NO;
    int return_status = HT_LOADED;
    int rv;

    if (!acceptable_inited)
        init_acceptable();

    /*  Decipher and check syntax of WWW address:
    **  ----------------------------------------
    **
    **  First we remove the "wais:" if it was specified.  920110
    */
    names = HTParse(arg, "", PARSE_HOST | PARSE_PATH | PARSE_PUNCTUATION);
    key = strchr(names, '?');

    if (key) {
        char * p;
        *key++ = 0;                     /* Split off keywords */
        for (p = key; *p; p++)
            if (*p == '+') *p = ' ';
        HTUnEscape(key);
    }
    if (names[0] == '/') {
        server_name = names + 1;
        as_gate = (BOOL)(*server_name == '/');
        if (as_gate)
            server_name++;              /* Accept one or two */
        www_database = strchr(server_name, '/');
        if (www_database) {
            *www_database++ = 0;        /* Separate database name */
            doctype = strchr(www_database, '/');
            if (key) {
                ok = YES;               /* Don't need doc details */
            } else if (doctype) {       /* If not search parse doc details */
                *doctype++ = 0;         /* Separate rest of doc address */
                doclength = strchr(doctype, '/');
                if (doclength) {
                    *doclength++ = 0;
                    document_length = atol(doclength);
                    /* A negative length would skip every slice below */
                    if (document_length > 0) {
                        docname = strchr(doclength, '/');
                        if (docname) {
                            *docname++ = 0;
                            ok = YES;   /* To avoid a goto! */
                        } /* if docname */
                    } /* if document_length valid */
                } /* if doclength */
            } else {                    /* no doctype?  Assume index required */
                if (!key)
                    key = "";
                ok = YES;
            } /* if doctype */
        } /* if database */
    }

    if (!ok) {
        FREE(names);
        return HTLoadError(sink, 500, "Syntax error in WAIS URL");
    }

    if (TRACE)
        fprintf(stderr, "HTWAIS: Parsed OK\n");

    service = strchr(names, ':');
    if (service)
        *service++ = 0;
    else
        service = "210";

    if (server_name[0] == 0) {
#ifdef VMS
        connection = 0;
#else
        connection = NULL;
#endif /* VMS */
    } else if (!(key && !*key)) {       /* No connection for the cover page */
        int status;
        if (TRACE)
            fprintf(stderr, "===WAIS=== calling mosaic_connect_to_server\n");
        status = mosaic_connect_to_server(server_name,
                                          atoi(service),
                                          &connection);
        if (status == 0) {
            if (TRACE)
                fprintf(stderr, "===WAIS=== connection failed\n");
            FREE(names);
            return HT_NOT_LOADED;
        } else if (status == -1) {
            if (TRACE)
                fprintf(stderr, "===WAIS=== connection interrupted\n");
            FREE(names);
            return HT_NOT_LOADED;
        }
    }

    StrAllocCopy(wais_database, www_database);
    HTUnEscape(wais_database);

    /*
    **  This below fixed size stuff is terrible.
    */
#ifdef VMS
    if (!(request_message =
          (char*)calloc((size_t)MAX_MESSAGE_LEN*sizeof(char),1)))
        outofmem(__FILE__, "HTLoadWAIS");
    if (!(response_message =
          (char*)calloc((size_t)MAX_MESSAGE_LEN*sizeof(char),1)))
        outofmem(__FILE__, "HTLoadWAIS");
#else
    request_message = (char*)s_malloc((size_t)MAX_MESSAGE_LEN * sizeof(char));
    response_message = (char*)s_malloc((size_t)MAX_MESSAGE_LEN * sizeof(char));
#endif /* VMS */

    /*
    **  If keyword search is performed but there are no keywords,
    **  the user has followed a link to the index itself.  It would be
    **  appropriate at this point to send him the .SRC file - how?
    */
    if (key && !*key) {                         /* I N D E X */
#ifdef CACHE_FILE_PREFIX
        char filename[256];
        FILE * fp;
#endif
        HTStructured * target = HTML_new(anAnchor, format_out, sink);

        START(HTML_HEAD);
        PUTS("\n");
        HTStartIsIndex(target, "Enter WAIS query: ", NULL);
        PUTS("\n");

        {
            START(HTML_TITLE);
            PUTS(wais_database);
            PUTS(" (WAIS Index)");
            END(HTML_TITLE);
            PUTS("\n");
            END(HTML_HEAD);
            PUTS("\n");

            START(HTML_H1);
            PUTS("WAIS Index: ");
            START(HTML_EM);
            PUTS(wais_database);
            END(HTML_EM);
            END(HTML_H1);
            PUTS("\n");
            PUTS("This is a link for searching the ");
            START(HTML_EM);
            PUTS(wais_database);
            END(HTML_EM);
            PUTS(" WAIS Index.\n");
        }
        /*
        **  If we have seen a source file for this database, use that.
        */
#ifdef CACHE_FILE_PREFIX
        filename[0] = '\0';
        fp = NULL;
        /* Only build the name when it is certain to fit in filename[];
        ** the database part is already limited to 100 by the format. */
        if (strlen(CACHE_FILE_PREFIX) + strlen(server_name) + strlen(service)
                + 100 + sizeof("WSRC-::.txt") <= sizeof(filename)) {
            sprintf(filename, "%sWSRC-%s:%s:%.100s.txt",
                    CACHE_FILE_PREFIX,
                    server_name, service, www_database);
            fp = fopen(filename, "r");  /* Have we found this already? */
        }
        if (TRACE)
            fprintf(stderr, "HTWAIS: Description of server %s %s.\n",
                    filename,
                    fp ? "exists already" : "does NOT exist!");

        if (fp) {
            int c;                      /* int, so EOF is distinguishable */
            START(HTML_PRE);            /* Preformatted description */
            PUTS("\n");
            while ((c = getc(fp)) != EOF)
                PUTC((char)c);          /* Transfer file */
            END(HTML_PRE);
            fclose(fp);
        }
#endif
        START(HTML_P);
        PUTS("\nEnter the 's'earch command and then specify search words.\n");

        FREE_TARGET;
    } else if (key) {                                   /* S E A R C H */
        char *p;
        HTStructured * target;

        /* strncpy does not terminate when key is too long */
        strncpy(keywords, key, MAX_KEYWORDS_LENGTH);
        keywords[MAX_KEYWORDS_LENGTH] = '\0';
        while ((p = strchr(keywords, '+')) != NULL)
            *p = ' ';

        /*
        **  Send advance title to get something fast to the other end.
        */
        target = HTML_new(anAnchor, format_out, sink);

        START(HTML_HEAD);
        PUTS("\n");
        HTStartIsIndex(target, "Enter WAIS query: ", NULL);
        PUTS("\n");
        START(HTML_TITLE);
        PUTS(keywords);
        PUTS(" (in ");
        PUTS(wais_database);
        PUTS(")");
        END(HTML_TITLE);
        PUTS("\n");
        END(HTML_HEAD);
        PUTS("\n");

        START(HTML_H1);
        PUTS("WAIS Search of \"");
        START(HTML_EM);
        PUTS(keywords);
        END(HTML_EM);
        PUTS("\" in: ");
        START(HTML_EM);
        PUTS(wais_database);
        END(HTML_EM);
        END(HTML_H1);
        PUTS("\n");

        request_buffer_length = MAX_MESSAGE_LEN;        /* Amount left */
        if (TRACE)
            fprintf(stderr, "HTWAIS: Search for `%s' in `%s'\n",
                    keywords, wais_database);
        if (NULL ==
            generate_search_apdu(request_message + HEADER_LENGTH,
                                 &request_buffer_length,
                                 keywords, wais_database, NULL, MAXDOCS)) {
#ifdef VMS
            HTAlert("HTWAIS: Request too large.");
            return_status = HT_NOT_LOADED;
            FREE_TARGET;
            goto CleanUp;
#else
            panic("request too large");
#endif /* VMS */
        }

        HTProgress("Searching WAIS database...");
        rv = interpret_message(request_message,
                               MAX_MESSAGE_LEN - request_buffer_length,
                               response_message,
                               MAX_MESSAGE_LEN,
                               connection,
                               false    /* true verbose */
                              );

        if (rv == HT_INTERRUPTED) {
            HTAlert("Search interrupted.");
            return_status = HT_INTERRUPTED;
            FREE_TARGET;
            goto CleanUp;
        } else if (!rv) {
#ifdef VMS
            HTAlert("HTWAIS: Return message too large.");
            return_status = HT_NOT_LOADED;
            FREE_TARGET;
            goto CleanUp;
#else
            panic("returned message too large");
#endif /* VMS */
        } else {        /* returned message ok */
            SearchResponseAPDU *query_response = 0;
            readSearchResponseAPDU(&query_response,
                                   response_message + HEADER_LENGTH);
            if (query_response) {
                display_search_response(target,
                                        query_response, wais_database,
                                        keywords);
                if (query_response->DatabaseDiagnosticRecords)
                    freeWAISSearchResponse(
                        query_response->DatabaseDiagnosticRecords);
                freeSearchResponseAPDU(query_response);
            }
        }       /* returned message not too large */

        FREE_TARGET;
    } else {                    /* D O C U M E N T    F E T C H */
        HTFormat format_in;
        boolean binary;         /* how to transfer stuff coming over */
        HTStream * target;
        long count;
        any doc_chunk;
        any * docid = &doc_chunk;

        if (TRACE)
            fprintf(stderr,
                    "HTWAIS: Retrieve document id `%s' type `%s' length %ld\n",
                    docname, doctype, document_length);

        format_in =
          !strcmp(doctype, "WSRC") ? HTAtom_for("application/x-wais-source") :
          !strcmp(doctype, "TEXT") ? HTAtom_for("text/plain") :
          !strcmp(doctype, "HTML") ? HTAtom_for("text/html") :
          !strcmp(doctype, "GIF")  ? HTAtom_for("image/gif") :
                                     HTAtom_for("application/octet-stream");
        binary =
          0 != strcmp(doctype, "WSRC") &&
          0 != strcmp(doctype, "TEXT") &&
          0 != strcmp(doctype, "HTML");

        target = HTStreamStack(format_in, format_out, sink, anAnchor);
        if (!target) {
            /* Leave through CleanUp so the connection and the message
            ** buffers are released. */
            return_status = HTLoadError(sink, 500,
                                "Can't convert format of WAIS document");
            goto CleanUp;
        }

        /*
        **  Decode hex or literal format for document ID.
        */
        if (!WAIS_from_WWW(docid, docname)) {
            HTAlert("HTWAIS: Bad document id in URL.");
            (*target->isa->_abort)(target, NULL);
            return_status = HT_NOT_LOADED;
            goto CleanUp;
        }

        /*
        **  Loop over slices of the document.
        */
        for (count = 0;
             count * CHARS_PER_PAGE < document_length;
             count++) {
            char *type = NULL;

            request_buffer_length = MAX_MESSAGE_LEN;    /* Amount left */
            if (TRACE)
                fprintf(stderr, "HTWAIS: Slice number %ld\n", count);

            /* Checked before the type copy is made, so that there is
            ** nothing extra to release on this path. */
            if (HTCheckForInterrupt()) {
                HTAlert("Data transfer interrupted.");
                (*target->isa->_abort)(target, NULL);
                FREE(docid->bytes);
                return_status = HT_NOT_LOADED;
                goto CleanUp;
            }

#ifdef VMS
            StrAllocCopy(type, doctype);
#else
            type = s_strdup(doctype);   /* Gets freed I guess */
#endif /* VMS */

            if (0 ==
                generate_retrieval_apdu(request_message + HEADER_LENGTH,
                    &request_buffer_length,
                    docid,
                    CT_byte,
                    count * CHARS_PER_PAGE,
                    ((count + 1) * CHARS_PER_PAGE <= document_length ?
                        (count + 1) * CHARS_PER_PAGE : document_length),
                    type,
                    wais_database)) {
#ifdef VMS
                HTAlert("HTWAIS: Request too long.");
                return_status = HT_NOT_LOADED;
                FREE_TARGET;
                FREE(type);
                FREE(docid->bytes);
                goto CleanUp;
#else
                panic("request too long");
#endif /* VMS */
            }

            /*
            **  Actually do the transaction given by request_message.
            */
            HTProgress("Fetching WAIS document...");
            rv = interpret_message(request_message,
                                   MAX_MESSAGE_LEN - request_buffer_length,
                                   response_message,
                                   MAX_MESSAGE_LEN,
                                   connection,
                                   false /* true verbose */
                                  );
            /* NOTE(review): as in the original, type is released on the
            ** failure paths below for all platforms but after a good slice
            ** only on VMS; whether the non-VMS WAIS library takes
            ** ownership of it is not visible here -- confirm. */
            if (rv == HT_INTERRUPTED) {
                HTAlert("Data transfer interrupted.");
                return_status = HT_INTERRUPTED;
                FREE_TARGET;
                FREE(type);
                FREE(docid->bytes);
                goto CleanUp;
            } else if (!rv) {
#ifdef VMS
                HTAlert("HTWAIS: Return message too large.");
                return_status = HT_NOT_LOADED;
                FREE_TARGET;
                FREE(type);
                FREE(docid->bytes);
                goto CleanUp;
#else
                panic("Returned message too large");
#endif /* VMS */
            }

            /*
            **  Parse the result which came back into memory.
            */
            readSearchResponseAPDU(&retrieval_response,
                                   response_message + HEADER_LENGTH);

            if (retrieval_response == NULL ||
                retrieval_response->DatabaseDiagnosticRecords == NULL ||
                NULL == ((WAISSearchResponse *)
                    retrieval_response->DatabaseDiagnosticRecords)->Text ||
                NULL == ((WAISSearchResponse *)
                    retrieval_response->DatabaseDiagnosticRecords)->Text[0]) {
                PUTS("No text was returned!\n");
            } else {
                output_text_record(target,
                    ((WAISSearchResponse *)
                        retrieval_response->DatabaseDiagnosticRecords)->Text[0],
                    false, binary);
            } /* If text existed */

            /* Release this slice's response before reading the next */
            if (retrieval_response) {
                if (retrieval_response->DatabaseDiagnosticRecords)
                    freeWAISSearchResponse(
                        retrieval_response->DatabaseDiagnosticRecords);
                freeSearchResponseAPDU(retrieval_response);
                retrieval_response = 0;
            }

#ifdef VMS
            FREE(type);
#endif /* VMS */
        }       /* Loop over slices */

        FREE_TARGET;
        FREE(docid->bytes);
    } /* If document rather than search */

CleanUp:
    /*
    **  (This postponed until later,  after a timeout:)
    */
#ifdef VMS
    if (connection)
        NETCLOSE((int)connection);
#else
    if (connection)
        fclose(connection);
#endif /* VMS */
    FREE(wais_database);
#ifdef VMS
    FREE(request_message);
    FREE(response_message);
#else
    s_free(request_message);
    s_free(response_message);
#endif /* VMS */
    FREE(names);
    return (return_status);
}

#ifdef GLOBALDEF_IS_MACRO
#define _HTWAIS_C_1_INIT { "wais", HTLoadWAIS, NULL }
GLOBALDEF(HTProtocol, HTWAIS, _HTWAIS_C_1_INIT);
#else
GLOBALDEF PUBLIC HTProtocol HTWAIS = { "wais", HTLoadWAIS, NULL };
#endif /* GLOBALDEF_IS_MACRO */