/** Routines that are shared across the two XML parsers and their callbacks to R. isBlank - determines if a string consists entirely of whitespace RS_XML(invokeFunction) - call a user-level function, previously located by RS_XML(findFunction). RS_XML(findFunction) - search a list or closure for a function object with a given name in that list. * See Copyright for the license status of this software. */ #include "Utils.h" #include /* For isspace() */ #ifdef LIBXML #ifdef FROM_GNOME_XML_DIR #include #else #include #endif #endif #include "RSCommon.h" /* for SET_NAMES */ /** Tests whether the string contains only white space or not. Returns 1 if is only white space. 0 otherwise. */ int isBlank(const char *str) { int blank=0; const char *ptr = str; while(ptr && (blank = isspace(ptr[0]))) { ptr++; } return(blank); } /** Does an in place trimming of a string by returning a pointer to the first non-white space character and also inserting a string terminator after the last non-whitespace character. */ char * trim(char *str) { char *tmp; /* If a degenerate string, just return. */ if(str == (char*)NULL || str[0] == '\0') return(str); /* Jumpt to the end */ tmp = str + strlen(str) - 1; while(tmp >= str && isspace(*tmp)) { tmp[0] = '\0'; tmp--; } if(tmp == str) { #if 0 if(strlen(tmp) > 1) tmp[0] = '\0'; #endif return(str); } #if 0 else tmp[1] = '\0'; #endif tmp = str; while(*tmp && isspace(*tmp)) { tmp++; } return(tmp); } USER_OBJECT_ RS_XML(treeApply)(USER_OBJECT_ rtree, USER_OBJECT_ function, USER_OBJECT_ args) { return(rtree); } /** Error handling utilities for use with the libxml document parsing mechanism. Intercept the error handling by replacing it with a routine of the same name and have it print to a buffer. Then call the Warning handler. Then the warnings will end up in the local system, accessible via the warnings() function. This allows them to be programmatically processed rather than having to process the output to the terminal (via catching it in a call sink()). */ #ifdef LIBXML #include void localXmlParserPrintFileInfo(xmlParserInputPtr input, char *buf, int nbuf); #ifndef USE_LINKED_ERROR_HANDLER void S_xmlParserError(void *ctx, const char *msg, ...) #else void xmlParserError(void *ctx, const char *msg, ...) #endif { va_list args; #if 1 va_start(args, msg); stop("XMLParserError", msg, args); #else xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; char buf[3000], *tmp; /* Empty the string buffer. */ memset(buf , '\0', sizeof(buf)/sizeof(buf[0])); /* Insert the file and line number. */ localXmlParserPrintFileInfo(ctxt->input, buf, 3000); /* Move to the end of the buffer's contents. */ tmp = buf + strlen(buf); va_start(args, msg); /* Write in the actual message. */ vsprintf(tmp, msg, args); va_end(args); Rf_warning("XML Parsing Error: %s", buf); #endif } #ifndef USE_LINKED_ERROR_HANDLER /* Set the default error handlers in the libxml library */ void RSXML_setErrorHandlers(void) { // Next 2 are deprecated in 2.10.x and will be made private #if LIBXML_VERSION < 21000 xmlDefaultSAXHandlerInit(); htmlDefaultSAXHandlerInit(); xmlDefaultSAXHandler.error = S_xmlParserError; htmlDefaultSAXHandler.error = S_xmlParserError; #endif #if 0 docbDefaultSAXHandlerInit(); docbDefaultSAXHandler.error = S_xmlParserError; #endif } #endif /** Write the file name and the current line number into the specified string. */ void localXmlParserPrintFileInfo(xmlParserInputPtr input, char *buf, int nbuf) { if (input != NULL) { if (input->filename) snprintf(buf, nbuf, "%s:%d: ", input->filename, input->line); else snprintf(buf, nbuf, "Entity: line %d: ", input->line); } } #endif /** Utility method for setting the names of a list/vector from an array of native strings rather than an R/S character vector structure. */ void RS_XML(SetNames)(int n, const char *cnames[], USER_OBJECT_ ans) { int i; USER_OBJECT_ names; PROTECT(names = NEW_CHARACTER(n)); for(i = 0; i < n ; i++) { /* could install as a pre-defined string. */ SET_STRING_ELT(names, i, mkChar(cnames[i])); } SET_NAMES(ans, names); UNPROTECT(1); } /* Set the class of the target object to be the character vector containing just the specified name. */ int RS_XML(SetClassName)(const char *localClassName, USER_OBJECT_ target) { USER_OBJECT_ className; PROTECT(className = NEW_CHARACTER(1)); SET_STRING_ELT(className, 0, mkChar(localClassName)); SET_CLASS(target, className); UNPROTECT(1); return(1); } #if LIBXML2 struct _xmlHashTable { struct _xmlHashEntry **table; int size; }; #endif #if OWN_XML_HASH_SIZE int xmlHashSize(xmlHashTablePtr table) { /* For version 2.2.* */ return(table->size); /* return(table->nb_entities); */ } #endif USER_OBJECT_ RS_XML(findFunction)(const char *opName, USER_OBJECT_ _userObject) { int i; USER_OBJECT_ fun = NULL; /* Get the names of the list. */ USER_OBJECT_ names = GET_NAMES(_userObject); /* lookup function in the names of the list */ for (i = 0; i < GET_LENGTH(names); i++) { if(!strcmp(opName, CHAR_DEREF(STRING_ELT(names, i)))) { fun = VECTOR_ELT(_userObject, i); break; } } return(fun); } SEXP R_makeRefObject(void *ref, const char *className) { SEXP klass, obj, sref; if(!ref) { Rf_warning("NULL value for external reference"); return(R_NilValue); } PROTECT(klass = MAKE_CLASS((char *) className)); /* XXX define MAKE_CLASS with const */ if(klass == R_NilValue) { /* Is this the right test? */ Rf_error("Cannot find class %s for external reference", className); } PROTECT(obj = NEW_OBJECT(klass)); PROTECT(sref = R_MakeExternalPtr(ref, Rf_install(className), R_NilValue)); obj = SET_SLOT(obj, Rf_install("ref"), sref); UNPROTECT(3); return(obj); } #include #define copyStrField(x) SET_VECTOR_ELT(ans, i, mkString(uri->x ? uri->x : "")); \ SET_STRING_ELT(names, i, mkChar(#x)); i++; SEXP R_parseURI(SEXP r_uri) { xmlURIPtr uri; SEXP ans, names; int i= 0; uri = xmlParseURI( CHAR( STRING_ELT( r_uri, 0 ))); if(!uri) { Rf_error("cannot parse URI %s", CHAR( STRING_ELT( r_uri, 0) ) ); } PROTECT(ans = NEW_LIST(8)); PROTECT(names = NEW_CHARACTER(8)); copyStrField(scheme); copyStrField(authority); copyStrField(server); copyStrField(user); copyStrField(path); copyStrField(query); copyStrField(fragment); SET_VECTOR_ELT(ans, i, ScalarInteger(uri->port)); SET_STRING_ELT(names, i, mkChar("port")); SET_NAMES(ans, names); UNPROTECT(2); return(ans); } #define min(x, y) ((x) < (y) ? (x) : (y)) SEXP RSXML_structuredStop(SEXP errorFun, xmlErrorPtr err) { SEXP e, ptr; int n = 8; if(!err) n = 2; PROTECT(e = allocVector(LANGSXP, n)); SETCAR(e, errorFun != NULL && errorFun != R_NilValue ? errorFun : Rf_install("xmlStructuredStop")); ptr = CDR(e); if(err) { SETCAR(ptr, mkString(err->message)); ptr= CDR(ptr); SETCAR(ptr, ScalarInteger(err->code)); ptr= CDR(ptr); SETCAR(ptr, ScalarInteger(err->domain)); ptr= CDR(ptr); SETCAR(ptr, ScalarInteger(err->line)); ptr= CDR(ptr); SETCAR(ptr, ScalarInteger(err->int2)); ptr= CDR(ptr); SETCAR(ptr, ScalarInteger(err->level)); ptr= CDR(ptr); SETCAR(ptr, err->file ? mkString(err->file) : NEW_CHARACTER(0)); } else { SETCAR(ptr, NEW_CHARACTER(0)); } Rf_eval(e, R_GlobalEnv); UNPROTECT(1); /* Shouldn't get back to here! Rf_eval() should raise an error.*/ return(R_NilValue); } /* Because we call this function via Rf_eval(), we end up with an extra call on the stack when we enter recover. */ SEXP stop(const char *className, const char *msg, ...) { char buf[10000]; SEXP error, e, ns_env, ns_name; va_list ap; va_start(ap, msg); /* Rvsnprintf(buf, sizeof(buf)/sizeof(buf[0]), msg, ap); */ vsnprintf(buf, sizeof(buf)/sizeof(buf[0]), msg, ap); va_end(ap); PROTECT(error = mkString(buf)); /* const char * classNames[] = {"simpleError", "error", "condition"}; PROTECT(tmp = allocVector(STRSXP, sizeof(classNames)/sizeof(classNames[0]))); for(i = 0; i < sizeof(classNames)/sizeof(classNames[0]); i++) SET_STRING_ELT(tmp, i+1, mkChar(classNames[i])); SET_STRING_ELT(tmp, 0, mkChar(className)); SET_CLASS(error, tmp); */ PROTECT(e = allocVector(LANGSXP, 2)); PROTECT(ns_name = mkString("XML")); PROTECT(ns_env = R_FindNamespace(ns_name)); SETCAR(e, findVarInFrame(ns_env, Rf_install("xmlStop"))); SETCAR(CDR(e), error); Rf_eval(e, R_GlobalEnv); UNPROTECT(4); /* errorcall(error, "%s", msg); UNPROTECT(1); */ return(error); }