/* -*- Mode: C; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ /* ***** BEGIN LICENSE BLOCK ***** * Version: MPL 1.1/GPL 2.0/LGPL 2.1 * * The contents of this file are subject to the Mozilla Public License Version * 1.1 (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the * License. * * The Original Code is mozilla.org code. * * The Initial Developer of the Original Code is * Netscape Communications Corporation. * Portions created by the Initial Developer are Copyright (C) 1998 * the Initial Developer. All Rights Reserved. * * Contributor(s): * * Alternatively, the contents of this file may be used under the terms of * either of the GNU General Public License Version 2 or later (the "GPL"), * or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"), * in which case the provisions of the GPL or the LGPL are applicable instead * of those above. If you wish to allow use of your version of this file only * under the terms of either the GPL or the LGPL, and not to allow others to * use your version of this file under the terms of the MPL, indicate your * decision by deleting the provisions above and replace them with the notice * and other provisions required by the GPL or the LGPL. If you do not delete * the provisions above, a recipient may use your version of this file under * the terms of any one of the MPL, the GPL or the LGPL. * * ***** END LICENSE BLOCK ***** */ #include "rdf-int.h" #include char* error_string = NULL; int lineNumber = 0; static HashTable resourceHash = NULL; static RDF_Resource gURL = NULL; RDF_Resource getResource (char* key, int createp) { RDF_Resource existing = (RDF_Resource) HashLookup(resourceHash, key); if (existing) { return existing; } else if (createp){ existing = (RDF_Resource)fgetMem(sizeof(RDF_ResourceStruct)); existing->url = fcopyString(key); HashAdd(resourceHash, existing->url, existing); if (!gURL) { gURL = (RDF_Resource)fgetMem(sizeof(RDF_ResourceStruct)); gURL->url = fcopyString("URL"); HashAdd(resourceHash, gURL->url, gURL); } remoteStoreAdd(NULL, existing, gURL, existing->url, RDF_STRING_TYPE,1); return existing; } else return NULL; } char* RDF_ResourceID (RDF_Resource u) { return u->url; } static char* MemBlock = 0; size_t allocated = 0; #define MEM_BLOCK_SIZE 10000 char* fgetMem (size_t rsize) { char* ans = 0; size_t size = rsize + (4 - ldiv(rsize, 4).rem); if (!MemBlock || (size >= (MEM_BLOCK_SIZE - allocated))) { MemBlock = getMem(MEM_BLOCK_SIZE); allocated = 0; } ans = MemBlock; MemBlock = MemBlock + size; allocated = allocated + size; return ans; } void readRDFFile (char* file) { FILE* f = fopen(file, "r"); if (f) { RDFT rf = (RDFT)getRDFT(file, 1) ; int ok = 1; char* buff = (char*) malloc(100 * 1024); int len ; int i = 0; memset(buff, '\0', (100 * 1024)); memset(rf, '\0', sizeof(RDF_FileStruct)); rf->line = (char*)getMem(RDF_BUF_SIZE); rf->holdOver = (char*)getMem(RDF_BUF_SIZE); rf->depth = 1; rf->lastItem = rf->stack[0] ; while ((len = fread(buff, 1, (100 * 1024) -1, f)) > 0) { buff[len] = '\0'; printf("[%i] ", i++); fflush(0); if (!(ok = parseNextRDFXMLBlobInt(rf, buff, len))) { printf("Error in RDF File\n"); } } freeMem(rf->line); rf->line = NULL; freeMem(rf->holdOver); rf->holdOver = NULL; free(buff); printf("Finished reading %s\n", file); } else printf("Could not find %s\n", file); } static HashTable rdftHash = NULL; RDFT getRDFT (char* key, int createp) { RDFT existing = (RDFT) HashLookup(rdftHash, key); if (existing) { return existing; } else if (createp){ existing = (RDFT)getMem(sizeof(RDF_FileStruct)); existing->url = fcopyString(key); HashAdd(rdftHash, existing->url, existing); return existing; } else return NULL; } void rdf_init () { error_string = getMem(1000); resourceHash = NewHashTable((int)0x00000FFF); rdftHash = NewHashTable((int)0x00000FFF); } int rdf_DigestNewStuff (char* url, char* data, int len) { RDFT rf = (RDFT)getRDFT(url, 1) ; int ok = 1; RDF_Resource u; unloadRDFT(rf); memset(rf, '\0', sizeof(RDF_FileStruct)); rf->line = (char*)getMem(RDF_BUF_SIZE); rf->holdOver = (char*)getMem(RDF_BUF_SIZE); rf->depth = 1; rf->lastItem = rf->stack[0] ; ok = parseNextRDFXMLBlobInt(rf, data, len); /* if (!ok) unloadRDFT(rf); */ freeMem(rf->line); rf->line = NULL; freeMem(rf->holdOver); rf->holdOver = NULL; return ok; } int startsWith (const char* pattern, const char* uuid) { int l1 = strlen(pattern); int l2 = strlen(uuid); int n; if (l2 < l1) return 0; for (n = 0; n < l1; n++) { if (pattern[n] != uuid[n]) return 0; } return 1; } char* getMem (size_t n) { return (char*) calloc(1, n); } void freeMem(void* item) { free(item); } char decodeEntityRef (char* string, int* stringIndexPtr, int len) { if (startsWith("lt;", string)) { *stringIndexPtr = *stringIndexPtr + 3; return '<'; } else if (startsWith("gt;", string)) { *stringIndexPtr = *stringIndexPtr + 3; return '>'; } else if (startsWith("amp;", string)) { *stringIndexPtr = *stringIndexPtr + 4; return '&'; } else return '&'; } char * copyStringIgnoreWhiteSpace(char* string) { int len = strlen(string); char* buf = (char*)fgetMem(len + 1); int inWhiteSpace = 1; int buffIndex = 0; int stringIndex = 0; while (stringIndex < len) { char nextChar = *(string + stringIndex); int wsp = wsCharp(nextChar); if (!wsp) { if (nextChar == '&') { *(buf + buffIndex++) = decodeEntityRef(&string[stringIndex+1], &stringIndex, len-stringIndex); } else { *(buf + buffIndex++) = nextChar; } inWhiteSpace = 0; } else if (!inWhiteSpace) { *(buf + buffIndex++) = ' '; inWhiteSpace = 1; } else { inWhiteSpace = 1; } stringIndex++; } return buf; } char * getHref(char** attlist) { char* ans = getAttributeValue(attlist, "resource"); if (!ans) ans = getAttributeValue(attlist, "rdf:resource"); return ans; } char * getID(char** attlist) { char* ans = getAttributeValue(attlist, "id"); if (!ans) ans = getAttributeValue(attlist, "about"); if (!ans) ans = getAttributeValue(attlist, "rdf:about"); return ans; } int parseNextRDFXMLBlobInt(RDFT f, char* blob, int size) { int n, last, m; int somethingseenp = 0; n = last = 0; while (n < size) { char c = blob[n]; if ((c == '\n') || (c == '\r')) lineNumber++; m = 0; somethingseenp = 0; /* memset(f->line, '\0', RDF_BUF_SIZE-1); */ if (f->holdOver[0] != '\0') { memcpy(f->line, f->holdOver, strlen(f->holdOver)); m = strlen(f->holdOver); somethingseenp = 1; f->holdOver[0] = '\0'; /* memset(f->holdOver, '\0', RDF_BUF_SIZE-1); */ } while ((n < size) && (wsCharp(c)) && (!somethingseenp)) { c = blob[++n]; if ((c == '\n') || (c == '\r')) lineNumber++; } while ((m < RDF_BUF_SIZE-1) && (c != '<') && (c != '>')) { f->line[m] = c; m++; somethingseenp = (somethingseenp || (!(wsCharp(c)))); n++; if (n < size) c = blob[n]; else break; if ((c == '\n') || (c == '\r')) lineNumber++; } f->line[m] = '\0'; f->line[m+1] = '\0'; if (c == '>') f->line[m] = c; n++; if (m > 0) { if ((c == '<') || (c == '>')) { last = n; if (c == '<') { f->holdOver[0] = '<'; f->holdOver[1] = '\0'; } if (somethingseenp == 1) { parseNextRDFToken(f, f->line); } } else if (size > last) { memcpy(f->holdOver, f->line, m); f->holdOver[m] = '\0'; } } else if (c == '<') { f->holdOver[0] = '<'; f->holdOver[1] = '\0'; } } return(1); } char * getAttributeValue (char** attlist, char* elName) { size_t n = 0; if (!attlist) return NULL; while ((n < 2*MAX_ATTRIBUTES) && (*(attlist + n) != NULL)) { char* attname = *(attlist + n); char* base = strchr(attname, ':'); if (base) attname = base + 1; if (strcmp(attname, elName) == 0) return *(attlist + n + 1); n = n + 2; } return NULL; } char* copyString (char* str) { char* ans = getMem(strlen(str)+1); if (ans) { memcpy(ans, str, strlen(str)); return ans; } else return NULL; } char* fcopyString (char* str) { char* ans = fgetMem(strlen(str)+1); if (ans) { memcpy(ans, str, strlen(str)); return ans; } else return NULL; } void addElementProps (char** attlist, char* elementName, RDFT f, RDF_Resource obj) { int count = 0; while (count < 2*MAX_ATTRIBUTES) { char* attName = attlist[count++]; char* attValue = attlist[count++]; char* baseName; if ((attName == NULL) || (attValue == NULL)) break; baseName = strchr(attName, ':'); if (baseName) attName = baseName + 1; if (startsWith("xmlns", attName)) { /* addNameSpace(attName, attValue, f); */ } else if (!stringEquals(attName, "resource") && !stringEquals(attName, "rdf:resource") && !stringEquals(attName, "about") && !stringEquals(attName, "rdf:about") && !stringEquals(attName, "tv") && !stringEquals(attName, "id")) { remoteStoreAdd(f, obj, getResource(attName, 1), copyStringIgnoreWhiteSpace(attValue), RDF_STRING_TYPE, 1); } } } int parseNextRDFToken (RDFT f, char* token) { char* attlist[2*MAX_ATTRIBUTES+1]; char* elementName; if (token[0] != '<') { if ((f->status == EXPECTING_OBJECT) && (f->depth > 1)) { RDF_Resource u = f->stack[f->depth-2]; RDF_Resource s = f->stack[f->depth-1]; char* val = copyStringIgnoreWhiteSpace(token); remoteStoreAdd(f, u, s, val , RDF_STRING_TYPE, 1); return 1; } else { printf(error_string, "Did not expect \n\"%s\".\n Was expecting a tag.", token); return 0; } } else if (startsWith("