/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */ /* * This file is part of the LibreOffice project. * * This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at http://mozilla.org/MPL/2.0/. * * This file incorporates work covered by the following license notice: * * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed * with this work for additional information regarding copyright * ownership. The ASF licenses this file to you under the Apache * License, Version 2.0 (the "License"); you may not use this file * except in compliance with the License. You may obtain a copy of * the License at http://www.apache.org/licenses/LICENSE-2.0 . */ #include #import "OOoMetaDataParser.h" static NSSet *singleValueXMLElements; static NSSet *multiValueXMLElements; static NSDictionary *metaXML2MDIKeys; @implementation OOoMetaDataParser + (void)initialize { static BOOL isInitialized = NO; if (isInitialized == NO) { //set up the meta elements with only one value NSMutableSet *temp = [NSMutableSet new]; //FIXME these should use namespace URIs and not prefixes [temp addObject:@"dc:title"]; [temp addObject:@"dc:description"]; [temp addObject:@"meta:user-defined"]; singleValueXMLElements = [[NSSet setWithSet:temp] retain]; //set up the meta elements that can have more than one value [temp removeAllObjects]; [temp addObject:@"dc:subject"]; [temp addObject:@"meta:keyword"]; [temp addObject:@"meta:initial-creator"]; [temp addObject:@"dc:creator"]; multiValueXMLElements = [[NSSet setWithSet:temp] retain]; [temp release]; //set up the map to store the values with the correct MDI keys NSMutableDictionary *tempDict = [NSMutableDictionary new]; [tempDict setObject:(NSString*)kMDItemTitle forKey:@"dc:title"]; [tempDict setObject:(NSString*)kMDItemDescription forKey:@"dc:description"]; [tempDict setObject:(NSString*)kMDItemKeywords forKey:@"dc:subject"]; [tempDict setObject:(NSString*)kMDItemAuthors forKey:@"meta:initial-creator"]; [tempDict setObject:(NSString*)kMDItemAuthors forKey:@"dc:creator"]; [tempDict setObject:(NSString*)kMDItemKeywords forKey:@"meta:keyword"]; [tempDict setObject:@"org_openoffice_opendocument_custominfo1" forKey:@"Info 1"]; [tempDict setObject:@"org_openoffice_opendocument_custominfo2" forKey:@"Info 2"]; [tempDict setObject:@"org_openoffice_opendocument_custominfo3" forKey:@"Info 3"]; [tempDict setObject:@"org_openoffice_opendocument_custominfo4" forKey:@"Info 4"]; metaXML2MDIKeys = [[NSDictionary dictionaryWithDictionary:tempDict] retain]; [tempDict release]; isInitialized = YES; } } - (id)init { if ((self = [super init]) != nil) { shouldReadCharacters = NO; textCurrentElement = nil; return self; } return nil; } - (void)parseXML:(NSData*)data intoDictionary:(NSMutableDictionary*)dict { metaValues = dict; //NSLog(@"data: %@ %d", data, [data length]); //init parser settings shouldReadCharacters = NO; NSXMLParser *parser = [[NSXMLParser alloc] initWithData:data]; // class 'OOoMetaDataParser' does not implement the 'NSXMLParserDelegate' protocol // So instead of this: // [parser setDelegate:self]; // do this: ((id (*)(id, SEL, ...))objc_msgSend)(parser, @selector(setDelegate:), self); [parser setShouldResolveExternalEntities:NO]; [parser parse]; [parser release]; //NSLog(@"finished parsing meta"); } - (void)parser:(NSXMLParser *)parser didStartElement:(NSString *)elementName namespaceURI:(NSString *)namespaceURI qualifiedName:(NSString *)qualifiedName attributes:(NSDictionary *)attributeDict { (void) parser; // unused (void) namespaceURI; // FIXME this should not be ignored but should be used // instead of meta: prefix in the comparison below! (void) qualifiedName; // unused // NSLog(@"<%@>", elementName); if ([singleValueXMLElements containsObject:elementName] == YES) { shouldReadCharacters = YES; } else if ([multiValueXMLElements containsObject:elementName] == YES) { shouldReadCharacters = YES; } else { //we are not interested in this element shouldReadCharacters = NO; return; } if (shouldReadCharacters == YES) { textCurrentElement = [NSMutableString new]; isCustom = [elementName isEqualToString:@"meta:user-defined"]; if (isCustom == YES) { customAttribute = [[attributeDict objectForKey:@"meta:name"] retain]; //NSLog(customAttribute); } } //NSLog(@"start element %@", elementName); } - (void)parser:(NSXMLParser *)parser didEndElement:(NSString *)elementName namespaceURI:(NSString *)namespaceURI qualifiedName:(NSString *)qName { (void) parser; // unused (void) namespaceURI; // unused (void) qName; // unused // NSLog(@"", elementName); if (shouldReadCharacters == YES) { NSString *mdiName = nil; if (isCustom == YES) { mdiName = (NSString*)[metaXML2MDIKeys objectForKey:customAttribute]; } else { mdiName = (NSString*)[metaXML2MDIKeys objectForKey:elementName]; } //NSLog(@"mdiName: %@", mdiName); if (mdiName == nil) { return; } if ([singleValueXMLElements containsObject:elementName] == YES) { [metaValues setObject:textCurrentElement forKey:mdiName]; } else { // must be multi-value NSMutableArray *arr = [metaValues objectForKey:mdiName]; if (arr == nil) { // we have no array yet, create it arr = [[NSMutableArray new] autorelease]; // and store it [metaValues setObject:arr forKey:mdiName]; } // only store an element once, no need for duplicates if ([arr containsObject:textCurrentElement] == NO) { [arr addObject:textCurrentElement]; } } // cleanup part 1 [textCurrentElement release]; if (isCustom == YES) { [customAttribute release]; } } //cleanup part 2 shouldReadCharacters = NO; isCustom = NO; } - (void)parser:(NSXMLParser *)parser foundCharacters:(NSString *)string { (void) parser; // unused // NSLog(@"%@", string); if (shouldReadCharacters == NO) { return; } // this delegate method might be called several times for a single element, // so we have to collect the received data [textCurrentElement appendString:string]; //NSLog(@"chars read: %@", string); } - (void)parser:(NSXMLParser *)parser parseErrorOccurred:(NSError *)parseError { //NSLog(@"parsing finished with error"); NSLog(@"Error %li, Description: %@, Line: %li, Column: %li", (long) [parseError code], [[parser parserError] localizedDescription], (long) [parser lineNumber], (long) [parser columnNumber]); } @end /* vim:set shiftwidth=4 softtabstop=4 expandtab: */