2017-06-21 06:18:46 +02:00
|
|
|
//
|
|
|
|
// RSOPMLParser.m
|
2017-06-26 01:32:07 +02:00
|
|
|
// RSParser
|
2017-06-21 06:18:46 +02:00
|
|
|
//
|
|
|
|
// Created by Brent Simmons on 7/12/15.
|
|
|
|
// Copyright © 2015 Ranchero Software, LLC. All rights reserved.
|
|
|
|
//
|
|
|
|
|
|
|
|
#import "RSOPMLParser.h"
|
|
|
|
#import <libxml/xmlstring.h>
|
|
|
|
#import "RSSAXParser.h"
|
|
|
|
#import "RSOPMLItem.h"
|
|
|
|
#import "RSOPMLDocument.h"
|
|
|
|
#import "RSOPMLAttributes.h"
|
2017-06-26 01:32:07 +02:00
|
|
|
#import <RSParser/RSParser-Swift.h>
|
|
|
|
#import "RSOPMLError.h"
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
|
|
|
|
@interface RSOPMLParser () <RSSAXParserDelegate>
|
|
|
|
|
|
|
|
@property (nonatomic, readwrite) RSOPMLDocument *OPMLDocument;
|
|
|
|
@property (nonatomic, readwrite) NSError *error;
|
|
|
|
@property (nonatomic) NSMutableArray *itemStack;
|
|
|
|
|
|
|
|
@end
|
|
|
|
|
|
|
|
|
|
|
|
@implementation RSOPMLParser
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
#pragma mark - Class Methods
|
|
|
|
|
|
|
|
+ (RSOPMLDocument *)parseOPMLWithParserData:(ParserData *)parserData error:(NSError **)error {
|
|
|
|
|
|
|
|
RSOPMLParser *parser = [[RSOPMLParser alloc] initWithParserData:parserData];
|
|
|
|
|
|
|
|
RSOPMLDocument *document = parser.OPMLDocument;
|
2017-06-26 02:42:30 +02:00
|
|
|
if (parser.error && error) {
|
2017-06-26 01:32:07 +02:00
|
|
|
*error = parser.error;
|
|
|
|
return nil;
|
|
|
|
}
|
|
|
|
return document;
|
|
|
|
}
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
#pragma mark - Init
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
- (instancetype)initWithParserData:(ParserData *)parserData {
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
self = [super init];
|
|
|
|
if (!self) {
|
|
|
|
return nil;
|
|
|
|
}
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
[self parse:parserData];
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
return self;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#pragma mark - Private
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
- (void)parse:(ParserData *)parserData {
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
@autoreleasepool {
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
if (![self canParseData:parserData.data]) {
|
2017-06-21 06:18:46 +02:00
|
|
|
|
|
|
|
NSString *filename = nil;
|
2017-06-26 01:32:07 +02:00
|
|
|
NSURL *url = [NSURL URLWithString:parserData.url];
|
2017-06-21 06:18:46 +02:00
|
|
|
if (url && url.isFileURL) {
|
|
|
|
filename = url.path.lastPathComponent;
|
|
|
|
}
|
2017-06-26 01:32:07 +02:00
|
|
|
if ([parserData.url hasPrefix:@"http"]) {
|
|
|
|
filename = parserData.url;
|
2017-06-21 06:18:46 +02:00
|
|
|
}
|
|
|
|
if (!filename) {
|
2017-06-26 01:32:07 +02:00
|
|
|
filename = parserData.url;
|
2017-06-21 06:18:46 +02:00
|
|
|
}
|
|
|
|
self.error = RSOPMLWrongFormatError(filename);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
RSSAXParser *parser = [[RSSAXParser alloc] initWithDelegate:self];
|
|
|
|
|
|
|
|
self.itemStack = [NSMutableArray new];
|
|
|
|
self.OPMLDocument = [RSOPMLDocument new];
|
|
|
|
[self pushItem:self.OPMLDocument];
|
|
|
|
|
2017-06-26 01:32:07 +02:00
|
|
|
[parser parseData:parserData.data];
|
2017-06-21 06:18:46 +02:00
|
|
|
[parser finishParsing];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
- (BOOL)canParseData:(NSData *)d {
|
|
|
|
|
|
|
|
// Check for <opml and <outline near the top.
|
|
|
|
|
|
|
|
@autoreleasepool {
|
|
|
|
|
|
|
|
NSString *s = [[NSString alloc] initWithBytesNoCopy:(void *)d.bytes length:d.length encoding:NSUTF8StringEncoding freeWhenDone:NO];
|
|
|
|
if (!s) {
|
|
|
|
NSDictionary *options = @{NSStringEncodingDetectionSuggestedEncodingsKey : @[@(NSUTF8StringEncoding)]};
|
|
|
|
(void)[NSString stringEncodingForData:d encodingOptions:options convertedString:&s usedLossyConversion:nil];
|
|
|
|
}
|
|
|
|
if (!s) {
|
|
|
|
return NO;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const NSInteger numberOfCharactersToSearch = 4096;
|
|
|
|
NSRange rangeToSearch = NSMakeRange(0, numberOfCharactersToSearch);
|
|
|
|
if (s.length < numberOfCharactersToSearch) {
|
|
|
|
rangeToSearch.length = s.length;
|
|
|
|
}
|
|
|
|
|
|
|
|
NSRange opmlRange = [s rangeOfString:@"<opml" options:NSCaseInsensitiveSearch range:rangeToSearch];
|
|
|
|
if (opmlRange.length < 1) {
|
|
|
|
return NO;
|
|
|
|
}
|
|
|
|
|
|
|
|
NSRange outlineRange = [s rangeOfString:@"<outline" options:NSLiteralSearch range:rangeToSearch];
|
|
|
|
if (outlineRange.length < 1) {
|
|
|
|
return NO;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (outlineRange.location < opmlRange.location) {
|
|
|
|
return NO;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return YES;
|
|
|
|
}
|
|
|
|
|
|
|
|
- (void)pushItem:(RSOPMLItem *)item {
|
|
|
|
|
|
|
|
[self.itemStack addObject:item];
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
- (void)popItem {
|
|
|
|
|
|
|
|
NSAssert(self.itemStack.count > 0, nil);
|
|
|
|
|
|
|
|
/*If itemStack is empty, bad things are happening.
|
|
|
|
But we still shouldn't crash in production.*/
|
|
|
|
|
|
|
|
if (self.itemStack.count > 0) {
|
|
|
|
[self.itemStack removeLastObject];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
- (RSOPMLItem *)currentItem {
|
|
|
|
|
|
|
|
return self.itemStack.lastObject;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#pragma mark - RSSAXParserDelegate
|
|
|
|
|
|
|
|
static const char *kOutline = "outline";
|
|
|
|
static const char kOutlineLength = 8;
|
|
|
|
|
|
|
|
- (void)saxParser:(RSSAXParser *)SAXParser XMLStartElement:(const xmlChar *)localName prefix:(const xmlChar *)prefix uri:(const xmlChar *)uri numberOfNamespaces:(NSInteger)numberOfNamespaces namespaces:(const xmlChar **)namespaces numberOfAttributes:(NSInteger)numberOfAttributes numberDefaulted:(int)numberDefaulted attributes:(const xmlChar **)attributes {
|
|
|
|
|
|
|
|
if (!RSSAXEqualTags(localName, kOutline, kOutlineLength)) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
RSOPMLItem *item = [RSOPMLItem new];
|
|
|
|
item.attributes = [SAXParser attributesDictionary:attributes numberOfAttributes:numberOfAttributes];
|
|
|
|
|
|
|
|
[[self currentItem] addChild:item];
|
|
|
|
[self pushItem:item];
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
- (void)saxParser:(RSSAXParser *)SAXParser XMLEndElement:(const xmlChar *)localName prefix:(const xmlChar *)prefix uri:(const xmlChar *)uri {
|
|
|
|
|
|
|
|
if (RSSAXEqualTags(localName, kOutline, kOutlineLength)) {
|
|
|
|
[self popItem];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static const char *kText = "text";
|
|
|
|
static const NSInteger kTextLength = 5;
|
|
|
|
|
|
|
|
static const char *kTitle = "title";
|
|
|
|
static const NSInteger kTitleLength = 6;
|
|
|
|
|
|
|
|
static const char *kDescription = "description";
|
|
|
|
static const NSInteger kDescriptionLength = 12;
|
|
|
|
|
|
|
|
static const char *kType = "type";
|
|
|
|
static const NSInteger kTypeLength = 5;
|
|
|
|
|
|
|
|
static const char *kVersion = "version";
|
|
|
|
static const NSInteger kVersionLength = 8;
|
|
|
|
|
|
|
|
static const char *kHTMLURL = "htmlUrl";
|
|
|
|
static const NSInteger kHTMLURLLength = 8;
|
|
|
|
|
|
|
|
static const char *kXMLURL = "xmlUrl";
|
|
|
|
static const NSInteger kXMLURLLength = 7;
|
|
|
|
|
|
|
|
- (NSString *)saxParser:(RSSAXParser *)SAXParser internedStringForName:(const xmlChar *)name prefix:(const xmlChar *)prefix {
|
|
|
|
|
|
|
|
if (prefix) {
|
|
|
|
return nil;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t nameLength = strlen((const char *)name);
|
|
|
|
|
|
|
|
if (nameLength == kTextLength - 1) {
|
|
|
|
if (RSSAXEqualTags(name, kText, kTextLength)) {
|
|
|
|
return OPMLTextKey;
|
|
|
|
}
|
|
|
|
if (RSSAXEqualTags(name, kType, kTypeLength)) {
|
|
|
|
return OPMLTypeKey;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
else if (nameLength == kTitleLength - 1) {
|
|
|
|
if (RSSAXEqualTags(name, kTitle, kTitleLength)) {
|
|
|
|
return OPMLTitleKey;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
else if (nameLength == kXMLURLLength - 1) {
|
|
|
|
if (RSSAXEqualTags(name, kXMLURL, kXMLURLLength)) {
|
|
|
|
return OPMLXMLURLKey;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
else if (nameLength == kVersionLength - 1) {
|
|
|
|
if (RSSAXEqualTags(name, kVersion, kVersionLength)) {
|
|
|
|
return OPMLVersionKey;
|
|
|
|
}
|
|
|
|
if (RSSAXEqualTags(name, kHTMLURL, kHTMLURLLength)) {
|
|
|
|
return OPMLHMTLURLKey;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
else if (nameLength == kDescriptionLength - 1) {
|
|
|
|
if (RSSAXEqualTags(name, kDescription, kDescriptionLength)) {
|
|
|
|
return OPMLDescriptionKey;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static const char *kRSSUppercase = "RSS";
|
|
|
|
static const char *kRSSLowercase = "rss";
|
|
|
|
static const NSUInteger kRSSLength = 3;
|
|
|
|
static NSString *RSSUppercaseValue = @"RSS";
|
|
|
|
static NSString *RSSLowercaseValue = @"rss";
|
|
|
|
static NSString *emptyString = @"";
|
|
|
|
|
|
|
|
static BOOL equalBytes(const void *bytes1, const void *bytes2, NSUInteger length) {
|
|
|
|
|
|
|
|
return memcmp(bytes1, bytes2, length) == 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
- (NSString *)saxParser:(RSSAXParser *)SAXParser internedStringForValue:(const void *)bytes length:(NSUInteger)length {
|
|
|
|
|
|
|
|
|
|
|
|
if (length < 1) {
|
|
|
|
return emptyString;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (length == kRSSLength) {
|
|
|
|
|
|
|
|
if (equalBytes(bytes, kRSSUppercase, kRSSLength)) {
|
|
|
|
return RSSUppercaseValue;
|
|
|
|
}
|
|
|
|
else if (equalBytes(bytes, kRSSLowercase, kRSSLength)) {
|
|
|
|
return RSSLowercaseValue;
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
@end
|