/* -*- mode: objc; coding: utf-8 -*- */
/* Toilet Lisp, a Common Lisp subset for the Étoilé runtime.
 * Copyright (C) 2008  Matthias Andreas Benkard.
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or (at
 * your option) any later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#import "MLKReader.h"
#import "MLKCharacter.h"
#import "MLKReadtable.h"
#import "MLKReaderError.h"
#import "MLKDynamicContext.h"
#import "MLKEnvironment.h"
#import "MLKPackage.h"
#import "MLKFuncallable.h"
#import "MLKCharacterStream.h"
#import "MLKFloat.h"
#import "MLKInteger.h"
#import "MLKRatio.h"
#import "MLKStringInputStream.h"
#import "functions.h"
#import "runtime-compatibility.h"
#import "util.h"

#import <Foundation/NSArray.h>
#import <Foundation/NSException.h>
#import <Foundation/NSRange.h>
#import <Foundation/NSString.h>


// Checks that TOKEN, from index START to its very end, has the shape
//
//   [sign] decimal-digit+
//
// On success returns YES, stores the index of the first exponent digit in
// *DIGITSSTART and whether the sign was a minus sign in *NEGATIVE.  Returns
// NO (never reads out of range) when the digits are missing or when
// anything follows them.
static BOOL
MLKReaderScanExponent (NSString *token,
                       MLKReadtable *readtable,
                       unsigned long start,
                       unsigned long *digitsStart,
                       BOOL *negative)
{
  unsigned long length = [token length];
  unsigned long i = start;

  *negative = NO;

  if (i < length && [readtable isSign:[token characterAtIndex:i]])
    {
      *negative = [readtable isMinusSign:[token characterAtIndex:i]];
      i++;
    }

  *digitsStart = i;

  while (i < length && [readtable isDecimalDigit:[token characterAtIndex:i]])
    i++;

  return (i == length && i > *digitsStart);
}


// Tries to interpret TOKEN as an integer, ratio or float.
//
// Returns the number object, or nil when TOKEN does not match any of the
// number syntaxes handled here.  The caller is expected to treat a nil
// result as "this token is a symbol after all".
//
// Integers and ratios are read in BASE.  An integer written with a
// trailing decimal point, and every float, is read in base 10.
static id
MLKReaderNumberFromToken (NSString *token,
                          MLKReadtable *readtable,
                          int base)
{
  unsigned long length = [token length];
  unsigned long i, firstNum, secondNum, exponentStart;
  BOOL negative, exponentNegative;

  if (length == 0)
    return nil;

  // Read the sign (if present).
  if ([readtable isSign:[token characterAtIndex:0]])
    {
      negative = [readtable isMinusSign:[token characterAtIndex:0]];
      firstNum = 1;
    }
  else
    {
      negative = NO;
      firstNum = 0;
    }

  // Skip the leading run of decimal digits.
  i = firstNum;
  while (i < length && [readtable isDecimalDigit:[token characterAtIndex:i]])
    i++;

  if (i < length)
    {
      unichar separator = [token characterAtIndex:i];

      // A character that is a digit in the current base is a digit, not
      // an exponent marker (think of "1E5" with a read base of 16), so
      // such tokens are left to the integer/ratio code below.
      if (![readtable isDigit:separator inBase:base]
          && ([readtable isDecimalPoint:separator]
              || [readtable isExponentMarker:separator]))
        {
          NSString *integerPart =
            [token substringWithRange:NSMakeRange (firstNum, i - firstNum)];

          secondNum = i + 1;

          if ([readtable isExponentMarker:separator])
            {
              // <digits> <marker> [sign] <digits>
              if ([integerPart length] == 0
                  || !MLKReaderScanExponent (token, readtable, secondNum,
                                             &exponentStart,
                                             &exponentNegative))
                return nil;

              return [MLKFloat floatWithExponentMarker:separator
                               integerPart:integerPart
                               negative:negative
                               fractionalPart:@""
                               exponent:[token substringFromIndex:exponentStart]
                               exponentNegative:exponentNegative];
            }
          else
            {
              NSString *fractionalPart;

              if (secondNum == length)
                {
                  // <digits> "." -- a decimal integer.
                  if ([integerPart length] == 0)
                    return nil;

                  return MLKCanoniseInteger ([MLKInteger
                                               integerWithString:integerPart
                                               negative:negative
                                               base:10]);
                }

              // We're dealing with a floating point number.
              i = secondNum;
              while (i < length
                     && [readtable isDecimalDigit:[token characterAtIndex:i]])
                i++;

              fractionalPart =
                [token substringWithRange:NSMakeRange (secondNum,
                                                       i - secondNum)];

              if (i == length)
                {
                  // [digits] "." <digits>
                  return [MLKFloat floatWithExponentMarker:separator
                                   integerPart:integerPart
                                   negative:negative
                                   fractionalPart:fractionalPart
                                   exponent:@""
                                   exponentNegative:NO];
                }

              // [digits] "." [digits] <marker> [sign] <digits>
              //
              // token[i] must really be an exponent marker, and there has
              // to be at least one digit in front of it.
              if (![readtable isExponentMarker:[token characterAtIndex:i]]
                  || ([integerPart length] == 0
                      && [fractionalPart length] == 0)
                  || !MLKReaderScanExponent (token, readtable, i + 1,
                                             &exponentStart,
                                             &exponentNegative))
                return nil;

              return [MLKFloat floatWithExponentMarker:[token characterAtIndex:i]
                               integerPart:integerPart
                               negative:negative
                               fractionalPart:fractionalPart
                               exponent:[token substringFromIndex:exponentStart]
                               exponentNegative:exponentNegative];
            }
        }
    }

  // Integer or ratio in the current read base.
  i = firstNum;
  while (i < length
         && [readtable isDigit:[token characterAtIndex:i] inBase:base])
    i++;

  if (i == firstNum)
    return nil;

  if (i == length)
    {
      return MLKCanoniseInteger ([MLKInteger
                                   integerWithString:
                                     [token substringWithRange:
                                              NSMakeRange (firstNum,
                                                           length - firstNum)]
                                   negative:negative
                                   base:base]);
    }

  // Anything other than <digits> "/" <digits> is not a number.
  if (![readtable isRatioMarker:[token characterAtIndex:i]])
    return nil;

  secondNum = i + 1;
  i = secondNum;
  while (i < length
         && [readtable isDigit:[token characterAtIndex:i] inBase:base])
    i++;

  if (i == secondNum || i != length)
    return nil;

  return [MLKRatio ratioWithNumeratorString:
                     [token substringWithRange:
                              NSMakeRange (firstNum, secondNum - firstNum - 1)]
                   denominatorString:[token substringFromIndex:secondNum]
                   negative:negative
                   base:base];
}


@implementation MLKReader
// Convenience entry point: reads one object from STREAM without a
// consing-dot marker and without the "#:" uninterned-symbol mode.
+(id) readFromStream:(MLKCharacterStream *)stream
            eofError:(BOOL)eofError
            eofValue:(id)eofValue
           recursive:(BOOL)recursive
  preserveWhitespace:(BOOL)preserveWhitespace
{
  return [self readFromStream:stream
               eofError:eofError
               eofValue:eofValue
               recursive:recursive
               preserveWhitespace:preserveWhitespace
               singleDotMarker:nil
               readingUninternedSymbol:NO];
}

// Reads one object from STREAM using the readtable bound to
// COMMON-LISP:*READTABLE* in the current dynamic context.
//
//   eofError            If YES, hitting end of file before any object
//                       starts raises MLKEndOfFileError; otherwise
//                       eofValue is returned.
//   recursive           Accepted for interface compatibility; this method
//                       does not consult it.
//   preserveWhitespace  If YES, a whitespace character that terminates a
//                       token is pushed back onto the stream.
//   dotMarker           Object returned when the token read is a lone,
//                       unescaped "."; if nil, such a token raises
//                       MLKReaderError.
//   readingUninternedSymbol
//                       If YES, skips straight to token accumulation with
//                       the token pre-seeded with "#:".
//
// Raises MLKEndOfFileError when a single escape is the last character of
// the stream and MLKReaderError for invalid or unrecognized characters.
+(id) readFromStream:(MLKCharacterStream *)stream
            eofError:(BOOL)eofError
            eofValue:(id)eofValue
           recursive:(BOOL)recursive
  preserveWhitespace:(BOOL)preserveWhitespace
     singleDotMarker:(id)dotMarker
readingUninternedSymbol:(BOOL)readingUninternedSymbol
{
  unichar ch;
  NSMutableString *token;
  MLKReadtable *readtable;
  BOOL escaped = NO;        // Currently inside a multiple-escape section?
  BOOL ever_escaped = NO;   // Did any escape occur in this token?

  readtable = [[MLKDynamicContext currentContext]
                valueForSymbol:[[MLKPackage findPackage:@"COMMON-LISP"]
                                 intern:@"*READTABLE*"]];

  if (readingUninternedSymbol)
    {
      token = [NSMutableString stringWithString:@"#:"];
    }
  else
    {
      // Skip whitespace and run reader macros until a token starts.
      for (;;)
        {
          if ([stream isEOF])
            {
              if (eofError)
                [NSException raise:@"MLKEndOfFileError"
                             format:@"Premature end of file on stream %@.",
                                    stream];
              else
                return eofValue;
            }

          ch = [stream readChar];

          if ([readtable isWhitespaceCharacter:ch] || ch == '\0')
            continue;

          if ([readtable isMacroCharacter:ch])
            {
              NSArray *returnValues;
              id macrofun = [readtable macroFunctionForCharacter:ch];
              NSArray *args = [NSArray arrayWithObjects:
                                         stream,
                                         [MLKCharacter characterWithUnichar:ch],
                                         nil];

              // NOTE(review): this fallback rebuilds the argument list when
              // the variadic constructor yielded fewer than two elements.
              // The reason is not visible here -- presumably a runtime
              // workaround; confirm before removing.
              if ([args count] != 2)
                {
                  args = [NSMutableArray arrayWithCapacity:2];
                  [((NSMutableArray*)args) addObject:stream];
                  [((NSMutableArray*)args) addObject:
                    [MLKCharacter characterWithUnichar:ch]];
                }

              returnValues = [macrofun applyToArray:args];

              // A macro function that returns no values (a comment, say)
              // produced nothing, so keep looking.
              if ([returnValues count])
                return denullify ([returnValues objectAtIndex:0]);

              continue;
            }

          break;
        }

      // CH starts a token.  Always create the token here so that it can
      // never be used uninitialised.
      token = [NSMutableString stringWithCapacity:8];

      if ([readtable isSingleEscapeCharacter:ch])
        {
          if ([stream isEOF])
            [NSException raise:@"MLKEndOfFileError"
                         format:@"Premature end of file on stream %@.",
                                stream];

          [token appendFormat:@"%C", [stream readChar]];
          ever_escaped = YES;
        }
      else if ([readtable isMultipleEscapeCharacter:ch])
        {
          escaped = YES;
          ever_escaped = YES;
        }
      else if ([readtable isConstituentCharacter:ch])
        {
          if ([readtable isInvalid:ch])
            [NSException raise:@"MLKReaderError"
                         format:@"'%C' is an invalid constituent character.",
                                ch];

          [token appendFormat:@"%C", [readtable charWithReadtableCase:ch]];
        }
      else
        {
          [NSException raise:@"MLKReaderError"
                       format:@"'%C' is an unrecognized character.", ch];
        }
    }

  // Accumulate the rest of the token.
  while (![stream isEOF])
    {
      ch = [stream readChar];

      if (!escaped
          && [readtable isConstituentCharacter:ch]
          && [readtable isInvalid:ch])
        {
          // This test has to come before the general constituent case
          // below; otherwise it can never trigger.
          [NSException raise:@"MLKReaderError"
                       format:@"'%C' is an invalid constituent character.",
                              ch];
        }
      else if ([readtable isConstituentCharacter:ch]
               || [readtable isNonTerminatingMacroCharacter:ch]
               || (escaped
                   && (![readtable isMultipleEscapeCharacter:ch]
                       && ![readtable isSingleEscapeCharacter:ch])))
        {
          // Escaped characters are taken verbatim; everything else goes
          // through the readtable's case conversion.
          if (escaped)
            [token appendFormat:@"%C", ch];
          else
            [token appendFormat:@"%C", [readtable charWithReadtableCase:ch]];
        }
      else if ([readtable isSingleEscapeCharacter:ch])
        {
          if ([stream isEOF])
            [NSException raise:@"MLKEndOfFileError"
                         format:@"Premature end of file on stream %@.",
                                stream];

          [token appendFormat:@"%C", [stream readChar]];
          ever_escaped = YES;
        }
      else if ([readtable isMultipleEscapeCharacter:ch])
        {
          ever_escaped = YES;
          escaped = !escaped;
        }
      else if ([readtable isTerminatingMacroCharacter:ch])
        {
          [stream unreadChar:ch];
          break;
        }
      else if ([readtable isWhitespaceCharacter:ch])
        {
          if (preserveWhitespace)
            [stream unreadChar:ch];
          break;
        }
      else
        {
          [NSException raise:@"MLKReaderError"
                       format:@"'%C' is an unrecognized character.", ch];
        }
    }

  // Only an unescaped lone dot is the consing dot; "\." is a token like
  // any other.
  if (!ever_escaped && [token isEqualToString:@"."])
    {
      if (dotMarker)
        return dotMarker;
      else
        [NSException raise:@"MLKReaderError"
                     format:@"Unexpectedly read a single dot."];
    }

  return [self interpretToken:token
               readtable:readtable
               escaped:ever_escaped];
}

// Checks whether TOKEN is a potential number with respect to READTABLE
// and BASE.
//
// See CLHS 2.3.1.1.
+(BOOL) isPotentialNumber:(NSString *)token
                readtable:(MLKReadtable *)readtable
                     base:(int)base
{
  unsigned long i;
  unsigned long length = [token length];
  unichar first;
  BOOL digitFound = NO;

  // 1. Does it consist solely of characters allowed in a potential
  //    number?
  for (i = 0; i < length; i++)
    {
      unichar ch = [token characterAtIndex:i];

      if (!([readtable isDigit:ch inBase:base]
            || [readtable isSign:ch]
            || [readtable isRatioMarker:ch]
            || [readtable isDecimalPoint:ch]
            || ch == '^'
            || ch == '_'
            || ([readtable isNumberMarker:ch]
                // Adjacent number markers aren't to be considered number
                // markers at all.
                && (i == 0
                    || ![readtable isNumberMarker:
                                     [token characterAtIndex:(i-1)]]))))
        return NO;
    }

  // 2. Does the token contain a digit?  (An empty token fails here, so
  //    the index accesses below are always in range.)
  for (i = 0; i < length; i++)
    {
      if ([readtable isDigit:[token characterAtIndex:i] inBase:base])
        {
          digitFound = YES;
          break;
        }
    }

  if (!digitFound)
    return NO;

  // 3. Is the first character okay?
  first = [token characterAtIndex:0];
  if (!([readtable isDigit:first inBase:base]
        || [readtable isSign:first]
        || [readtable isDecimalPoint:first]
        || first == '^'
        || first == '_'))
    return NO;

  // 4. Does the token not end with a sign?
  if ([readtable isSign:[token characterAtIndex:(length - 1)]])
    return NO;

  return YES;
}

// Turns an accumulated TOKEN into a number or a symbol.
//
// ESCAPED tells whether any escape character occurred while the token was
// read; such a token is never a number.  Unescaped potential numbers are
// parsed using the value of COMMON-LISP:*READ-BASE*; a potential number
// that matches no number syntax is read as a symbol.
//
// Symbol tokens are split at the first package marker:
//
//   no marker          interned in the value of COMMON-LISP:*PACKAGE*
//   leading marker     interned in the KEYWORD package
//   "#" as package     a fresh symbol with no home package
//   pkg:name           must be exported from pkg, else MLKReaderError
//   pkg::name          interned in pkg
//
// Raises MLKReaderError if the named package cannot be found.
+(id) interpretToken:(NSString *)token
           readtable:(MLKReadtable *)readtable
             escaped:(BOOL)escaped
{
  int base;
  unsigned long i, length, packageMarker;
  BOOL hasPackageMarker;
  MLKPackage *package;
  NSString *symbolName;
  MLKSymbol *symbol;

  base = [[[MLKDynamicContext currentContext]
            valueForSymbol:[[MLKPackage findPackage:@"COMMON-LISP"]
                             intern:@"*READ-BASE*"]]
           intValue];

  if (!escaped && [self isPotentialNumber:token readtable:readtable base:base])
    {
      id number = MLKReaderNumberFromToken (token, readtable, base);

      if (number)
        return number;

      // Not actually a number; fall through and read it as a symbol.
    }

  // Look for the package marker.
  length = [token length];
  hasPackageMarker = NO;
  packageMarker = 0;
  for (i = 0; i < length; i++)
    {
      if ([readtable isPackageMarker:[token characterAtIndex:i]])
        {
          packageMarker = i;
          hasPackageMarker = YES;
          break;
        }
    }

  // Extract the package and symbol name.
  if (!hasPackageMarker)
    {
      package = [[MLKDynamicContext currentContext]
                  valueForSymbol:[[MLKPackage findPackage:@"COMMON-LISP"]
                                   intern:@"*PACKAGE*"]];
      symbolName = token;
    }
  else if (packageMarker == 0)
    {
      package = [MLKPackage findPackage:@"KEYWORD"];
      symbolName = [token substringFromIndex:1];
    }
  else
    {
      NSString *packageName = [token substringToIndex:packageMarker];

      if ([packageName isEqualToString:@"#"])
        package = nil;
      else
        {
          package = [MLKPackage findPackage:packageName];

          if (!package)
            [NSException raise:@"MLKReaderError"
                         format:@"Can't find package %@.",
                                [token substringToIndex:packageMarker]];
        }

      // The bounds check matters for tokens that end in a package marker
      // ("foo:", "#:").
      if (packageMarker + 1 < length
          && [readtable isPackageMarker:
                          [token characterAtIndex:(packageMarker + 1)]])
        symbolName = [token substringFromIndex:(packageMarker + 2)];
      else
        {
          // A single package marker means we have to check whether
          // the symbol is external in the package.
          symbolName = [token substringFromIndex:(packageMarker + 1)];

          if (package)
            {
              symbol = [package intern:symbolName];
              if (![[package exportedSymbols] containsObject:symbol])
                [NSException raise:@"MLKReaderError"
                             format:@"Package %@ does not export symbol %@.",
                                    [package name],
                                    MLKPrintToString(symbol)];
            }
        }
    }

  if (package)
    symbol = [package intern:symbolName];
  else
    symbol = [MLKSymbol symbolWithName:symbolName package:nil];

  return symbol;
}

// Reads one object from the text of STRING.  End of input before an
// object starts raises MLKEndOfFileError.
+(id) readFromString:(NSString *)string
{
  return [self readFromStream:LAUTORELEASE([[MLKStringInputStream alloc]
                                             initWithString:string])
               eofError:YES
               eofValue:nil
               recursive:NO
               preserveWhitespace:NO];
}
@end