No OneTemporary
Actions

Authored By

Unknown

Size

9 KB

Referenced Files

None

Subscribers

None

View Options

	diff --git a/util/tokenreader.cpp b/util/tokenreader.cpp
	index 012043a3..fedf0444 100644
	--- a/util/tokenreader.cpp
	+++ b/util/tokenreader.cpp
	@@ -1,340 +1,343 @@
	#include <fstream>
	#include <iostream>
	#include <string>
	#include <cstring>
	#include <sstream>
	#include <vector>

	#include "file-system.h"
	#include "token.h"
	#include "token_exception.h"
	#include "tokenreader.h"
	#include "pointer.h"

	using namespace std;

	/* tokenreader reads a file formatted with s-expressions. examples:
	* (hello)
	* (hello world)
	* (hello "world")
	* (hello (world))
	* (hello (world hi))
	*/

	TokenReader::TokenReader(){
	}

	TokenReader::TokenReader(const char * file){
	readTokenFromFile(file);
	}

	TokenReader::TokenReader(const string & file){
	readTokenFromFile(file);
	}

	Token * TokenReader::readTokenFromFile(const std::string & path){
	/*
	ifstream file(path.c_str());
	if (!file){
	ostringstream out;
	out << "Could not open '" << path << "'";
	throw TokenException(__FILE__, __LINE__, out.str());
	}
	file >> noskipws;
	*/
	Filesystem::AbsolutePath realPath(path);
	Util::ReferenceCount<Storage::File> file = Storage::instance().open(realPath);
	if (file == NULL \|\| !file->good()){
	throw TokenException(__FILE__, __LINE__, string("Could not read ") + realPath.path());
	}
	readTokens(*file.raw());
	// file.close();
	if (my_tokens.size() > 0){
	my_tokens[0]->setFile(path);
	return my_tokens[0];
	}
	ostringstream out;
	out << "No tokens read from " << path;
	throw TokenException(__FILE__, __LINE__, out.str());
	}

	Token * TokenReader::readTokenFromFile(Storage::File & file){
	readTokens(file);
	// file.close();
	if (my_tokens.size() > 0){
	my_tokens[0]->setFile("");
	return my_tokens[0];
	}
	ostringstream out;
	out << "No tokens read from file";
	throw TokenException(__FILE__, __LINE__, out.str());

	}

	Token * TokenReader::readToken(){
	if (my_tokens.size() > 0){
	return my_tokens[0];
	}
	throw TokenException(__FILE__, __LINE__, "No tokens read");
	}

	Token * TokenReader::readToken(const string & path){
	return readTokenFromFile(path);
	}

	Token * TokenReader::readToken(const char * path){
	return readTokenFromFile(path);
	}

	Token * TokenReader::readTokenFromString(const string & stuff){
	/*
	istringstream input(stuff);
	input >> noskipws;
	*/
	Storage::StringFile input(stuff);
	readTokens(input);
	if (my_tokens.size() > 0){
	return my_tokens[0];
	}
	throw TokenException(__FILE__, __LINE__, "No tokens read");
	}

	TokenReader::~TokenReader(){
	// ifile.close();

	/* tokenreader giveth, and tokenreader taketh */
	for ( vector< Token * >::iterator it = my_tokens.begin(); it != my_tokens.end(); it++ ){
	delete *it;
	}
	}

	static inline bool is_alpha(char c){
	// const char * alpha = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789./-_!:*";
	const char * alpha = "./-_!:*";
	return (c >= 'a' && c <= 'z') \|\|
	(c >= 'A' && c <= 'Z') \|\|
	(c >= '0' && c <= '9') \|\|
	strchr(alpha, c) != NULL;
	}

	static inline bool is_nonalpha(char c){
	const char * nonalpha = " ;()#\"";
	return strchr(nonalpha, c) != NULL;
	}

	class BufferedStream{
	public:
	BufferedStream(Storage::File & input):
	data(NULL),
	position(0),
	size(input.getSize()){
	+ if (input.getSize() == 0){
	+ throw TokenException(__FILE__, __LINE__, "File has size 0");
	+ }
	data = new unsigned char[size];
	input.readLine((char*) data, size);
	}

	BufferedStream & operator>>(unsigned char & n){
	if (position < size){
	n = data[position];
	position += 1;
	}
	return *this;
	}

	bool eof(){
	return position >= size;
	}

	~BufferedStream(){
	delete[] data;
	}

	unsigned char * data;
	int position;
	int size;
	};

	void TokenReader::readTokens(Storage::File & input){

	/*
	if ( !ifile ){
	ostringstream out;
	out << "Could not open '" << myfile << "'";
	throw TokenException(__FILE__, __LINE__, out.str());
	}
	*/
	// Token * t;

	// string token_string;

	// char open_paren = 'x';
	int parens = 0;
	// int position = 0;
	/*
	while (input.good() && open_paren != '('){
	input >> open_paren;
	position += 1;
	}
	*/
	// token_string += '(';

	BufferedStream buffer(input);

	Token * currentToken = NULL;
	// Token * cur_token = new Token();
	// cur_token->setFile(myfile);
	// my_tokens.push_back(cur_token);
	// Token * first = cur_token;
	vector<Token *> token_stack;
	/* tokens that were ignored using ;@, and should be deleted */
	vector<Util::ReferenceCount<Token> > ignore_list;
	// token_stack.push_back(cur_token);

	/* when a ;@ is seen, read the next s-expression but throw it away */
	bool do_ignore = false;

	unsigned char n = 0;
	string cur_string = "";

	/* in_quote is true if a " is read and before another " is read */
	bool in_quote = false;

	/* escaped unconditionally adds the next character to the string */
	bool escaped = false;
	while (!buffer.eof()){
	// char n;
	// slow as we go
	buffer >> n;
	// position += 1;
	// printf("Read character '%c' %d at %d\n", n, n, input.tellg());
	// cout << "Read character '" << n << "' " << (int) n << " at " << input.tellg() << endl;

	// cout<<"Alpha char: "<<n<<endl;

	if (escaped){
	switch (n){
	case 'n' : {
	cur_string += "\n";
	break;
	}
	default : {
	cur_string += n;
	break;
	}
	}
	escaped = false;
	continue;
	}

	if (n == '\\'){
	escaped = true;
	continue;
	}

	if (in_quote){
	if (n == '"'){
	in_quote = false;

	Token * sub = new Token(cur_string, false);
	if (currentToken != NULL){
	sub->setParent(currentToken);
	if (do_ignore){
	ignore_list.push_back(Util::ReferenceCount<Token>(sub));
	do_ignore = false;
	} else {
	currentToken->addToken(sub);
	}
	cur_string = "";
	} else {
	delete sub;
	}
	} else {
	cur_string += n;
	}
	} else {
	/* not in a quote */

	if (n == '"'){
	in_quote = true;
	} else if (is_alpha(n)){
	cur_string += n;
	} else if (cur_string != "" && is_nonalpha(n)){
	// cout<<"Made new token "<<cur_string<<endl;
	Token * sub = new Token(cur_string, false);
	if (currentToken != NULL){
	sub->setParent(currentToken);
	if (do_ignore){
	do_ignore = false;
	ignore_list.push_back(Util::ReferenceCount<Token>(sub));
	} else {
	currentToken->addToken(sub);
	}
	} else {
	delete sub;
	}
	cur_string = "";
	}

	if (n == '#' \|\| n == ';'){
	buffer >> n;

	/* if the next character is a @ then ignore the next entire s-expression
	* otherwise just ignore the current line
	*/
	if (n == '@'){
	do_ignore = true;
	} else {
	while (n != '\n' && !buffer.eof()){
	buffer >> n;
	}
	continue;
	}
	} else if (n == '('){
	Token * another = new Token();
	if (currentToken != NULL){
	another->setParent(currentToken);
	}

	if (do_ignore){
	ignore_list.push_back(Util::ReferenceCount<Token>(another));
	do_ignore = false;
	} else {
	if (currentToken != NULL){
	currentToken->addToken(another);
	} else {
	/* top level token */
	my_tokens.push_back(another);
	}
	}

	parens += 1;
	currentToken = another;
	token_stack.push_back(currentToken);
	} else if (n == ')'){
	parens -= 1;
	if (token_stack.empty()){
	throw TokenException(__FILE__, __LINE__, "Saw a ) but there is no corresponding (");
	}
	token_stack.pop_back();

	if (! token_stack.empty()){
	currentToken = token_stack.back();
	} else {
	currentToken = NULL;
	}
	}
	}
	}

	if (!token_stack.empty()){
	ostringstream failure;
	failure << "Wrong number of parentheses. Open parens is " << parens;
	throw TokenException(__FILE__, __LINE__, failure.str());
	}

	/*
	for (vector<Token*>::iterator it = my_tokens.begin(); it != my_tokens.end(); it++){
	Token * token = *it;
	token->finalize();
	}
	*/
	}

File Metadata

Mime Type: text/x-diff
Expires: Mon, Jun 22, 8:14 PM (6 d, 13 h ago)
Storage Engine: blob
Storage Format: Raw Data
Storage Handle: 72947
Default Alt Text: (9 KB)

No OneTemporaryActions

View Options

File Metadata

Event Timeline

No OneTemporary
Actions