资源库-编译原理实验一：c++ vector实现简单词法分析器

dbkx_29

已于 2024-05-28 15:27:04 修改

阅读量112

点赞数 1

文章标签： c++ 开发语言

于 2024-05-20 15:44:21 首次发布

本文链接：https://blog.csdn.net/dbkx_29/article/details/139067060

版权

#include <iostream>
using namespace std;
#include <string>

// One lexical unit produced by the tokenizer.
// Kept as a plain aggregate so it can be brace-initialized as {type, value}.
struct Token {
	// Category label of the token, e.g. "IDENTIFIER", "SEPARATOR".
	std::string type;
	// The token's value.
	std::string value;
};
#include <vector>
#include <cctype>

// Looks up `identifier` among the words this lexer treats specially.
//
// Returns {true, label} when the word is "int", "main" or "return", where
// label is the token type reported for that word. Returns {false, ""} for
// every other input. The comparison is exact and case-sensitive.
std::pair<bool, std::string> keywordIdentify(std::string identifier) {
	struct ReservedWord {
		const char *lexeme; // spelling as it appears in the source text
		const char *label;  // token type reported for that spelling
	};
	static const ReservedWord kReservedWords[] = {
		{"int", "关键字int"},
		{"main", "主程序入口main"},
		{"return", "关键字return"},
	};

	for (const ReservedWord &word : kReservedWords) {
		if (identifier == word.lexeme) {
			return std::pair<bool, std::string>(true, word.label);
		}
	}
	return std::pair<bool, std::string>(false, "");
}

// Splits `input` into a flat sequence of tokens, scanning left to right.
//
// Rules:
//  - whitespace is skipped and produces no token;
//  - a run that starts with a letter or '_' and continues with letters,
//    digits or '_' is one word. keywordIdentify() decides whether it gets a
//    keyword label as its type; otherwise its type is "标识符" (identifier);
//  - every other character, digits included, becomes its own one-character
//    token of type "分隔符" (separator).
//
// Returns the tokens in order of appearance; the result is empty when
// `input` is empty or contains only whitespace.
std::vector<Token> tokenize(const std::string &input) {
	// The <cctype> classifiers have undefined behaviour when given a negative
	// value other than EOF, which is what a plain char holding a non-ASCII
	// byte becomes where char is signed. Widen through unsigned char first.
	const auto isSpace = [](char c) {
		return std::isspace(static_cast<unsigned char>(c)) != 0;
	};
	const auto isWordStart = [](char c) {
		return c == '_' || std::isalpha(static_cast<unsigned char>(c)) != 0;
	};
	const auto isWordPart = [](char c) {
		return c == '_' || std::isalnum(static_cast<unsigned char>(c)) != 0;
	};

	std::vector<Token> tokens;
	std::size_t pos = 0;

	while (pos < input.size()) {
		const char current = input[pos];

		if (isSpace(current)) { // whitespace: consume, emit nothing
			++pos;
		} else if (isWordStart(current)) { // keyword or identifier
			const std::size_t start = pos;
			while (pos < input.size() && isWordPart(input[pos])) {
				++pos;
			}
			const std::string identifier = input.substr(start, pos - start);

			const std::pair<bool, std::string> res = keywordIdentify(identifier);
			if (res.first) {
				tokens.push_back({res.second, identifier});
			} else {
				tokens.push_back({"标识符", identifier});
			}
		} else { // anything else is emitted as a single-character separator
			tokens.push_back({"分隔符", std::string(1, current)});
			++pos;
		}
	}

	return tokens;
}



int main() {
	string input = "int main() { int __a = 5; return 0; }";
	auto tokens = tokenize(input);

	for (const auto &token : tokens) {
		std::cout << "Type: " << token.type << ", Value: '" << token.value << "'\n";
	}

	return 0;
}