0% found this document useful (0 votes)
11 views7 pages

CC Project Code

Uploaded by

muhamanibutt
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
11 views7 pages

CC Project Code

Uploaded by

muhamanibutt
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
You are on page 1/ 7

#include <iostream>

#include <string>
#include <fstream>
#include <vector>
#include <sstream>
#include <unordered_set>
#include <string>
#include <fstream>
#include <unordered_map>
#include <regex>

using namespace std;

// --- Global scanner state shared by every phase of the pipeline ---

// Running token count. NOTE(review): never updated or read anywhere in this
// file — appears unused.
int totalTokens = 0;
// Raw input lines, filled by load_data() or load_data_from_string().
vector<string> linesFromDataFile;
// NOTE(review): declared but never written or read in this file — appears unused.
vector<vector<string>> tokenizedData;
// Lines after comment removal and whitespace collapsing (process_lines()).
vector<string> cleanedLines;
// Flat list of all tokens produced by tokenize_lines().
vector<string> tokenizedLines;
// Token sets accumulated by fa_scanner(), one per lexical category.
unordered_set<string> found_operators = {};
unordered_set<string> found_punctuators = {};
unordered_set<string> found_keywords = {};
unordered_set<string> found_identifiers = {};
unordered_set<string> found_constants = {};
unordered_set<string> found_literals = {};
unordered_set<string> found_special_characters = {};
// NOTE(review): never inserted into — invalid tokens go to `errors` instead.
unordered_set<string> found_invalid_tokens = {};

// Tokens that matched no category; written to errors.txt by fa_scanner().
vector<string> errors;
// Built-in sample source program, scanned when file input is disabled in main().
string local_data;

// Splits the embedded sample program (global `local_data`) into lines and
// appends them to the global `linesFromDataFile`, echoing them to stdout.
void load_data_from_string()
{
    stringstream reader(local_data);
    string current;

    while (getline(reader, current)) {
        linesFromDataFile.push_back(current);
    }

    cout << "\nStored lines from local_data:";
    for (const auto& stored : linesFromDataFile) {
        cout << stored << endl;
    }
}
// Reads the input program from "Sourcecode.txt" into the global
// `linesFromDataFile`, echoing the stored lines to stdout.
// On open failure it prints an error and leaves the vector untouched.
void load_data()
{
    ifstream fin("Sourcecode.txt");
    string line;

    if (!fin)
    {
        // Bug fix: the old message blamed "data.txt" even though this
        // function opens Sourcecode.txt.
        cout << "Error opening Sourcecode.txt!" << endl;
        return;
    }
    while (getline(fin, line))
    {
        linesFromDataFile.push_back(line);
    }
    fin.close();

    // Same filename fix as above: report the file we actually read.
    cout << "\nStored lines from Sourcecode.txt:\n";
    for (const auto& stored : linesFromDataFile)
    {
        cout << stored << endl;
    }
    cout << endl << endl;
}
// Strips // and /* */ comments from a single line, collapses runs of spaces
// to one, and trims leading/trailing spaces. Quote characters toggle an
// in-string flag so comment markers inside "..." are kept verbatim.
// NOTE: operates line-by-line, so a /* */ comment cannot span lines
// (inComment is local) — unchanged from the original design.
//
// Bug fixes vs. the original:
//  1. On entering "/*" the '*' is now skipped, so "/*/" no longer closes
//     the comment immediately.
//  2. Characters inside a block comment are fully ignored: a '"' no longer
//     toggles inString or leaks into the output, and a "//" inside
//     /* ... */ (e.g. a URL) no longer truncates the line.
string remove_comments_and_spaces(const string& line) {
    string cleanedLine;
    bool inComment = false;
    bool inString = false;

    for (size_t i = 0; i < line.length(); ++i)
    {
        if (inComment) {
            // Inside /* ... */: only the closing "*/" matters.
            if (line[i] == '*' && (i + 1) < line.length() && line[i + 1] == '/') {
                inComment = false;
                ++i; // consume the '/'
            }
            continue;
        }

        if (line[i] == '\"') {
            inString = !inString;
            cleanedLine += line[i];
            continue;
        }

        if (!inString && line[i] == '/' && (i + 1) < line.length() && line[i + 1] == '/')
        { // line comment: drop the rest of the line
            break;
        }
        if (!inString && line[i] == '/' && (i + 1) < line.length() && line[i + 1] == '*')
        { // block comment opens
            inComment = true;
            ++i; // consume the '*' so "/*/" does not close immediately
            continue;
        }

        // Collapse consecutive spaces; never emit a leading space.
        if (line[i] != ' ' || (cleanedLine.length() > 0 && cleanedLine.back() != ' ')) {
            cleanedLine += line[i];
        }
    }

    // Trim leading/trailing spaces; empty result means the line was all
    // comment/whitespace.
    size_t start = cleanedLine.find_first_not_of(' ');
    size_t end = cleanedLine.find_last_not_of(' ');
    return (start == string::npos) ? "" : cleanedLine.substr(start, end - start + 1);
}
void process_lines(const vector<string>& linesFromDataFile)
{
for (const auto& line : linesFromDataFile)
{
string cleanedLine = remove_comments_and_spaces(line);
if (!cleanedLine.empty())
{
cleanedLines.push_back(cleanedLine);
}
}
}
// Splits each cleaned line into tokens, appending them to the global
// `tokenizedLines`. Whitespace separates tokens; the single characters
// ; ( ) { } [ ] < > # both separate tokens and are emitted as tokens
// themselves. Finally prints all tokens to stdout.
//
// Fixes vs. the original: removed the unused `tokenRegex` local, and
// isspace() now receives an unsigned char (passing a negative plain char
// is undefined behavior).
void tokenize_lines(const vector<string>& cleanedLines) {
    for (const auto& line : cleanedLines) {
        string currentToken;
        for (size_t i = 0; i < line.size(); ++i) {
            const char ch = line[i];
            const bool isSeparator =
                ch == ';' || ch == '(' || ch == ')' || ch == '{' || ch == '}' ||
                ch == '[' || ch == ']' || ch == '<' || ch == '>' || ch == '#';

            if (isspace(static_cast<unsigned char>(ch)) || isSeparator) {
                // Flush any token accumulated so far.
                if (!currentToken.empty()) {
                    tokenizedLines.push_back(currentToken);
                    currentToken.clear();
                }
                // Separator characters are tokens in their own right.
                if (isSeparator) {
                    tokenizedLines.push_back(string(1, ch));
                }
            }
            else {
                currentToken += ch;
            }
        }
        if (!currentToken.empty()) {
            tokenizedLines.push_back(currentToken);
        }
    }

    cout << "Tokens in line: " << endl;
    for (const auto& tok : tokenizedLines) {
        cout << " < " << tok << " > ";
    }
    cout << endl << endl << endl;
}

// DFA check for this language's identifiers. Accepting state is 3, which is
// only reachable after an underscore — so a valid identifier must contain at
// least one '_' (e.g. "var_1", "_x"); any other character rejects outright.
// Categories: 0 = letter, 1 = digit, 2 = underscore, 3 = other.
bool identifier_scanner(const string& token) {
    static const int kTransitions[4][4] = {
        {2, 2, 1, -1},  // 0: start
        {3, 3, 3, -1},  // 1: leading underscore seen -> accepting next
        {2, 2, 3, -1},  // 2: letters/digits only so far
        {3, 3, 3, -1}   // 3: accepting (an underscore has appeared)
    };

    int current = 0;
    for (char ch : token) {
        int category;
        if ((ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <= 'Z')) {
            category = 0;
        } else if (ch >= '0' && ch <= '9') {
            category = 1;
        } else if (ch == '_') {
            category = 2;
        } else {
            category = 3;
        }

        current = kTransitions[current][category];
        if (current == -1) {
            return false;
        }
    }

    return current == 3;
}
// DFA check for numeric constants: optionally signed integers ("123", "+7"),
// decimals ("5.0"), and scientific notation ("3.43433E+13").
// Accepting states: 2 (integer digits), 4 (fraction digits), 6 (exponent digits).
// Categories: 0 = sign, 1 = digit, 2 = '.', 3 = e/E, 4 = other.
bool constant_scanner(const string& token) {
    static const int kTable[7][5] = {
        {1, 2, -1, -1, -1},   // 0: start            (sign | digit)
        {-1, 2, -1, -1, -1},  // 1: after sign       (digit)
        {-1, 2, 3, 5, -1},    // 2: integer part     (digit | '.' | e/E)
        {-1, 4, -1, -1, -1},  // 3: after '.'        (digit)
        {-1, 4, -1, 5, -1},   // 4: fraction part    (digit | e/E)
        {6, 6, -1, -1, -1},   // 5: after e/E        (sign | digit)
        {-1, 6, -1, -1, -1},  // 6: exponent digits  (digit)
    };

    int current = 0;
    for (char ch : token) {
        int category;
        if (ch == '+' || ch == '-') {
            category = 0;
        } else if (ch >= '0' && ch <= '9') {
            category = 1;
        } else if (ch == '.') {
            category = 2;
        } else if (ch == 'e' || ch == 'E') {
            category = 3;
        } else {
            category = 4;
        }

        current = kTable[current][category];
        if (current == -1) {
            return false;
        }
    }

    return current == 2 || current == 4 || current == 6;
}
// DFA check for this language's operators. Single-character accepts:
// * / % + - : . Two/three-character accepts include != <> << ++ -- >> && ||
// :: == =< => =+ and =:=. A lone =, !, <, >, & or | is rejected (per the
// transition table below — unchanged from the original design).
//
// Bug fix: the character was cast with static_cast<int>, so a plain char
// holding a byte > 127 (negative on most platforms) indexed the [256] table
// out of bounds (undefined behavior). Cast through unsigned char instead.
bool operator_scanner(const string& token) {
    enum State {
        START = 0,
        EXCLAMATION = 1,
        LESS_THAN = 2,
        EQUAL = 3,
        PLUS = 4,
        MINUS = 5,
        GREATER_THAN = 6,
        AND = 7,
        OR = 8,
        COLON = 9,
        FINAL = 10,
        FINAL_EQUAL = 11
    };

    enum Character {
        ASTERISK = '*',
        SLASH = '/',
        PERCENT = '%',
        EXCLAMATION_MARK = '!',
        LESS_THAN_MARK = '<',
        EQUAL_MARK = '=',
        PLUS_MARK = '+',
        MINUS_MARK = '-',
        GREATER_THAN_MARK = '>',
        AND_MARK = '&',
        OR_MARK = '|',
        COLON_MARK = ':',
        INVALID_CHAR = -1
    };

    // 0 in the table means "no transition" (reject).
    int transition_table[12][256] = { 0 };

    transition_table[START][ASTERISK] = FINAL;
    transition_table[START][SLASH] = FINAL;
    transition_table[START][PERCENT] = FINAL;
    transition_table[START][EXCLAMATION_MARK] = EXCLAMATION;
    transition_table[START][LESS_THAN_MARK] = LESS_THAN;
    transition_table[START][EQUAL_MARK] = EQUAL;
    transition_table[START][PLUS_MARK] = PLUS;
    transition_table[START][MINUS_MARK] = MINUS;
    transition_table[START][GREATER_THAN_MARK] = GREATER_THAN;
    transition_table[START][AND_MARK] = AND;
    transition_table[START][OR_MARK] = OR;
    transition_table[START][COLON_MARK] = COLON;

    transition_table[EXCLAMATION][EQUAL_MARK] = FINAL;
    transition_table[LESS_THAN][GREATER_THAN_MARK] = FINAL;
    transition_table[LESS_THAN][LESS_THAN_MARK] = FINAL;
    transition_table[EQUAL][COLON_MARK] = FINAL_EQUAL;
    transition_table[EQUAL][PLUS_MARK] = FINAL;
    transition_table[EQUAL][LESS_THAN_MARK] = FINAL;
    transition_table[EQUAL][EQUAL_MARK] = FINAL;
    transition_table[EQUAL][GREATER_THAN_MARK] = FINAL;
    transition_table[PLUS][PLUS_MARK] = FINAL;
    transition_table[MINUS][MINUS_MARK] = FINAL;
    transition_table[GREATER_THAN][GREATER_THAN_MARK] = FINAL;
    transition_table[AND][AND_MARK] = FINAL;
    transition_table[OR][OR_MARK] = FINAL;
    transition_table[COLON][COLON_MARK] = FINAL;
    transition_table[FINAL_EQUAL][EQUAL_MARK] = FINAL;

    int state = START;

    for (char ch : token) {
        // unsigned char keeps the index in [0, 255].
        int char_code = static_cast<unsigned char>(ch);

        if (transition_table[state][char_code] == 0) {
            return false;
        }

        state = transition_table[state][char_code];
    }

    // '+', '-' and ':' are accepting on their own; everything else must
    // have reached FINAL.
    return (state == FINAL || state == PLUS || state == MINUS || state == COLON);
}
// Accepts exactly one of the single-character punctuators:
// [ ] { } < > ( ) ; ,  — any other token (including multi-character ones)
// is rejected.
//
// Bug fix: the character was cast with static_cast<int>, so a plain char
// holding a negative value indexed the [256] table out of bounds (undefined
// behavior). Cast through unsigned char instead.
bool punctuator_scanner(const string& token) {
    enum State {
        START = 0,
        FINAL = 1
    };

    enum Character {
        OPEN_BRACKET = '[',
        CLOSE_BRACKET = ']',
        OPEN_CURLY = '{',
        CLOSE_CURLY = '}',
        LESS_THAN = '<',
        GREATER_THAN = '>',
        OPEN_PAREN = '(',
        CLOSE_PAREN = ')',
        SEMICOLON = ';',
        COMMA = ',',
        INVALID_CHAR = -1
    };

    // 0 = reject, FINAL = accept.
    int transition_table[2][256] = { 0 };

    transition_table[START][OPEN_BRACKET] = FINAL;
    transition_table[START][CLOSE_BRACKET] = FINAL;
    transition_table[START][OPEN_CURLY] = FINAL;
    transition_table[START][CLOSE_CURLY] = FINAL;
    transition_table[START][LESS_THAN] = FINAL;
    transition_table[START][GREATER_THAN] = FINAL;
    transition_table[START][OPEN_PAREN] = FINAL;
    transition_table[START][CLOSE_PAREN] = FINAL;
    transition_table[START][SEMICOLON] = FINAL;
    transition_table[START][COMMA] = FINAL;

    // Punctuators are always exactly one character.
    if (token.size() != 1) {
        return false;
    }

    // unsigned char keeps the index in [0, 255].
    int char_code = static_cast<unsigned char>(token[0]);
    return transition_table[START][char_code] == FINAL;
}
// Catch-all for single characters not claimed by any earlier scanner in
// fa_scanner() (keywords, identifiers, literals, constants, operators,
// punctuators are all tried first).
//
// Fix: the original built a 2x256 "transition table" but only ever read
// transition_table[START][1], which was unconditionally VALID — so the
// observable behavior was exactly `token.size() == 1`. The dead scaffolding
// is removed; behavior is unchanged.
bool special_character_scanner(const string& token) {
    return token.size() == 1;
}
// Returns true when the token is one of this language's keywords
// (C++ keywords plus project-specific ones like "loop"/"agar"/"magar" and
// common names such as "cout"/"cin"/"main").
//
// Fixes vs. the original: the per-character loop kept a `state` variable
// that was never updated (a dead state machine) — the effective behavior
// was "every character is alphabetic AND the token is in the set", which is
// preserved here. Also, isalpha() now receives an unsigned char (passing a
// negative plain char is undefined behavior).
bool keyword_scanner(const string& token) {
    static const unordered_set<string> keywords = {
        "loop", "agar", "magar", "asm", "else", "new", "this", "auto", "enum", "operator",
        "throw", "bool", "explicit", "private", "true", "break", "export", "protected",
        "try", "case", "extern", "public", "typedef", "catch", "false", "register",
        "typeid", "char", "float", "typename", "class", "for", "return", "union",
        "const", "friend", "short", "unsigned", "goto", "signed", "using", "continue",
        "if", "sizeof", "virtual", "default", "inline", "static", "void", "delete",
        "int", "volatile", "do", "long", "struct", "double", "mutable", "switch",
        "while", "namespace",

        "include", "iostream", "boolean", "std", "main", "string", "cout", "cin", "endl"
    };

    if (token.empty()) {
        return false;
    }

    // All keywords are purely alphabetic; reject anything else early.
    for (char ch : token) {
        if (!isalpha(static_cast<unsigned char>(ch))) {
            return false;
        }
    }

    return keywords.find(token) != keywords.end();
}
// DFA check for string ("...") and character ('...') literals. The token
// must start with a quote and end on the matching closing quote; an
// unterminated literal (e.g. "\"abc") is rejected because the DFA never
// reaches VALID.
//
// Bug fix: the table was indexed with a plain char — a byte > 127 is
// negative on most platforms and read out of bounds (undefined behavior).
// Index through unsigned char instead.
bool literal_scanner(const string& token) {

    enum State {
        START = 0,
        IN_STRING = 1,
        IN_CHAR = 2,
        INVALID = -1,
        VALID = 3
    };

    int transitionTable[4][256] = { 0 };

    transitionTable[START]['\"'] = IN_STRING;
    transitionTable[START]['\''] = IN_CHAR;
    transitionTable[IN_STRING]['\"'] = VALID;
    transitionTable[IN_CHAR]['\''] = VALID;

    // Defaults: any non-quote character is invalid from START but stays
    // inside an open string/char literal.
    for (int i = 0; i < 256; i++) {
        if (transitionTable[START][i] == 0) transitionTable[START][i] = INVALID;
        if (transitionTable[IN_STRING][i] == 0) transitionTable[IN_STRING][i] = IN_STRING;
        if (transitionTable[IN_CHAR][i] == 0) transitionTable[IN_CHAR][i] = IN_CHAR;
    }

    int state = START;

    for (char ch : token) {
        // unsigned char keeps the index in [0, 255].
        state = transitionTable[state][static_cast<unsigned char>(ch)];

        if (state == INVALID) {
            return false;
        }
    }

    return state == VALID;
}
// Streams one labelled token category to both stdout and the given file
// stream, matching the original output format exactly.
static void report_category(const string& label,
                            const unordered_set<string>& tokens,
                            ostream& fileOut) {
    cout << label;
    fileOut << label;
    for (const auto& tok : tokens) {
        cout << tok << " ";
        fileOut << tok << " ";
    }
    cout << endl;
    fileOut << endl;
}

// Classifies every token in the global `tokenizedLines` into the global
// category sets, then reports each category to stdout and token.txt, and
// unclassified tokens to stdout and errors.txt.
//
// The scanner order matters: keywords are tried before identifiers, literals
// before constants, etc. — the first scanner that accepts a token wins.
//
// Fix vs. the original: the seven near-identical print loops are collapsed
// into the report_category() helper above; output is unchanged.
void fa_scanner() {
    ofstream fout("errors.txt");
    ofstream fout_tokens("token.txt");

    for (const auto& token : tokenizedLines) {
        if (keyword_scanner(token)) {
            found_keywords.insert(token);
        }
        else if (identifier_scanner(token)) {
            found_identifiers.insert(token);
        }
        else if (literal_scanner(token)) {
            found_literals.insert(token);
        }
        else if (constant_scanner(token)) {
            found_constants.insert(token);
        }
        else if (operator_scanner(token)) {
            found_operators.insert(token);
        }
        else if (punctuator_scanner(token)) {
            found_punctuators.insert(token);
        }
        else if (special_character_scanner(token)) {
            found_special_characters.insert(token);
        }
        else {
            errors.push_back(token);
        }
    }

    report_category("Identifiers: ", found_identifiers, fout_tokens);
    report_category("Constants: ", found_constants, fout_tokens);
    report_category("Operators: ", found_operators, fout_tokens);
    report_category("Punctuators: ", found_punctuators, fout_tokens);
    report_category("keywords: ", found_keywords, fout_tokens);
    report_category("Literals: ", found_literals, fout_tokens);
    report_category("Special Characters: ", found_special_characters, fout_tokens);

    // Errors live in a vector (insertion order preserved) and go to
    // errors.txt rather than token.txt.
    cout << "Errors Invalid Characters: ";
    fout << "Errors Invalid Characters: ";
    for (const auto& error : errors) {
        cout << error << " ";
        fout << error << " ";
    }
    cout << endl;
    fout << endl;
}

// Entry point: loads the input program (from Sourcecode.txt by default, or
// from the embedded sample below), then runs the pipeline
// clean -> tokenize -> classify.
int main() {
    // Embedded sample program, used only when file input is disabled.
    local_data = R"(
# include < iostream >
# include < string >
# include < boolean >
using namespace std ;
int main ( )
{
//hello this is a comment
std :: int var_1 = 5.0 * 10 & 6 ;
double _var_2 = 3.43433E+13 ; //hello this is a comment
char @character = 'a' ;
int _va%r_3_ = var_1 + _var_2 ;
cout << var_1 + _var_2 << "HELLO" << endl ;
}
)";

    // Flip to false to scan the embedded sample instead of Sourcecode.txt.
    const bool readFromFile = true;

    if (readFromFile) {
        load_data();
    }
    else {
        load_data_from_string();
    }

    process_lines(linesFromDataFile);
    tokenize_lines(cleanedLines);
    fa_scanner();

    return 0;
}

You might also like