0% found this document useful (0 votes)

5 views · 4 pages

Mid Term Project

The document contains a C++ program for a tokenizer that processes a line of C++ code and identifies various tokens such as keywords, operators, punctuation, comments, and literals. It defines a structure for tokens and includes functions to check for keywords, operators, punctuation, and to tokenize the input code. The main function prompts the user for input and displays the identified tokens.

Uploaded by

sajidtusan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

5 views · 4 pages

Mid Term Project

Uploaded by

sajidtusan

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 4

Mid-Term Project

Student ID: 41230100703

Student Name: Sajid Hossain Tusan
Course Name: Compiler Design
Course Code: CSE3272
Code:
#include <iostream>
#include <vector>
#include <string>
#include <cctype>

using namespace std;

// One lexical token as returned by tokenize().
struct Token {
    std::string value;  // the token's text, copied from the input
    std::string type;   // category label such as "Keyword", "Operator" or "Identifier"
};

// Basic list of the C++ keywords that isKeyword() recognises.
const std::string keywordList[] = {
    "int",    "float", "if",     "else", "while", "for",
    "return", "char",  "double", "bool", "void",  "class"
};

// Number of entries in keywordList, computed from the array's size.
const int keywordCount = sizeof(keywordList) / sizeof(keywordList[0]);

// Returns true when `word` is exactly equal (case-sensitive) to one of the
// entries in keywordList, false otherwise.
bool isKeyword(const std::string &word) {
    for (const std::string &candidate : keywordList) {
        if (candidate == word) {
            return true;
        }
    }
    return false;
}

// Check if a character is a single-character operator symbol.
//
// Accepts the arithmetic symbols (+ - * / %), assignment (=), the relational
// symbols (< >), the logical/bitwise symbols (! & | ^ ~) and the conditional
// symbol (?). Multi-character operators such as "==" or "&&" are not a
// concern of this function; it only classifies one character at a time.
//
// Returns true if `ch` is one of those symbols, false otherwise.
bool isOperator(char ch) {
    switch (ch) {
        case '+': case '-': case '*': case '/': case '%':
        case '=': case '<': case '>':
        case '!': case '&': case '|': case '^': case '~':
        case '?':
            return true;
        default:
            return false;
    }
}

// Check if a character is punctuation.
// Returns true for ';', ',', ':' and '.', false for every other character.
bool isPunctuation(char ch) {
    switch (ch) {
        case ';':
        case ',':
        case ':':
        case '.':
            return true;
        default:
            return false;
    }
}

// Check if a character is a parenthesis.
// Returns true for round, curly and square brackets (opening or closing),
// false for every other character.
bool isParenthesis(char ch) {
    static const char brackets[] = {'(', ')', '{', '}', '[', ']'};
    for (char bracket : brackets) {
        if (bracket == ch) {
            return true;
        }
    }
    return false;
}

// Check if a string is a number.
//
// Returns true only when `s` is non-empty and every character is a decimal
// digit. Signs, decimal points and exponents are not accepted, so "-5" and
// "3.14" both yield false.
bool isNumber(const std::string &s) {
    if (s.empty()) {
        return false;
    }
    for (char ch : s) {
        // The <cctype> classifiers are only defined for values representable
        // as unsigned char (or EOF); a plain char may be negative for
        // non-ASCII bytes, so convert before calling isdigit.
        if (!std::isdigit(static_cast<unsigned char>(ch))) {
            return false;
        }
    }
    return true;
}
// Main tokenizer function.
//
// Scans `code` from left to right and returns the tokens found, in order of
// appearance. Whitespace separates tokens and is never emitted. Each token's
// `type` is one of:
//   "Preprocessor Directive" - from '#' up to (not including) the next newline
//   "Single-line Comment"    - from "//" up to (not including) the next newline
//   "Multi-line Comment"     - from "/*" through the matching "*/"; if the
//                              comment is never closed, the rest of the input
//                              is taken verbatim
//   "String Literal"         - double-quoted text, including both quotes
//   "Character Literal"      - single-quoted text, including both quotes
//   "Operator", "Punctuation", "Parenthesis" - one character each, as
//                              classified by isOperator / isPunctuation /
//                              isParenthesis
//   "Keyword", "Number", "Identifier" - a run of letters, digits and '_',
//                              classified by isKeyword, then isNumber
//   "Unknown"                - any other single character
//
// Inside string and character literals a backslash escapes the following
// character, so an escaped quote does not end the literal. A literal that is
// never closed extends to the end of the input.
std::vector<Token> tokenize(const std::string &code) {
    std::vector<Token> tokens;
    const std::size_t n = code.length();
    std::size_t i = 0;  // unsigned index: avoids signed/unsigned comparison with n

    // The <cctype> classifiers are only defined for values representable as
    // unsigned char, so plain char values are converted before each call.
    const auto isSpaceChar = [](char c) {
        return std::isspace(static_cast<unsigned char>(c)) != 0;
    };
    const auto isWordChar = [](char c) {
        return std::isalnum(static_cast<unsigned char>(c)) != 0 || c == '_';
    };

    // Reads a quoted literal whose opening quote is at code[i] and advances i
    // past it. Returns the literal text including the quotes that were
    // actually present in the input.
    const auto readQuoted = [&](char quote) {
        std::string literal(1, code[i++]);  // opening quote
        while (i < n && code[i] != quote) {
            if (code[i] == '\\' && i + 1 < n) {
                literal += code[i++];  // keep the backslash; the escaped char follows
            }
            literal += code[i++];
        }
        if (i < n) {
            literal += code[i++];  // closing quote
        }
        return literal;
    };

    while (i < n) {
        const char ch = code[i];

        // Skip spaces
        if (isSpaceChar(ch)) {
            ++i;
            continue;
        }

        // Handle preprocessor directives
        if (ch == '#') {
            std::string directive;
            while (i < n && code[i] != '\n') {
                directive += code[i++];
            }
            tokens.push_back({directive, "Preprocessor Directive"});
            continue;
        }

        // Handle comments
        if (ch == '/' && i + 1 < n) {
            if (code[i + 1] == '/') {
                // A line comment ends at the newline, like a directive does.
                std::string comment;
                while (i < n && code[i] != '\n') {
                    comment += code[i++];
                }
                tokens.push_back({comment, "Single-line Comment"});
                continue;
            }
            if (code[i + 1] == '*') {
                // Search for the terminator after the opening "/*" so that
                // "/*/" is not mistaken for a closed comment.
                const std::size_t close = code.find("*/", i + 2);
                const std::size_t end = (close == std::string::npos) ? n : close + 2;
                tokens.push_back({code.substr(i, end - i), "Multi-line Comment"});
                i = end;
                continue;
            }
        }

        // Handle string literals
        if (ch == '"') {
            tokens.push_back({readQuoted('"'), "String Literal"});
            continue;
        }

        // Handle character literals
        if (ch == '\'') {
            tokens.push_back({readQuoted('\''), "Character Literal"});
            continue;
        }

        // Handle operators
        if (isOperator(ch)) {
            tokens.push_back({std::string(1, ch), "Operator"});
            ++i;
            continue;
        }

        // Handle punctuation
        if (isPunctuation(ch)) {
            tokens.push_back({std::string(1, ch), "Punctuation"});
            ++i;
            continue;
        }

        // Handle parentheses
        if (isParenthesis(ch)) {
            tokens.push_back({std::string(1, ch), "Parenthesis"});
            ++i;
            continue;
        }

        // Handle identifiers, keywords, and numbers
        if (isWordChar(ch)) {
            std::string word;
            while (i < n && isWordChar(code[i])) {
                word += code[i++];
            }

            if (isKeyword(word)) {
                tokens.push_back({word, "Keyword"});
            } else if (isNumber(word)) {
                tokens.push_back({word, "Number"});
            } else {
                tokens.push_back({word, "Identifier"});
            }
            continue;
        }

        // Unknown character
        tokens.push_back({std::string(1, ch), "Unknown"});
        ++i;
    }

    return tokens;
}

// Print tokens
void displayTokens(const vector<Token> &tokens) {
cout << "\nTokens Found:\n";
for (const auto &t : tokens) {
cout << t.value << " -> " << t.type << endl;
}
}

int main() {
string line;
cout << "Enter a line of C++ code:\n";
getline(cin, line);

vector<Token> tokens = tokenize(line);

displayTokens(tokens);

return 0;
}

Cross Platform Game Programming
100% (4)
Cross Platform Game Programming
481 pages
Cs-603 Activity: Abca-1 (Coding/Debugging) Compiler: Name - Divyansh Sharma Roll No. - 0905cs211055
No ratings yet
Cs-603 Activity: Abca-1 (Coding/Debugging) Compiler: Name - Divyansh Sharma Roll No. - 0905cs211055
6 pages
Tokencc C
No ratings yet
Tokencc C
4 pages
Compiler Practical File
No ratings yet
Compiler Practical File
33 pages
21BAI1213 - Abhinav V - Experiment-2
No ratings yet
21BAI1213 - Abhinav V - Experiment-2
11 pages
C2ex Java
No ratings yet
C2ex Java
6 pages
3
No ratings yet
3
3 pages
CD 1
No ratings yet
CD 1
31 pages
CC Lab 1-2
No ratings yet
CC Lab 1-2
6 pages
Rajat Prasad CD File
No ratings yet
Rajat Prasad CD File
39 pages
من المفترض ان ده حل الكويز بس بيقع في كذا تيست
No ratings yet
من المفترض ان ده حل الكويز بس بيقع في كذا تيست
4 pages
Week 2a &2B
No ratings yet
Week 2a &2B
6 pages
Compiler Design Practical File
No ratings yet
Compiler Design Practical File
12 pages
2
No ratings yet
2
6 pages
Cdjavacodes
No ratings yet
Cdjavacodes
23 pages
Sslab 2
No ratings yet
Sslab 2
6 pages
Compiler Design Lab
No ratings yet
Compiler Design Lab
49 pages
Lab2 CD 22BLC1161
No ratings yet
Lab2 CD 22BLC1161
9 pages
Java8Stepwise2 JJ
No ratings yet
Java8Stepwise2 JJ
28 pages
Lexer
No ratings yet
Lexer
6 pages
Sec B
No ratings yet
Sec B
43 pages
Compiler
No ratings yet
Compiler
7 pages
Infix To Postfix Code
No ratings yet
Infix To Postfix Code
7 pages
CD File - Merged
No ratings yet
CD File - Merged
52 pages
Lab Assig 2021
No ratings yet
Lab Assig 2021
41 pages
Pranjal
No ratings yet
Pranjal
32 pages
Name:atif Ali Enrollment: (01-134191-008)
No ratings yet
Name:atif Ali Enrollment: (01-134191-008)
15 pages
Compiler Design Lab ASSESMENT 1 22BCE0411
No ratings yet
Compiler Design Lab ASSESMENT 1 22BCE0411
13 pages
22BLC1161 LexicalAnalyser
No ratings yet
22BLC1161 LexicalAnalyser
25 pages
Ornek Scanner Parser
No ratings yet
Ornek Scanner Parser
44 pages
A
No ratings yet
A
4 pages
Scanner Solution
No ratings yet
Scanner Solution
4 pages
CompilerConsLab Pranjal
No ratings yet
CompilerConsLab Pranjal
11 pages
Project Report
No ratings yet
Project Report
16 pages
2020CS409 Lab Manual
No ratings yet
2020CS409 Lab Manual
105 pages
Program For Lexical Analyser
No ratings yet
Program For Lexical Analyser
5 pages
Chapter 8 Excercise 2
No ratings yet
Chapter 8 Excercise 2
1 page
CD Lab Manual - Word
No ratings yet
CD Lab Manual - Word
42 pages
Compiler Project
No ratings yet
Compiler Project
16 pages
Program No. - 3: Write A Program To Find Different Tokens in A Program
No ratings yet
Program No. - 3: Write A Program To Find Different Tokens in A Program
3 pages
Experiments
No ratings yet
Experiments
5 pages
CD Lab Manual File
No ratings yet
CD Lab Manual File
27 pages
Compiler Construction Assignment
No ratings yet
Compiler Construction Assignment
7 pages
System Software and Compiler Lab: Token Separation
No ratings yet
System Software and Compiler Lab: Token Separation
5 pages
CD Lab File
No ratings yet
CD Lab File
45 pages
CD Lab Manual
No ratings yet
CD Lab Manual
37 pages
Compiler Design Lab
No ratings yet
Compiler Design Lab
27 pages
Compiler Design & Construction Term Project: Part 1
No ratings yet
Compiler Design & Construction Term Project: Part 1
10 pages
Ccfile
No ratings yet
Ccfile
44 pages
CC Lab 1-4
No ratings yet
CC Lab 1-4
13 pages
CD Lab
No ratings yet
CD Lab
36 pages
Compiler Lab Print Merged
No ratings yet
Compiler Lab Print Merged
45 pages
Microsoft Word - Lab - Compiler
No ratings yet
Microsoft Word - Lab - Compiler
5 pages
Stack
No ratings yet
Stack
5 pages
Lexical Analysis of Compiler
No ratings yet
Lexical Analysis of Compiler
13 pages
Dfa Simulation
No ratings yet
Dfa Simulation
5 pages
CC Lab
No ratings yet
CC Lab
54 pages
Algorithm - Assig#3
No ratings yet
Algorithm - Assig#3
8 pages
EX:No: 1A Implementation of Token Separation
No ratings yet
EX:No: 1A Implementation of Token Separation
4 pages
CD
No ratings yet
CD
11 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
DOC1 Overview: An Introduction For Programmers
No ratings yet
DOC1 Overview: An Introduction For Programmers
23 pages
OCS353-Data Science Fundamentals Manual 1 - PDF
No ratings yet
OCS353-Data Science Fundamentals Manual 1 - PDF
6 pages
ABAP Chapter 3: Open SQL Internal Table
No ratings yet
ABAP Chapter 3: Open SQL Internal Table
101 pages
SS Lab Programs
No ratings yet
SS Lab Programs
34 pages
AWS Partner - Generative AI On AWS - Sales Guide
No ratings yet
AWS Partner - Generative AI On AWS - Sales Guide
4 pages
Handling Shutdown Situations - Not A Tame Lion
No ratings yet
Handling Shutdown Situations - Not A Tame Lion
4 pages
Java OOP ch1
No ratings yet
Java OOP ch1
14 pages
IPT 102 Module 1
No ratings yet
IPT 102 Module 1
14 pages
Lec02 Script M File Array
No ratings yet
Lec02 Script M File Array
40 pages
Chapter02-02 Database Design - Transforming ERD Into Relation
No ratings yet
Chapter02-02 Database Design - Transforming ERD Into Relation
42 pages
Complete RISE The Journey of A Young Entrepreneur
No ratings yet
Complete RISE The Journey of A Young Entrepreneur
56 pages
No ratings yet
10 pages
Exemples Code VB PDF
No ratings yet
Exemples Code VB PDF
2 pages
(Ebook PDF) Starting Out With C++: From Control Structures Through Objects, Brief Version 8th Edition Download
100% (1)
(Ebook PDF) Starting Out With C++: From Control Structures Through Objects, Brief Version 8th Edition Download
53 pages
Do While Loop in C
No ratings yet
Do While Loop in C
3 pages
The C Programming Language
No ratings yet
The C Programming Language
20 pages
E-Health Care Management
No ratings yet
E-Health Care Management
92 pages
Library Management System Final Report
No ratings yet
Library Management System Final Report
38 pages
Core Java Operators Practice Questions
No ratings yet
Core Java Operators Practice Questions
10 pages
Rinki
No ratings yet
Rinki
4 pages
Comandos mySQLi
No ratings yet
Comandos mySQLi
4 pages
SQL Interview Questions With Theory Answers
No ratings yet
SQL Interview Questions With Theory Answers
26 pages
EWM Inbound Del Automatic Creation From Outbound Del (SPED Approach)
100% (1)
EWM Inbound Del Automatic Creation From Outbound Del (SPED Approach)
7 pages
Suresh11 Net
No ratings yet
Suresh11 Net
8 pages
Lecture7 Py
No ratings yet
Lecture7 Py
9 pages
A Mostly Complete Guide To Webpack 5 (2020)
No ratings yet
A Mostly Complete Guide To Webpack 5 (2020)
17 pages
Book 5
No ratings yet
Book 5
142 pages
OSDB75 Dump
No ratings yet
OSDB75 Dump
12 pages
Introduction To Embedded Systems: Edward A. Lee
No ratings yet
Introduction To Embedded Systems: Edward A. Lee
22 pages

Mid Term Project

Uploaded by

Mid Term Project

Uploaded by

Mid-Term Project

Student ID: 41230100703

using namespace std;

// Basic list of C++ keywords

// Check if a word is a keyword

// Check if a character is an operator

// Check if a character is punctuation

// Check if a character is a parenthesis

// Check if a string is a number

while (i < code.length()) {

// Handle preprocessor directives

// Handle string literals

// Handle character literals

// Handle identifiers, keywords, and numbers

vector<Token> tokens = tokenize(line);

You might also like