0% found this document useful (0 votes)

18 views3 pages

3

The document is a C program that implements a lexical analyzer for parsing and tokenizing input strings. It defines functions to identify delimiters, operators, keywords, valid identifiers, and numbers, and processes the input to extract and categorize these tokens. The main function demonstrates the lexical analyzer using a sample C code snippet.

Uploaded by

gg4480

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

18 views3 pages

3

Uploaded by

gg4480

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 3

#include <ctype.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#define MAX_LENGTH 100

/*
 * isDelimiter - report whether a character separates tokens.
 *
 * The delimiter set is: space, the arithmetic characters + - * / %,
 * the comparison/assignment characters < > =, the punctuation , ; and
 * the bracket characters ( ) [ ] { }.
 *
 * Returns true for a member of that set, false for anything else
 * (including '\0', tabs and newlines).
 */
bool isDelimiter(char chr) {
    switch (chr) {
    case ' ':
    case '+': case '-': case '*': case '/': case '%':
    case '<': case '>': case '=':
    case ',': case ';':
    case '(': case ')':
    case '[': case ']':
    case '{': case '}':
        return true;
    default:
        return false;
    }
}

/*
 * isOperator - report whether a character is one of the operator
 * characters this lexer knows about: + - * / % > < = & |
 *
 * Returns true for a member of that set, false otherwise. Note that
 * '!' is not part of the set.
 */
bool isOperator(char chr) {
    switch (chr) {
    case '+':
    case '-':
    case '*':
    case '/':
    case '%':
    case '>':
    case '<':
    case '=':
    case '&':
    case '|':
        return true;
    default:
        return false;
    }
}

/*
 * isValidIdentifier - check whether a string is a valid identifier.
 *
 * An identifier must start with a letter or underscore and may continue
 * with letters, digits or underscores.
 *
 * str: NUL-terminated string to test (may be NULL).
 *
 * Returns true when str is a non-empty identifier, false otherwise
 * (including for NULL and the empty string).
 */
bool isValidIdentifier(const char *str) {
    if (str == NULL)
        return false;

    /* <ctype.h> classifiers require a value representable as unsigned char;
     * passing a negative plain char is undefined behaviour. */
    unsigned char first = (unsigned char)str[0];
    if (!isalpha(first) && first != '_')
        return false;

    /* Walk to the terminator instead of re-evaluating strlen() every pass. */
    for (const char *p = str + 1; *p != '\0'; p++) {
        unsigned char c = (unsigned char)*p;
        if (!isalnum(c) && c != '_')
            return false;
    }

    return true;
}

/*
 * isKeyword - check whether a string is one of the 32 reserved words
 * listed in the table below.
 *
 * str: NUL-terminated string to look up.
 *
 * Returns true on an exact, case-sensitive match, false otherwise.
 */
bool isKeyword(char *str) {
    static const char *const reserved[] = {
        "auto",     "break",  "case",    "char",   "const",    "continue",
        "default",  "do",     "double",  "else",   "enum",     "extern",
        "float",    "for",    "goto",    "if",     "int",      "long",
        "register", "return", "short",   "signed", "sizeof",   "static",
        "struct",   "switch", "typedef", "union",  "unsigned", "void",
        "volatile", "while"
    };
    const size_t count = sizeof reserved / sizeof reserved[0];

    size_t idx = 0;
    while (idx < count) {
        if (strcmp(str, reserved[idx]) == 0)
            return true;
        idx++;
    }

    return false;
}

/*
 * isNumber - check whether a string is an integer or floating point
 * literal.
 *
 * Accepted form: an optional leading '-', then decimal digits with at
 * most one '.', and at least one digit overall. So "10", "-5", "3.14",
 * "5." and ".5" are numbers; "", "-", "." and "1.2.3" are not.
 *
 * str: NUL-terminated string to test (may be NULL).
 *
 * Returns true when str matches the form above, false otherwise.
 */
bool isNumber(const char *str) {
    if (str == NULL)
        return false;

    size_t i = 0;
    bool hasDecimal = false;
    bool hasDigit = false;

    if (str[0] == '-') /* Allow negative numbers */
        i++;

    for (; str[i] != '\0'; i++) {
        /* isdigit() needs an unsigned char value to stay defined. */
        unsigned char c = (unsigned char)str[i];

        if (isdigit(c)) {
            hasDigit = true;
        } else if (c == '.' && !hasDecimal) {
            hasDecimal = true; /* Allow only one decimal point */
        } else {
            return false;
        }
    }

    /* A sign and/or a decimal point alone is not a number. */
    return hasDigit;
}

/*
 * getSubstring - copy the characters str[start..end] (both inclusive)
 * into a freshly allocated, NUL-terminated string.
 *
 * str:   source string; start must not lie beyond its terminator.
 * start: index of the first character to copy (must be >= 0).
 * end:   index of the last character to copy; when end < start the
 *        result is an empty string.
 *
 * The copy stops early at the source's NUL terminator, so an end index
 * past the end of str never reads out of bounds.
 *
 * Returns a heap-allocated string the caller must free(), or NULL when
 * str is NULL, start is negative, or the allocation fails.
 */
char *getSubstring(const char *str, int start, int end) {
    if (str == NULL || start < 0)
        return NULL;

    /* end >= start >= 0 here, so the subtraction cannot overflow. */
    size_t wanted = (end >= start) ? (size_t)(end - start) + 1 : 0;

    char *subStr = malloc(wanted + 1);
    if (subStr == NULL)
        return NULL;

    const char *src = str + start;
    size_t copied = 0;
    while (copied < wanted && src[copied] != '\0') {
        subStr[copied] = src[copied];
        copied++;
    }
    subStr[copied] = '\0';

    return subStr;
}

/* True when c can begin an operator token. Adds '!' to the isOperator()
 * set so that "!" and "!=" are recognized. */
static bool lexStartsOperator(char c) {
    return c == '!' || isOperator(c);
}

/* True when the characters a,b together form a two-character operator
 * (==, !=, <=, >=, &&, ||, ++, --, ->, <<, >>, and the compound
 * assignments += -= *= /= %= &= |=). */
static bool lexIsOperatorPair(char a, char b) {
    switch (a) {
    case '+': return b == '+' || b == '=';
    case '-': return b == '-' || b == '=' || b == '>';
    case '<': return b == '<' || b == '=';
    case '>': return b == '>' || b == '=';
    case '&': return b == '&' || b == '=';
    case '|': return b == '|' || b == '=';
    case '*':
    case '/':
    case '%':
    case '=':
    case '!':
        return b == '=';
    default:
        return false;
    }
}

/* True when c terminates a word (identifier, keyword or number). This is
 * exactly the set of characters the main loop handles before it reaches
 * the word scanner, which guarantees the scanner always makes progress. */
static bool lexEndsWord(char c) {
    return c == '"' || isspace((unsigned char)c) || lexStartsOperator(c) ||
           isDelimiter(c);
}

/*
 * lexicalAnalyzer - split input into tokens and print one line per token
 * to stdout in the form "Token: <kind>, Value: <text>".
 *
 * Token kinds printed: String Literal, Operator, Delimiter, Keyword,
 * Number, Identifier, Unidentified. Whitespace and comments (both
 * "//" and block comments) produce no output.
 *
 * input: NUL-terminated text to analyze; it is only read. NULL is
 *        ignored.
 *
 * If a token copy cannot be allocated, a message is written to stderr
 * and the analysis stops.
 */
void lexicalAnalyzer(char *input) {
    if (input == NULL)
        return;

    int len = (int)strlen(input);
    int right = 0;

    while (right < len) {
        char cur = input[right];
        /* right < len, so right + 1 is at worst the NUL terminator. */
        char next = input[right + 1];

        /* Skip all whitespace, not just spaces, so tokens that follow a
         * newline or tab are not glued to it. */
        if (isspace((unsigned char)cur)) {
            right++;
            continue;
        }

        /* Handling string literals */
        if (cur == '"') {
            int left = right;
            right++;
            while (right < len && input[right] != '"') {
                /* A backslash escapes the next character, so \" does not
                 * end the literal. */
                if (input[right] == '\\' && right + 1 < len)
                    right++;
                right++;
            }
            if (right < len)
                right++; /* Include closing quote; stay at len if unterminated */

            char *strLiteral = getSubstring(input, left, right - 1);
            if (strLiteral == NULL) {
                fprintf(stderr, "lexicalAnalyzer: out of memory\n");
                return;
            }
            printf("Token: String Literal, Value: %s\n", strLiteral);
            free(strLiteral);
            continue;
        }

        /* Handling single-line and multi-line comments */
        if (cur == '/' && next == '/') {
            /* Bounds check first, then read. The newline itself is left
             * for the whitespace skip above. */
            while (right < len && input[right] != '\n')
                right++;
            continue;
        }
        if (cur == '/' && next == '*') {
            right += 2;
            while (right < len &&
                   !(input[right] == '*' && input[right + 1] == '/'))
                right++;
            /* Step over the closing marker, or stop at the end of input
             * when the comment is unterminated. */
            right = (right < len) ? right + 2 : len;
            continue;
        }

        /* Operators: join two characters only when they form a real
         * two-character operator, so "a=-1" yields "=" and "-". */
        if (lexStartsOperator(cur)) {
            if (lexIsOperatorPair(cur, next)) {
                printf("Token: Operator, Value: %c%c\n", cur, next);
                right += 2;
            } else {
                printf("Token: Operator, Value: %c\n", cur);
                right++;
            }
            continue;
        }

        /* Remaining delimiters (spaces were consumed above) */
        if (isDelimiter(cur)) {
            printf("Token: Delimiter, Value: %c\n", cur);
            right++;
            continue;
        }

        /* Processing words (identifiers, keywords, numbers) */
        int left = right;
        while (right < len && !lexEndsWord(input[right]))
            right++;

        char *subStr = getSubstring(input, left, right - 1);
        if (subStr == NULL) {
            fprintf(stderr, "lexicalAnalyzer: out of memory\n");
            return;
        }

        if (isKeyword(subStr))
            printf("Token: Keyword, Value: %s\n", subStr);
        else if (isNumber(subStr))
            printf("Token: Number, Value: %s\n", subStr);
        else if (isValidIdentifier(subStr))
            printf("Token: Identifier, Value: %s\n", subStr);
        else
            printf("Token: Unidentified, Value: %s\n", subStr);

        free(subStr);
    }
}

/*
 * main - demonstrate the lexical analyzer on a fixed C snippet: print
 * the snippet, then print its tokens.
 *
 * Returns 0.
 */
int main(void) {
    /* The literal is split with adjacent-string concatenation; a raw line
     * break inside a string literal does not compile. The array is sized
     * by its initializer so editing the sample cannot overflow a fixed
     * bound. */
    char lex_input[] =
        "int main() { int a = 10, b = 20; float c = 3.14; "
        "if (a >= b) printf(\"Hello World!\"); return 0; }";

    printf("For Expression:\n%s\n\n", lex_input);

    lexicalAnalyzer(lex_input);

    return 0;
}

Assembly - Fundamentals of ALP
100% (1)
Assembly - Fundamentals of ALP
51 pages
Op
No ratings yet
Op
259 pages
Car Washing Management System
100% (2)
Car Washing Management System
21 pages
SRWE Module 5
100% (1)
SRWE Module 5
52 pages
Credit Card Fraud Analysis Project Documentation
No ratings yet
Credit Card Fraud Analysis Project Documentation
101 pages
Log
No ratings yet
Log
467 pages
Python Binary Files
No ratings yet
Python Binary Files
8 pages
Boyle ccs4 HW 03
No ratings yet
Boyle ccs4 HW 03
14 pages
CD Assignment-2
No ratings yet
CD Assignment-2
16 pages
Ipq 6000
No ratings yet
Ipq 6000
68 pages
CiTRANS 660 Troubleshooting Guide
No ratings yet
CiTRANS 660 Troubleshooting Guide
148 pages
CD Lab Manual
No ratings yet
CD Lab Manual
68 pages
DEEPAK CD File
No ratings yet
DEEPAK CD File
62 pages
CD Lab Krish
No ratings yet
CD Lab Krish
33 pages
Teja CD Record
No ratings yet
Teja CD Record
33 pages
CD File - Merged
No ratings yet
CD File - Merged
52 pages
CD Lab Manual
No ratings yet
CD Lab Manual
37 pages
4th Sem Syllabus
No ratings yet
4th Sem Syllabus
67 pages
CD Lab
No ratings yet
CD Lab
36 pages
CD Lab Manual
No ratings yet
CD Lab Manual
71 pages
Cdlab UPDATED
No ratings yet
Cdlab UPDATED
43 pages
CD Lab File
No ratings yet
CD Lab File
45 pages
R20 CD Lab Manual
No ratings yet
R20 CD Lab Manual
43 pages
Pranjal
No ratings yet
Pranjal
32 pages
CD 1 To 11 Practical
No ratings yet
CD 1 To 11 Practical
34 pages
CD Lab Manual
No ratings yet
CD Lab Manual
31 pages
Ex: 1.a Program To Recognize A Few Patterns in C Aim
No ratings yet
Ex: 1.a Program To Recognize A Few Patterns in C Aim
28 pages
Important Programs
No ratings yet
Important Programs
20 pages
Expl Prgrms
No ratings yet
Expl Prgrms
23 pages
Lexical Analyser in C++ - ASHWATH KV - 106120017 For Full Code
No ratings yet
Lexical Analyser in C++ - ASHWATH KV - 106120017 For Full Code
4 pages
CD 1
No ratings yet
CD 1
31 pages
STQA Unit I
No ratings yet
STQA Unit I
18 pages
Principles of Compiler Construction Lab File NSUT
No ratings yet
Principles of Compiler Construction Lab File NSUT
31 pages
CD Lab Answers
No ratings yet
CD Lab Answers
19 pages
CD Lab Prgms Final
No ratings yet
CD Lab Prgms Final
42 pages
CD Lab Programs
No ratings yet
CD Lab Programs
43 pages
Compiler Design Lab Manual
No ratings yet
Compiler Design Lab Manual
51 pages
Compiler Design Labs
No ratings yet
Compiler Design Labs
25 pages
CD Lab
No ratings yet
CD Lab
27 pages
Gigabyte Gv-R67xtgaming Oc-12gd Rev 1.0
No ratings yet
Gigabyte Gv-R67xtgaming Oc-12gd Rev 1.0
42 pages
Write A C Program To Identify Different Types of Tokens in A Given Program
No ratings yet
Write A C Program To Identify Different Types of Tokens in A Given Program
46 pages
Cybersecurity
No ratings yet
Cybersecurity
20 pages
Cdlabmanual
No ratings yet
Cdlabmanual
19 pages
SESlides 5
No ratings yet
SESlides 5
21 pages
Lab 3 and 4
No ratings yet
Lab 3 and 4
12 pages
CITY CD Lab
No ratings yet
CITY CD Lab
50 pages
Class 5 - 2D Maxima Sweep-Line Algorithm
No ratings yet
Class 5 - 2D Maxima Sweep-Line Algorithm
28 pages
CD Lab Manual - Word
No ratings yet
CD Lab Manual - Word
42 pages
Compiler Design Practical File
No ratings yet
Compiler Design Practical File
12 pages
Ex: 1.a Program To Recognize A Few Patterns in C Aim
No ratings yet
Ex: 1.a Program To Recognize A Few Patterns in C Aim
15 pages
CD Lab1
No ratings yet
CD Lab1
8 pages
Chapter 2 Dit
No ratings yet
Chapter 2 Dit
17 pages
CC Assignment#3 Lexical AnalyzerC++ M.shayan 1755-2020 Muhammad Hassan
No ratings yet
CC Assignment#3 Lexical AnalyzerC++ M.shayan 1755-2020 Muhammad Hassan
13 pages
3rd Semester Syllabus
No ratings yet
3rd Semester Syllabus
9 pages
Compiler Design Lab
No ratings yet
Compiler Design Lab
27 pages
Programm 1
No ratings yet
Programm 1
8 pages
CD Lab Manual Final
No ratings yet
CD Lab Manual Final
51 pages
EXP1
No ratings yet
EXP1
6 pages
2
No ratings yet
2
6 pages
Assignment 2
No ratings yet
Assignment 2
4 pages
DotnetConf2019HCMC NETCore3
No ratings yet
DotnetConf2019HCMC NETCore3
11 pages
CSE425 Assignment
No ratings yet
CSE425 Assignment
5 pages
CD 1
No ratings yet
CD 1
18 pages
Pathakexp 4
No ratings yet
Pathakexp 4
5 pages
Experiment No 1
No ratings yet
Experiment No 1
4 pages
Installation Guide Windows
No ratings yet
Installation Guide Windows
6 pages
Experiments
No ratings yet
Experiments
5 pages
CD Lab5
No ratings yet
CD Lab5
6 pages
Assignment 4
No ratings yet
Assignment 4
3 pages
Token Sep
No ratings yet
Token Sep
3 pages
CD Assignments
No ratings yet
CD Assignments
7 pages
Praneet 43 Spccexp 1
No ratings yet
Praneet 43 Spccexp 1
4 pages
Compiler Design: Department of Computer Science & Faculty of Engineering
No ratings yet
Compiler Design: Department of Computer Science & Faculty of Engineering
27 pages
HTML - Overview - Tutorialspoint
No ratings yet
HTML - Overview - Tutorialspoint
4 pages
Synology DS223 Data Sheet Enu
No ratings yet
Synology DS223 Data Sheet Enu
9 pages
Lexical Analyser in C++ - ASHWATH KV - 106120017 For Full Code
No ratings yet
Lexical Analyser in C++ - ASHWATH KV - 106120017 For Full Code
4 pages
Week 2a &2B
No ratings yet
Week 2a &2B
6 pages
IT Coordinator in School
No ratings yet
IT Coordinator in School
1 page
Ibtasam Mateen (18-Arid-5157) Compiler Practical
No ratings yet
Ibtasam Mateen (18-Arid-5157) Compiler Practical
6 pages
21 Brs 1619
No ratings yet
21 Brs 1619
4 pages
MultiVue Quick Guide (EPIQ Evolution 5.0 & Affiniti Continuum 3.0) Newpdf
No ratings yet
MultiVue Quick Guide (EPIQ Evolution 5.0 & Affiniti Continuum 3.0) Newpdf
5 pages
Cmpe-371 DSP
No ratings yet
Cmpe-371 DSP
1 page
Pega Customer Service Pricing Matrix PDF
No ratings yet
Pega Customer Service Pricing Matrix PDF
3 pages
Compiler Design Lab Assignment Lab 4
No ratings yet
Compiler Design Lab Assignment Lab 4
7 pages
Desktop Dell Optiplex 7010 SFF (59P3N)
No ratings yet
Desktop Dell Optiplex 7010 SFF (59P3N)
3 pages
New Text Document
No ratings yet
New Text Document
6 pages
SPCC Lab1
No ratings yet
SPCC Lab1
2 pages
Multi-Mode Router: Meet All Your Needs. TL-WR841N
No ratings yet
Multi-Mode Router: Meet All Your Needs. TL-WR841N
2 pages
Teacher's Notes - Lab Chapter 1 - Intro To Solaris
No ratings yet
Teacher's Notes - Lab Chapter 1 - Intro To Solaris
3 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet

3

Uploaded by

3

Uploaded by

#include <ctype.

#define MAX_LENGTH 100

// Function to check if a character is a delimiter

// Function to check if a character is an operator

// Function to check if a string is a valid identifier

for (int i = 1; i < strlen(str); i++) {

// Function to check if a string is a keyword

for (int i = 0; i < sizeof(keywords) / sizeof(keywords[0]); i++) {

// Function to check if a string is an integer or floating point number

if (str[0] == '-') // Allow negative numbers

for (; str[i] != '\0'; i++) {

// Function to extract a substring from a string

// Lexical Analyzer Function

while (right < len) {

// Handling single-line and multi-line comments

// Detecting multi-character operators (>=, ==, !=, etc.)

// Processing words (identifiers, keywords, numbers)

char *subStr = getSubstring(input, left, right - 1);

free(subStr); // Free allocated memory

printf("For Expression:\n%s\n\n", lex_input);

You might also like