0% found this document useful (0 votes)

5 views4 pages

Tokencc C

Program on c

Uploaded by

h6643246

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

5 views4 pages

Tokencc C

Program on c

Uploaded by

h6643246

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

File: /home/shahana/tokencc.c Page 1 of 4

#include <stdio.h>
#include <ctype.h>
#include <string.h>

// Define token types

// Category assigned to each lexeme produced by the tokenizer.
// The numeric values are spelled out; they match the implicit numbering
// the enumerators would receive anyway.
typedef enum {
    TOKEN_KEYWORD        = 0,  // identifier-shaped lexeme found in the keyword list
    TOKEN_IDENTIFIER     = 1,  // identifier-shaped lexeme that is not a keyword
    TOKEN_CONSTANT       = 2,  // run of decimal digits
    TOKEN_STRING         = 3,  // double-quoted string literal
    TOKEN_OPERATOR       = 4,  // single operator character
    TOKEN_SPECIAL_SYMBOL = 5,  // single punctuation character
    TOKEN_UNKNOWN        = 6,  // any character not covered above
    TOKEN_EOF            = 7   // end of input reached
} TokenType;

// Define a structure for tokens

// Size in bytes of Token.lexeme, including the terminating '\0'.
// Named so that code filling the buffer can refer to the limit instead of
// repeating the literal 100.
enum { TOKEN_LEXEME_SIZE = 100 };

// One lexical token: its category and the text that was matched.
typedef struct {
    TokenType type;                  // category of the token
    char lexeme[TOKEN_LEXEME_SIZE];  // NUL-terminated text of the token
} Token;

// List of keywords
const char *keywords[] = {
    "if", "else", "while", "for", "return",
    "int", "float", "void", "char", "double"
};

// Number of entries in keywords[]. Computed from the array itself so the
// count cannot drift out of sync when a keyword is added or removed.
const int keywordCount = (int)(sizeof keywords / sizeof keywords[0]);

// Report whether a lexeme is one of the reserved words in keywords[].
//
// lexeme: NUL-terminated string to look up; it is not modified.
// Returns 1 on an exact, case-sensitive match and 0 otherwise
// (including when lexeme is NULL).
int isKeyword(const char *lexeme) {
    if (lexeme == NULL) {
        return 0;  // strcmp on a null pointer would be undefined behaviour
    }
    for (int i = 0; i < keywordCount; i++) {
        if (strcmp(lexeme, keywords[i]) == 0) {
            return 1;
        }
    }
    return 0;
}

// Function to classify a character

// Report whether ch is one of the punctuation characters this lexer treats
// as a special symbol.
// Returns 1 for , ; ( ) [ ] { } & | ! # ^ ~ ? : and 0 for anything else.
int isSpecialSymbol(char ch) {
    switch (ch) {
    case ',': case ';':
    case '(': case ')':
    case '[': case ']':
    case '{': case '}':
    case '&': case '|': case '!':
    case '#': case '^': case '~':
    case '?': case ':':
        return 1;
    default:
        return 0;
    }
}

// Report whether ch is a single-character operator.
// Returns 1 for + - * / % > < = & | ! and 0 for anything else.
// '%' is included so that the modulo operator is not classified as an
// unknown character.
int isOperator(char ch) {
    switch (ch) {
    case '+': case '-': case '*': case '/': case '%':
    case '>': case '<': case '=':
    case '&': case '|': case '!':
        return 1;
    default:
        return 0;
    }
}

// Report whether ch is a decimal digit.
// Returns 1 for '0' through '9' and 0 for anything else.
int isDigit(char ch) {
    if (ch < '0') {
        return 0;
    }
    if (ch > '9') {
        return 0;
    }
    return 1;
}

// Report whether ch may begin an identifier: a letter or an underscore.
// Returns 1 if so, 0 otherwise.
int isIdentifierStart(char ch) {
    if (ch == '_') {
        return 1;
    }
    // <ctype.h> functions require a value representable as unsigned char
    // (or EOF); a plain char may be negative, so convert before the call.
    return isalpha((unsigned char)ch) != 0;
}

// Report whether ch may appear after the first character of an identifier:
// a letter, a decimal digit or an underscore.
// Returns 1 if so, 0 otherwise.
int isIdentifierPart(char ch) {
    if (ch == '_') {
        return 1;
    }
    // <ctype.h> functions require a value representable as unsigned char
    // (or EOF); a plain char may be negative, so convert before the call.
    return isalnum((unsigned char)ch) != 0;
}

// Function to get the next token

File: /home/shahana/tokencc.c Page 2 of 4

// Store ch at the end of token->lexeme if there is still room for it plus
// the terminating '\0'; otherwise drop it, so an over-long lexeme is
// truncated instead of overflowing the buffer. *len is the number of
// characters stored so far and is advanced when ch is stored.
static void appendLexemeChar(Token *token, int *len, int ch) {
    if (*len < (int)sizeof token->lexeme - 1) {
        token->lexeme[*len] = (char)ch;
        (*len)++;
    }
}

// Consume whitespace, "//" comments and "/* */" comments from source.
// Returns the first character that belongs to a token, or EOF.
// Written as a loop so that a long run of comments does not recurse.
static int skipBlanksAndComments(FILE *source) {
    for (;;) {
        int ch = fgetc(source);
        while (isspace(ch)) {
            ch = fgetc(source);
        }
        if (ch != '/') {
            return ch;
        }

        int nextChar = fgetc(source);
        if (nextChar == '/') {
            // Single-line comment: discard up to the newline or EOF.
            do {
                ch = fgetc(source);
            } while (ch != '\n' && ch != EOF);
        } else if (nextChar == '*') {
            // Multi-line comment: remember the previous character so that
            // a terminator preceded by extra stars ("**/") is still seen.
            int prev = 0;
            while ((ch = fgetc(source)) != EOF) {
                if (prev == '*' && ch == '/') {
                    break;
                }
                prev = ch;
            }
        } else {
            // A lone '/' is the division operator; give back the lookahead.
            if (nextChar != EOF) {
                ungetc(nextChar, source);
            }
            return ch;
        }
    }
}

// Read the next token from source.
//
// Whitespace and comments are skipped. The returned Token holds the
// category in .type and the NUL-terminated text in .lexeme; at end of
// input the type is TOKEN_EOF and the lexeme is "EOF". Lexemes longer than
// the lexeme buffer are truncated to fit; the excess input is still
// consumed so the following token starts at the right place.
Token getNextToken(FILE *source) {
    Token token;
    int len = 0;
    int ch = skipBlanksAndComments(source);

    // Check for EOF
    if (ch == EOF) {
        token.type = TOKEN_EOF;
        strcpy(token.lexeme, "EOF");
        return token;
    }

    // Handle strings
    if (ch == '\"') {
        appendLexemeChar(&token, &len, ch);
        while ((ch = fgetc(source)) != EOF && ch != '\"') {
            appendLexemeChar(&token, &len, ch);
            if (ch == '\\') {
                // Keep the escaped character with its backslash so that
                // an escaped quote does not terminate the literal.
                ch = fgetc(source);
                if (ch == EOF) {
                    break;
                }
                appendLexemeChar(&token, &len, ch);
            }
        }
        if (ch == '\"') {
            appendLexemeChar(&token, &len, ch);  // closing quote
        }
        token.lexeme[len] = '\0';
        token.type = TOKEN_STRING;
        return token;
    }

    // Handle identifiers and keywords
    if (isIdentifierStart(ch)) {
        do {
            appendLexemeChar(&token, &len, ch);
            ch = fgetc(source);
        } while (ch != EOF && isIdentifierPart(ch));
        if (ch != EOF) {
            ungetc(ch, source);  // first character after the identifier
        }
        token.lexeme[len] = '\0';
        token.type = isKeyword(token.lexeme) ? TOKEN_KEYWORD : TOKEN_IDENTIFIER;
        return token;
    }

    // Handle numeric constants
    if (isDigit(ch)) {
        do {
            appendLexemeChar(&token, &len, ch);
            ch = fgetc(source);
        } while (ch != EOF && isDigit(ch));
        if (ch != EOF) {
            ungetc(ch, source);  // first character after the digits
        }
        token.lexeme[len] = '\0';
        token.type = TOKEN_CONSTANT;
        return token;
    }

    // Everything else is a single-character token.
    if (isOperator(ch)) {
        token.type = TOKEN_OPERATOR;
    } else if (isSpecialSymbol(ch)) {
        token.type = TOKEN_SPECIAL_SYMBOL;
    } else {
        token.type = TOKEN_UNKNOWN;
    }
    token.lexeme[0] = (char)ch;
    token.lexeme[1] = '\0';
    return token;
}

// Function to print tokens

// Write a one-line description of token to standard output.
// Every category prints a label followed by the lexeme, except TOKEN_EOF,
// which prints a fixed line. A type outside the known set prints nothing.
void printToken(Token token) {
    const TokenType kind = token.type;
    const char *text = token.lexeme;

    if (kind == TOKEN_EOF) {
        printf("End of File\n");
        return;
    }

    if (kind == TOKEN_KEYWORD) {
        printf("Keyword: %s\n", text);
    } else if (kind == TOKEN_IDENTIFIER) {
        printf("Identifier: %s\n", text);
    } else if (kind == TOKEN_CONSTANT) {
        printf("Constant: %s\n", text);
    } else if (kind == TOKEN_STRING) {
        printf("String: %s\n", text);
    } else if (kind == TOKEN_OPERATOR) {
        printf("Operator: %s\n", text);
    } else if (kind == TOKEN_SPECIAL_SYMBOL) {
        printf("Special Symbol: %s\n", text);
    } else if (kind == TOKEN_UNKNOWN) {
        printf("Unknown: %s\n", text);
    }
}

int main() {
FILE *source = fopen("sample1.c", "r");
File: /home/shahana/tokencc.c Page 4 of 4

if (source == NULL) {
printf("Error: Unable to open file.\n");
return 1;
}

Token token;
do {
token = getNextToken(source);
printToken(token);
} while (token.type != TOKEN_EOF);

fclose(source);
return 0;
}

Design and Implementation of A Computerised Stadium Management Information System
100% (8)
Design and Implementation of A Computerised Stadium Management Information System
32 pages
Vio 3 Service
No ratings yet
Vio 3 Service
84 pages
Lisp Interpreter in Rust
From Everand
Lisp Interpreter in Rust
Vishal Patil
1/5 (1)
NC-WR744G: AC1200 Wireless Dual Band Router
No ratings yet
NC-WR744G: AC1200 Wireless Dual Band Router
3 pages
Worth1000 Photoshop Tutorials
100% (3)
Worth1000 Photoshop Tutorials
315 pages
ATJ209X Program Guide v1.4
No ratings yet
ATJ209X Program Guide v1.4
137 pages
Compiler Design Lab
No ratings yet
Compiler Design Lab
49 pages
CD Lab Manual File
No ratings yet
CD Lab Manual File
27 pages
Pranjal
No ratings yet
Pranjal
32 pages
21BAI1213 - Abhinav V - Experiment-2
No ratings yet
21BAI1213 - Abhinav V - Experiment-2
11 pages
Design A Lexical Analyser For Given Language and The Lexical Analyser Should Ignore Redundant Spaces
No ratings yet
Design A Lexical Analyser For Given Language and The Lexical Analyser Should Ignore Redundant Spaces
7 pages
Program For Lexical Analyser
No ratings yet
Program For Lexical Analyser
5 pages
CD Lab File
No ratings yet
CD Lab File
45 pages
Include 1
No ratings yet
Include 1
2 pages
EX:No: 1A Implementation of Token Separation
No ratings yet
EX:No: 1A Implementation of Token Separation
4 pages
Assignment 2
No ratings yet
Assignment 2
4 pages
3
No ratings yet
3
3 pages
Experiment No 3 PDF
No ratings yet
Experiment No 3 PDF
4 pages
Ex 1 - Lexical Analyser
No ratings yet
Ex 1 - Lexical Analyser
8 pages
Write A C Program To Identify Different Types of Tokens in A Given Program
No ratings yet
Write A C Program To Identify Different Types of Tokens in A Given Program
6 pages
Week 2a &2B
No ratings yet
Week 2a &2B
6 pages
Lexer
No ratings yet
Lexer
6 pages
Mid Term Project
No ratings yet
Mid Term Project
4 pages
Compiler Design (CS-701) : Develop A Lexical Analyzer To Recognize A Few Patterns in C
No ratings yet
Compiler Design (CS-701) : Develop A Lexical Analyzer To Recognize A Few Patterns in C
17 pages
CD 1
No ratings yet
CD 1
31 pages
Dfa Simulation
No ratings yet
Dfa Simulation
5 pages
2
No ratings yet
2
6 pages
Final PCC Practical Experiment (Odd)
No ratings yet
Final PCC Practical Experiment (Odd)
6 pages
Compiler Satyam
No ratings yet
Compiler Satyam
43 pages
03 Lexical Analysis
No ratings yet
03 Lexical Analysis
14 pages
21bai1724 Lab-01
No ratings yet
21bai1724 Lab-01
11 pages
Experiments
No ratings yet
Experiments
5 pages
CD Lab Manual
No ratings yet
CD Lab Manual
68 pages
CC Lab 1-2
No ratings yet
CC Lab 1-2
6 pages
Lexical Analyser
No ratings yet
Lexical Analyser
3 pages
Wa0091.
No ratings yet
Wa0091.
36 pages
CD Lab Prgms Final
No ratings yet
CD Lab Prgms Final
43 pages
21BAI1159 Hari Prasath Experiment-2
No ratings yet
21BAI1159 Hari Prasath Experiment-2
11 pages
Assignment 1
No ratings yet
Assignment 1
11 pages
CD File - Merged
No ratings yet
CD File - Merged
52 pages
Rajalakshmi Institute of Technology Chennai: Department of Computer Science and Engineering
No ratings yet
Rajalakshmi Institute of Technology Chennai: Department of Computer Science and Engineering
20 pages
22bce2509 VL2024250102410 Ast01
No ratings yet
22bce2509 VL2024250102410 Ast01
12 pages
Compiler Lab Experiments
No ratings yet
Compiler Lab Experiments
24 pages
CD Lab Programs
No ratings yet
CD Lab Programs
9 pages
21bai1724 Lab-02
No ratings yet
21bai1724 Lab-02
10 pages
CD515
No ratings yet
CD515
55 pages
Lexical Analysis
No ratings yet
Lexical Analysis
3 pages
Compiler Design Lab
No ratings yet
Compiler Design Lab
27 pages
Compiler Design & Networks Lab Manual
No ratings yet
Compiler Design & Networks Lab Manual
69 pages
CD Assignment-2
No ratings yet
CD Assignment-2
16 pages
7) Write A Program To Design Lexical Analyzer
No ratings yet
7) Write A Program To Design Lexical Analyzer
25 pages
Cdlab UPDATED
No ratings yet
Cdlab UPDATED
43 pages
C Program To Read The File and Display Contents On The Screen
No ratings yet
C Program To Read The File and Display Contents On The Screen
22 pages
SPL PR 10
No ratings yet
SPL PR 10
2 pages
Uliya
No ratings yet
Uliya
45 pages
Lab 3 and 4
No ratings yet
Lab 3 and 4
12 pages
CD Lab Manual
No ratings yet
CD Lab Manual
37 pages
Lab Programs
No ratings yet
Lab Programs
20 pages
Tarun
No ratings yet
Tarun
51 pages
CD Lab Manual - Word
No ratings yet
CD Lab Manual - Word
42 pages
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
Introduction to PHP, Part 5, Second Edition
From Everand
Introduction to PHP, Part 5, Second Edition
Adam Majczak
No ratings yet
Python Reference: An Alphabetical Guide
From Everand
Python Reference: An Alphabetical Guide
Jo Foster
No ratings yet
Simplified PHP
From Everand
Simplified PHP
James Blanchette
No ratings yet
Introduction to PHP, Part 2, Second Edition
From Everand
Introduction to PHP, Part 2, Second Edition
Adam Majczak
No ratings yet
MongoDB and NoSQL Injection and Prevention
No ratings yet
MongoDB and NoSQL Injection and Prevention
5 pages
Gujarat Technological University
No ratings yet
Gujarat Technological University
2 pages
VR&AR
No ratings yet
VR&AR
8 pages
WR 1 Q P Memo
No ratings yet
WR 1 Q P Memo
7 pages
Find Changes Logs For A Table Using SM30 - SAP Blogs
No ratings yet
Find Changes Logs For A Table Using SM30 - SAP Blogs
7 pages
Scribbed 223751127-Chapter-12-Enhanced-Entity-Relationship-Modeling PDF
No ratings yet
Scribbed 223751127-Chapter-12-Enhanced-Entity-Relationship-Modeling PDF
16 pages
C# Concepts
No ratings yet
C# Concepts
2 pages
Alex Watts CV
No ratings yet
Alex Watts CV
2 pages
CZ4031 Project 2 Report
No ratings yet
CZ4031 Project 2 Report
34 pages
C Handbook
No ratings yet
C Handbook
22 pages
TE Comp Sem VI - AI For May 2022 Examination
No ratings yet
TE Comp Sem VI - AI For May 2022 Examination
3 pages
Day 3 - Customizing ChatGPT
No ratings yet
Day 3 - Customizing ChatGPT
44 pages
Internship Report
No ratings yet
Internship Report
8 pages
Arrays
No ratings yet
Arrays
9 pages
IA Industrial Automation Product Pricelist V6 August 02-09-21
No ratings yet
IA Industrial Automation Product Pricelist V6 August 02-09-21
148 pages
Form # 4 - ICS 4 Cable Installation Below Ground
No ratings yet
Form # 4 - ICS 4 Cable Installation Below Ground
1 page
Samsung GT c3520 Service Manual PDF
No ratings yet
Samsung GT c3520 Service Manual PDF
71 pages
Main Ldap Training Day2
No ratings yet
Main Ldap Training Day2
39 pages
Panasonic Lumix s5 II
No ratings yet
Panasonic Lumix s5 II
803 pages
Apple Assignment
No ratings yet
Apple Assignment
8 pages
Magel Is
No ratings yet
Magel Is
40 pages
Advance Excel Toolkit
No ratings yet
Advance Excel Toolkit
3 pages
Box Sensor 2
No ratings yet
Box Sensor 2
1 page
Vpre 2C
No ratings yet
Vpre 2C
5 pages
Computers
No ratings yet
Computers
2 pages

Tokencc C

Uploaded by

Tokencc C

Uploaded by

File: /home/shahana/tokencc.c

// Define token types

// Define a structure for tokens

const int keywordCount = 10;

// Function to check if a lexeme is a keyword

// Function to classify a character

int isOperator(char ch) {

int isDigit(char ch) {

int isIdentifierStart(char ch) {

int isIdentifierPart(char ch) {

// Function to get the next token

Token getNextToken(FILE *source) {

// Ignore whitespaces, tabs, and newlines

// Check for EOF

// Handle identifiers and keywords

// Handle numeric constants

// Handle special symbols

// Function to print tokens

You might also like