0% found this document useful (0 votes)

24 views27 pages

ISR Code

Uploaded by

Akshata Dongaonkar

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

24 views27 pages

ISR Code

Uploaded by

Akshata Dongaonkar

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 27

Name: Akshata Vishal Dongaonkar

Roll No.:45020
Div: BE-IT-A
Subject: ISR

1. Conflation Algorithm

import java.io.BufferedReader; import

java.io.FileNotFoundException; import

java.io.FileReader; import

java.io.IOException; import

java.io.InputStreamReader;

import java.util.ArrayList;

import java.util.HashMap;

import java.util.Iterator; import

java.util.Map;

/**
 * Conflation demo: reads a text file, removes stop words, strips a small set
 * of suffixes from the remaining words and prints how often each remaining
 * word occurs.
 *
 * <p>All results are printed to standard output. The words that were kept and
 * the stop words that were dropped are also exposed through the static lists
 * {@link #removestopList} and {@link #stopList}.
 */
public class Conflation {

    /** Stop words found in the file most recently passed to {@link #conflation(String)}. */
    public static ArrayList<String> stopList = new ArrayList<String>();

    /** Non-stop words of the file most recently passed to {@link #conflation(String)}. */
    public static ArrayList<String> removestopList = new ArrayList<String>();

    /** Suffixes tried in this order; only the first matching one is stripped. */
    public static String suffixes[] = { "able", "ing", "ion", "y", "ment" };

    /** Words that are dropped from the input (matched case-insensitively). */
    public static String stopwords[] = { "i", "big", "am", "m", "a", "we",
            "are", "it", "of", "this", "and", "is", "to", "at", "in", "was",
            "with", "doing", "It", "not", "our" };

    /**
     * Prompts for a file name on standard input and runs the conflation
     * pipeline on that file.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        BufferedReader console = new BufferedReader(new InputStreamReader(System.in));
        String fname = null;
        System.out.println("Enter a filename:");
        try {
            fname = console.readLine();
        } catch (IOException e) {
            e.printStackTrace();
        }
        if (fname == null) {
            // End of input or a read failure: there is nothing to open.
            System.err.println("No filename was provided.");
            return;
        }
        conflation(fname);
    }

    /**
     * Runs the whole pipeline on one file: splits every line into
     * whitespace-separated words, sorts them into {@link #stopList} and
     * {@link #removestopList}, then prints the kept words, their stems and
     * their frequencies.
     *
     * <p>Both static lists are cleared first so that repeated calls do not mix
     * the words of different files. I/O failures are reported with a stack
     * trace and otherwise ignored, as before.
     *
     * @param fname path of the text file to process
     */
    public static void conflation(String fname) {
        stopList.clear();
        removestopList.clear();
        // try-with-resources closes the file even when reading fails.
        try (BufferedReader reader = new BufferedReader(new FileReader(fname))) {
            String line;
            while ((line = reader.readLine()) != null) {
                for (String word : line.split("\\s+")) {
                    if (word.endsWith(".")) {
                        word = word.replace(".", "");
                    }
                    if (word.isEmpty()) {
                        // Produced by blank lines, leading whitespace or a lone ".".
                        continue;
                    }
                    if (isStopWord(word)) {
                        stopList.add(word);
                    } else {
                        removestopList.add(word);
                    }
                }
            }

            System.out.println("\n--------------After Removing Stop Words-----------------");
            for (String word : removestopList) {
                System.out.println(word);
            }
            suffixesString(removestopList);
            countFrequency(removestopList);
        } catch (FileNotFoundException e) {
            e.printStackTrace();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /** Returns true when {@code word} equals one of {@link #stopwords}, ignoring case. */
    private static boolean isStopWord(String word) {
        for (String stopword : stopwords) {
            if (stopword.equalsIgnoreCase(word)) {
                return true;
            }
        }
        return false;
    }

    /**
     * Prints every distinct word of the given list together with the number
     * of times it occurs, in the iteration order of a {@link HashMap}.
     *
     * @param removestopList2 words to count
     */
    private static void countFrequency(ArrayList<String> removestopList2) {
        System.out.println("\n\n-------After Counting Frequency-----------");
        // Mapping of String->Integer (word -> frequency)
        final Map<String, Integer> frequencyMap = new HashMap<String, Integer>();
        for (String currentWord : removestopList2) {
            Integer frequency = frequencyMap.get(currentWord);
            // First sighting starts at 1, otherwise bump the existing counter.
            frequencyMap.put(currentWord, frequency == null ? 1 : frequency + 1);
        }
        for (Map.Entry<String, Integer> entry : frequencyMap.entrySet()) {
            System.out.println(entry.getKey() + " = " + entry.getValue());
        }
    }

    /**
     * Prints each word followed by two tabs and the word with its suffix
     * removed (or the word itself when no suffix applies).
     *
     * @param removestopList words to stem
     */
    private static void suffixesString(ArrayList<String> removestopList) {
        System.out.println("\n\n--------After Removing Suffixes------------");
        for (String word : removestopList) {
            System.out.println(word + "\t\t" + stripSuffix(word));
        }
    }

    /**
     * Removes the first entry of {@link #suffixes} that {@code word} ends
     * with. A suffix is only removed when something is left over, so a word
     * that is itself a suffix is returned unchanged instead of becoming "".
     */
    private static String stripSuffix(String word) {
        for (String suffix : suffixes) {
            if (word.length() > suffix.length() && word.endsWith(suffix)) {
                return word.substring(0, word.length() - suffix.length());
            }
        }
        return word;
    }
}

Output:
2. Single Pass Algorithm
import java.io.BufferedReader;

import java.io.IOException; import

java.io.InputStreamReader; import

java.util.ArrayList;

/**
 * Single-pass clustering demo: documents are read as rows of an integer
 * document/token matrix and assigned, one after the other, to the existing
 * cluster whose representative is most similar, or to a new cluster when no
 * similarity exceeds the threshold.
 */
public class Singlepass {

    /**
     * Reads the matrix dimensions, the threshold and the matrix itself from
     * standard input (one number per line) and prints the resulting clusters.
     *
     * @param args unused
     * @throws IOException if standard input cannot be read
     */
    public static void main(String[] args) throws IOException {
        BufferedReader stdInpt = new BufferedReader(new InputStreamReader(System.in));

        // The first value sizes the rows (documents), the second the columns
        // (tokens); the prompts now say so in that order.
        System.out.println("Enter the no of Documents");
        int noOfDocuments = Integer.parseInt(stdInpt.readLine());
        System.out.println("Enter the no of Tokens");
        int noOfTokens = Integer.parseInt(stdInpt.readLine());
        System.out.println("Enter the threshhold");
        float threshhold = Float.parseFloat(stdInpt.readLine());

        System.out.println("Enter the Document Token Matrix");
        int[][] input = new int[noOfDocuments][noOfTokens];
        for (int i = 0; i < noOfDocuments; ++i) {
            for (int j = 0; j < noOfTokens; ++j) {
                System.out.println("Enter(" + i + "," + j + ")");
                input[i][j] = Integer.parseInt(stdInpt.readLine());
            }
        }

        SinglePassAlgorithm(noOfDocuments, noOfTokens, threshhold, input);
    }

    /**
     * Clusters the documents and prints one line per cluster: the cluster
     * index, a tab, then the indices of its member documents.
     *
     * <p>{@code cluster[c][0]} holds the member count of cluster {@code c} and
     * {@code cluster[c][1..count]} the member document indices.
     *
     * @param noOfDocuments number of rows in {@code input}
     * @param noOfTokens    number of columns in {@code input}
     * @param threshhold    a document joins a cluster only when its similarity
     *                      is strictly greater than this value
     * @param input         document/token matrix
     */
    private static void SinglePassAlgorithm(int noOfDocuments, int noOfTokens, float threshhold,
            int[][] input) {
        if (noOfDocuments <= 0) {
            // Nothing to cluster; seeding cluster 0 below would index out of bounds.
            return;
        }

        int[][] cluster = new int[noOfDocuments][noOfDocuments + 1];
        ArrayList<Float[]> clusterRepresentative = new ArrayList<Float[]>();

        // The first document always seeds the first cluster.
        cluster[0][0] = 1;
        cluster[0][1] = 0;
        int noOfClusters = 1;
        clusterRepresentative.add(convertintArrToFloatArr(input[0]));

        for (int i = 1; i < noOfDocuments; ++i) {
            // Converted once per document rather than once per cluster.
            Float[] document = convertintArrToFloatArr(input[i]);
            float max = Float.NEGATIVE_INFINITY;
            int clusterId = -1;
            for (int j = 0; j < noOfClusters; ++j) {
                float similarity = calculateSimilarity(document, clusterRepresentative.get(j));
                if (similarity > threshhold && similarity > max) {
                    max = similarity;
                    clusterId = j;
                }
            }

            // clusterId (not a magic similarity value) tells whether a match was found.
            if (clusterId == -1) {
                cluster[noOfClusters][0] = 1;
                cluster[noOfClusters][1] = i;
                noOfClusters++;
                clusterRepresentative.add(document);
            } else {
                cluster[clusterId][0] += 1;
                int index = cluster[clusterId][0];
                cluster[clusterId][index] = i;
                clusterRepresentative.set(clusterId,
                        calculateClusterRepresentative(cluster[clusterId], input, noOfTokens));
            }
        }

        for (int i = 0; i < noOfClusters; ++i) {
            System.out.print("\n" + i + "\t");
            for (int j = 1; j <= cluster[i][0]; ++j) {
                System.out.print(" " + cluster[i][j]);
            }
        }
    }

    /** This function converts the input integer array into a float array. */
    private static Float[] convertintArrToFloatArr(int[] input) {
        Float[] answer = new Float[input.length];
        for (int i = 0; i < input.length; ++i) {
            answer[i] = (float) input[i];
        }
        return answer;
    }

    /**
     * This function calculates the similarity value as the dot product of the
     * two vectors: answer = answer + a[i] * b[i].
     *
     * @param a first vector; its length bounds the loop
     * @param b second vector, expected to be at least as long as {@code a}
     * @return the dot product of {@code a} and {@code b}
     */
    private static float calculateSimilarity(Float[] a, Float[] b) {
        float answer = 0;
        for (int i = 0; i < a.length; ++i) {
            answer += a[i] * b[i];
        }
        return answer;
    }

    /**
     * This function calculates the centroid of a cluster: the per-token mean
     * of the rows of {@code input} that belong to the cluster.
     *
     * @param cluster    member list; {@code cluster[0]} is the member count and
     *                   {@code cluster[1..count]} are row indices into {@code input}
     * @param input      document/token matrix
     * @param noOFTokens number of columns in {@code input}
     * @return the centroid vector, of length {@code noOFTokens}
     */
    private static Float[] calculateClusterRepresentative(int[] cluster, int[][] input,
            int noOFTokens) {
        Float[] answer = new Float[noOFTokens];
        for (int i = 0; i < noOFTokens; ++i) {
            answer[i] = 0f;
        }
        for (int i = 1; i <= cluster[0]; ++i) {
            for (int j = 0; j < noOFTokens; ++j) {
                answer[j] += input[cluster[i]][j];
            }
        }
        for (int i = 0; i < noOFTokens; ++i) {
            answer[i] /= cluster[0];
        }
        return answer;
    }
}

Output:
3. Inverted File
import java.io.BufferedReader;

import java.io.FileNotFoundException;

import java.io.FileReader; import

java.io.IOException; import

java.io.InputStreamReader; import

java.util.ArrayList; import

java.util.StringTokenizer;

/**
 * Builds and prints a simple inverted index: for every distinct token, the
 * numbers of the files in which it occurs.
 *
 * <p>The index is kept in two parallel structures: {@code invertedData.get(i)}
 * is the i-th token, {@code docno[i][0]} is the number of postings for that
 * token and {@code docno[i][1..count]} are the file numbers.
 */
public class InvertedFile {

    /**
     * Prints one line per token: the token followed by its file numbers,
     * separated by tabs.
     *
     * @param invertedData tokens, in the order they were first seen
     * @param docno        postings table parallel to {@code invertedData}
     */
    public static void displayIndex(ArrayList<String> invertedData, int[][] docno) {
        for (int i = 0; i < invertedData.size(); i++) {
            System.out.print(invertedData.get(i) + "\t");
            for (int j = 1; j <= docno[i][0]; j++) {
                System.out.print(docno[i][j] + "\t");
            }
            System.out.print("\n");
        }
    }

    /**
     * Adds the tokens of one file to the index. Lines are split on spaces,
     * commas and full stops; empty fragments are ignored.
     *
     * <p>Each file number is recorded at most once per token. A row of
     * {@code docno} that is too short for another posting is replaced by a
     * longer copy. The number of rows cannot grow, so once every row is in
     * use further new tokens are skipped and a warning is written to standard
     * error. Read failures are reported with a stack trace.
     *
     * @param fname        path of the file to index
     * @param invertedData token list to extend
     * @param docno        postings table to extend; its rows may be replaced
     * @param fileno       number recorded for this file
     */
    public static void indexing(String fname, ArrayList<String> invertedData, int[][] docno,
            int fileno) {
        if (fname == null) {
            System.err.println("No file name given for file " + fileno);
            return;
        }
        boolean warnedFull = false;
        // try-with-resources closes the file even when reading fails.
        try (BufferedReader br = new BufferedReader(new FileReader(fname))) {
            String line;
            while ((line = br.readLine()) != null) {
                for (String currenttoken : line.split("[ ,.]")) {
                    if (currenttoken.isEmpty()) {
                        // Adjacent separators such as ", " yield empty fragments.
                        continue;
                    }
                    int indx = invertedData.indexOf(currenttoken);
                    if (indx == -1) {
                        if (invertedData.size() >= docno.length) {
                            // Adding the token without a postings row would
                            // leave the two structures out of step.
                            if (!warnedFull) {
                                System.err.println("Index is full (" + docno.length
                                        + " tokens); ignoring further new tokens in " + fname);
                                warnedFull = true;
                            }
                            continue;
                        }
                        invertedData.add(currenttoken);
                        indx = invertedData.size() - 1;
                        docno[indx] = withCapacity(docno[indx], 2);
                        docno[indx][0] = 1;
                        docno[indx][1] = fileno;
                    } else if (!hasPosting(docno[indx], fileno)) {
                        int count = docno[indx][0];
                        docno[indx] = withCapacity(docno[indx], count + 2);
                        docno[indx][count + 1] = fileno;
                        docno[indx][0] = count + 1;
                    }
                }
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /** Returns true when {@code fileno} is already among the postings of {@code row}. */
    private static boolean hasPosting(int[] row, int fileno) {
        for (int k = 1; k <= row[0]; k++) {
            if (row[k] == fileno) {
                return true;
            }
        }
        return false;
    }

    /** Returns {@code row} itself when it has at least {@code needed} cells, else a longer copy. */
    private static int[] withCapacity(int[] row, int needed) {
        if (row == null) {
            return new int[needed];
        }
        if (row.length >= needed) {
            return row;
        }
        return java.util.Arrays.copyOf(row, Math.max(needed, row.length * 2));
    }

    /**
     * Asks for the number of files and each file name on standard input,
     * indexes the files (numbered from 1) and prints the index.
     *
     * @param args unused
     * @throws NumberFormatException if the file count is not an integer
     * @throws IOException           if standard input cannot be read
     */
    public static void main(String[] args) throws NumberFormatException, IOException {
        ArrayList<String> invertedData = new ArrayList<String>();
        int docno[][] = new int[100][10];
        BufferedReader br = new BufferedReader(new InputStreamReader(System.in));

        System.out.println("\nENTER TOTAL NO OF FILES:");
        int no = Integer.parseInt(br.readLine());

        // A bounded loop also terminates for a zero or negative count.
        for (int i = 1; i <= no; i++) {
            System.out.println("\nENTER FILE " + i + " NAME:");
            String fname = br.readLine();
            if (fname == null) {
                // Standard input ended before all names were given.
                break;
            }
            indexing(fname, invertedData, docno, i);
        }

        displayIndex(invertedData, docno);
    }
}

Output:
4. Precision And Recall

import java.util.HashSet; import

java.util.Set;

/**
 * Computes precision and recall of a retrieved answer set against a set of
 * relevant documents.
 */
public class PrecisionRecallCalculator {

    /**
     * Runs the calculation on a fixed sample: five retrieved documents, three
     * of which are relevant, and prints the query name and both measures.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        // Sample input: Answer set A, Query q1, and Relevant documents Rq1
        Set<String> answerSetA = new HashSet<>();
        answerSetA.add("Doc1");
        answerSetA.add("Doc2");
        answerSetA.add("Doc3");
        answerSetA.add("Doc4");
        answerSetA.add("Doc5");

        Set<String> relevantDocumentsRq1 = new HashSet<>();
        relevantDocumentsRq1.add("Doc1");
        relevantDocumentsRq1.add("Doc2");
        relevantDocumentsRq1.add("Doc3");

        // Query q1
        String query = "q1";

        // Calculate precision and recall
        double precision = calculatePrecision(answerSetA, relevantDocumentsRq1);
        double recall = calculateRecall(answerSetA, relevantDocumentsRq1);

        // Print the results
        System.out.println("Query: " + query);
        System.out.println("Precision: " + precision);
        System.out.println("Recall: " + recall);
    }

    /**
     * Calculates precision: the fraction of retrieved documents that are
     * relevant.
     *
     * @param retrievedDocuments documents returned for the query
     * @param relevantDocuments  documents that are relevant to the query
     * @return relevant-and-retrieved count divided by the retrieved count, or
     *         0.0 when nothing was retrieved (instead of NaN from 0/0)
     */
    public static double calculatePrecision(Set<String> retrievedDocuments,
            Set<String> relevantDocuments) {
        if (retrievedDocuments.isEmpty()) {
            return 0.0;
        }
        return (double) countRelevantRetrieved(retrievedDocuments, relevantDocuments)
                / retrievedDocuments.size();
    }

    /**
     * Calculates recall: the fraction of relevant documents that were
     * retrieved.
     *
     * @param retrievedDocuments documents returned for the query
     * @param relevantDocuments  documents that are relevant to the query
     * @return relevant-and-retrieved count divided by the relevant count, or
     *         0.0 when there are no relevant documents (instead of NaN from 0/0)
     */
    public static double calculateRecall(Set<String> retrievedDocuments,
            Set<String> relevantDocuments) {
        if (relevantDocuments.isEmpty()) {
            return 0.0;
        }
        return (double) countRelevantRetrieved(retrievedDocuments, relevantDocuments)
                / relevantDocuments.size();
    }

    /** Counts the retrieved documents that are also contained in the relevant set. */
    private static int countRelevantRetrieved(Set<String> retrievedDocuments,
            Set<String> relevantDocuments) {
        int relevantRetrieved = 0;
        for (String doc : retrievedDocuments) {
            if (relevantDocuments.contains(doc)) {
                relevantRetrieved++;
            }
        }
        return relevantRetrieved;
    }
}

Output:
5. Harmonic Mean

package com.darshan;

/**
 * Combines precision and recall into single-number measures based on their
 * harmonic mean.
 */
public class MetricsCalculator {

    /**
     * Calculates the F1 score, the harmonic mean of precision and recall.
     *
     * @param precision precision of the result set
     * @param recall    recall of the result set
     * @return {@code 2 * precision * recall / (precision + recall)}, or 0 when
     *         the sum of both is 0
     */
    public static double calculateF1(double precision, double recall) {
        if (precision + recall == 0) {
            return 0;
        }
        return 2 * (precision * recall) / (precision + recall);
    }

    /**
     * Calculates the weighted harmonic mean
     * {@code 1 / (alpha / precision + (1 - alpha) / recall)}.
     *
     * <p>With {@code alpha = 0.5} this equals {@link #calculateF1}.
     * NOTE(review): this value is a weighted F-measure; the E-measure is often
     * defined as one minus it. The formula is kept unchanged — confirm which
     * definition is intended.
     *
     * @param precision precision of the result set
     * @param recall    recall of the result set
     * @param alpha     weight given to precision; {@code 1 - alpha} is the
     *                  weight given to recall
     * @return the weighted harmonic mean, or 0 when precision or recall is 0
     */
    public static double calculateEMeasure(double precision, double recall, double alpha) {
        // Guarding each operand (not only "both zero") avoids 0/0 = NaN when
        // the zero operand happens to carry a zero weight.
        if (precision == 0 || recall == 0) {
            return 0;
        }
        return 1 / ((alpha / precision) + ((1 - alpha) / recall));
    }

    /**
     * Prints both measures, formatted to two decimals, for a fixed example.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        // Example values
        double precision = 0.75;
        double recall = 0.80;
        double alpha = 0.5;

        // Calculate F-measure
        double f1Score = calculateF1(precision, recall);
        System.out.println("F-measure (F1-score): " + String.format("%.2f", f1Score));

        // Calculate E-measure
        double eMeasure = calculateEMeasure(precision, recall, alpha);
        System.out.println("E-measure: " + String.format("%.2f", eMeasure));
    }
}

Output :
6. Feature Extraction
7. Web Crawler
8. Weather Forecasting

TCS CodeVita Actual Questions Answers
No ratings yet
TCS CodeVita Actual Questions Answers
27 pages
Full Hackerrank
No ratings yet
Full Hackerrank
108 pages
25 Java Programs
No ratings yet
25 Java Programs
36 pages
Java8 Problems Solutions All 50
No ratings yet
Java8 Problems Solutions All 50
8 pages
String Interview Questions
No ratings yet
String Interview Questions
10 pages
FRAZ DSA Sheet Solutions by Prashant
No ratings yet
FRAZ DSA Sheet Solutions by Prashant
53 pages
Dynapac Large Tracked Paver Range: SD2500C / SD2500CS / SD2550C / SD2550CS
No ratings yet
Dynapac Large Tracked Paver Range: SD2500C / SD2500CS / SD2550C / SD2550CS
20 pages
TELX TD PABX Manual PDF
No ratings yet
TELX TD PABX Manual PDF
44 pages
Yuvraj (22scse1012063)
No ratings yet
Yuvraj (22scse1012063)
49 pages
T-49C-CA MOD2 Operational Manual
No ratings yet
T-49C-CA MOD2 Operational Manual
52 pages
BS - EN12715 - 2000 Execution of Special Geotechnical Work - Grouting
No ratings yet
BS - EN12715 - 2000 Execution of Special Geotechnical Work - Grouting
56 pages
Boiler Turbine Technical Report
No ratings yet
Boiler Turbine Technical Report
31 pages
Hoistway Top: Gen2 Nova MRL - Machine
100% (1)
Hoistway Top: Gen2 Nova MRL - Machine
4 pages
Amazon Interview Questions With Solutions Java
No ratings yet
Amazon Interview Questions With Solutions Java
13 pages
DCDR FULL
100% (1)
DCDR FULL
23 pages
All Session Programs With Solutins
No ratings yet
All Session Programs With Solutins
128 pages
Arcgis Online Tutorial 2017 PDF
No ratings yet
Arcgis Online Tutorial 2017 PDF
22 pages
Rajat Sachan 22scse1012575 Dsa Mte Assignment
No ratings yet
Rajat Sachan 22scse1012575 Dsa Mte Assignment
57 pages
1 AiM Online Review
No ratings yet
1 AiM Online Review
121 pages
AAPS Shubh
No ratings yet
AAPS Shubh
43 pages
Adrineel Saha - C-191 - Formal Language and Automata Theory (PCCCS502) - Mini Project
No ratings yet
Adrineel Saha - C-191 - Formal Language and Automata Theory (PCCCS502) - Mini Project
93 pages
AAPS Lab File Code
No ratings yet
AAPS Lab File Code
32 pages
CSharp - Programs Very Important
No ratings yet
CSharp - Programs Very Important
127 pages
VST - Axial Flow Catalog - 2021.R010
No ratings yet
VST - Axial Flow Catalog - 2021.R010
6 pages
Skill Lab
No ratings yet
Skill Lab
27 pages
UART - Specification by Texas Instruments
No ratings yet
UART - Specification by Texas Instruments
51 pages
Java Programs
No ratings yet
Java Programs
21 pages
PLACEMENT PRACTICE 10-12-2024, Himanshu
No ratings yet
PLACEMENT PRACTICE 10-12-2024, Himanshu
17 pages
Leetcode
No ratings yet
Leetcode
96 pages
Core Java Questions
100% (1)
Core Java Questions
16 pages
Array, String Methods
No ratings yet
Array, String Methods
11 pages
Cdjavacodes
No ratings yet
Cdjavacodes
23 pages
Godaddy
No ratings yet
Godaddy
14 pages
JAVA
No ratings yet
JAVA
29 pages
Most Asked
No ratings yet
Most Asked
7 pages
LeetCode Interview Questions Solutions Improved
No ratings yet
LeetCode Interview Questions Solutions Improved
8 pages
Hackertest
No ratings yet
Hackertest
9 pages
SPOS Codes
No ratings yet
SPOS Codes
21 pages
CA Paper Comp
No ratings yet
CA Paper Comp
10 pages
Collections Assignment
No ratings yet
Collections Assignment
9 pages
Java Questions Srithar
No ratings yet
Java Questions Srithar
29 pages
NFJJDJJSJJ OK
No ratings yet
NFJJDJJSJJ OK
9 pages
PROGRAM: (K-Nearest Neighbour Algorithm)
No ratings yet
PROGRAM: (K-Nearest Neighbour Algorithm)
24 pages
AC Assingment 3 1127
No ratings yet
AC Assingment 3 1127
6 pages
Week 6 - Level 2 - 10 (Step) Rithish S
No ratings yet
Week 6 - Level 2 - 10 (Step) Rithish S
19 pages
Bhaskar - CSE-2 - DAA Experential Learning
No ratings yet
Bhaskar - CSE-2 - DAA Experential Learning
9 pages
Hash
No ratings yet
Hash
16 pages
Repeated Coding Question
No ratings yet
Repeated Coding Question
13 pages
String Codes
No ratings yet
String Codes
11 pages
Assignment 8
No ratings yet
Assignment 8
10 pages
Java Ca
No ratings yet
Java Ca
13 pages
Assistant Secretary - Job Description
No ratings yet
Assistant Secretary - Job Description
2 pages
Programs - Day 3
No ratings yet
Programs - Day 3
24 pages
21BCS1130 - Abhinav Soni Day 6
No ratings yet
21BCS1130 - Abhinav Soni Day 6
9 pages
Java Assignmnet
No ratings yet
Java Assignmnet
6 pages
Notes
No ratings yet
Notes
22 pages
Pass 1
No ratings yet
Pass 1
9 pages
CD LAB in Java
No ratings yet
CD LAB in Java
12 pages
Top50 Java String Array Problems
No ratings yet
Top50 Java String Array Problems
7 pages
PESIT Bangalore South Campus: Vii Semester Lab Manual Subject: Machine Learning
No ratings yet
PESIT Bangalore South Campus: Vii Semester Lab Manual Subject: Machine Learning
31 pages
DBMS Assignment 9 PDF
No ratings yet
DBMS Assignment 9 PDF
5 pages
DBMS Assignment 9
No ratings yet
DBMS Assignment 9
5 pages
Assignment 03 23121053 MD - Tanimur Rahman
No ratings yet
Assignment 03 23121053 MD - Tanimur Rahman
11 pages
Solar Tracking System Thesis PDF
100% (3)
Solar Tracking System Thesis PDF
5 pages
CS201 Midterm1 Helper Sheet
No ratings yet
CS201 Midterm1 Helper Sheet
5 pages
Game Over
No ratings yet
Game Over
3 pages
Leet Code Solutions
No ratings yet
Leet Code Solutions
6 pages
5th Sem QN Paper 2022
No ratings yet
5th Sem QN Paper 2022
15 pages
A3 InvertedFiles
No ratings yet
A3 InvertedFiles
2 pages
Apriori Algorithm DWDM
No ratings yet
Apriori Algorithm DWDM
5 pages
Lecture Note 1
No ratings yet
Lecture Note 1
42 pages
UN 9252-02 Part 1 - UD-AU-000-EB-00019 PDF
100% (1)
UN 9252-02 Part 1 - UD-AU-000-EB-00019 PDF
17 pages
Public Class Charrep (
No ratings yet
Public Class Charrep (
15 pages
Import Java - Io. Public Class Palindrome (
No ratings yet
Import Java - Io. Public Class Palindrome (
7 pages
CTPM PIDs Review Clarifications For WQIFOD 26-30 Aug 2012
No ratings yet
CTPM PIDs Review Clarifications For WQIFOD 26-30 Aug 2012
6 pages
Irp May 29th
No ratings yet
Irp May 29th
5 pages
Ebook The Practical Guide To Using A Semantic Layer
No ratings yet
Ebook The Practical Guide To Using A Semantic Layer
30 pages
DRAWINGS 1 OPS-WW - Colour Up Deluxe
No ratings yet
DRAWINGS 1 OPS-WW - Colour Up Deluxe
12 pages
Admin Workflow User Documentation
No ratings yet
Admin Workflow User Documentation
19 pages
Csec French p2 2019 MJ
No ratings yet
Csec French p2 2019 MJ
14 pages
Divine Light Academy: Class No
No ratings yet
Divine Light Academy: Class No
2 pages
Delegated Content Erasure in IPFS: Future Generation Computer Systems June 2020
No ratings yet
Delegated Content Erasure in IPFS: Future Generation Computer Systems June 2020
10 pages
TOEIC
No ratings yet
TOEIC
14 pages
Training Schedule Loan Performer: Tea Break
No ratings yet
Training Schedule Loan Performer: Tea Break
12 pages
Intel It Annual Performance Report 2021 2022 Paper
No ratings yet
Intel It Annual Performance Report 2021 2022 Paper
19 pages
DGMD S17 Summer2019 Jun20
No ratings yet
DGMD S17 Summer2019 Jun20
6 pages
(18 April 2024) Aligning Open Language Models
No ratings yet
(18 April 2024) Aligning Open Language Models
77 pages
Stephen Mcgruer: Contact Details Education Experience
No ratings yet
Stephen Mcgruer: Contact Details Education Experience
1 page
Advanced C Concepts and Programming: First Edition
From Everand
Advanced C Concepts and Programming: First Edition
Gayatri
3/5 (1)
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet