0% found this document useful (0 votes)

12 views7 pages

App

The document contains a Flask application that serves as a file management and summarization tool. It supports various file formats, allowing users to search, open, and summarize files using an AI model. The application includes a web interface with functionalities for text extraction, database searching, and real-time summary streaming.

Uploaded by

Botir Bakhtiyarov

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

12 views7 pages

App

Uploaded by

Botir Bakhtiyarov

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 7

backend code:

from flask import Flask, render_template, request, jsonify, Response,

stream_with_context
import sqlite3
import os
import markdown
from PyPDF2 import PdfReader
import pandas as pd
from docx import Document
from pptx import Presentation
import webbrowser
import threading
import subprocess
import psutil
import sys
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
import re
from transformers import TextIteratorStreamer

# Initialize Flask app

# Resolve the directory that holds ``templates/`` and ``static/``.
# When ``sys.frozen`` is set the directory of the running executable is used;
# otherwise the directory of this source file is used.
# A conditional expression replaces the old ``cond and a or b`` form, which
# silently fell through to the second branch whenever ``a`` was falsy
# (e.g. an empty dirname).
base_path = (
    os.path.dirname(sys.executable)
    if getattr(sys, 'frozen', False)
    else os.path.dirname(os.path.abspath(__file__))
)
app = Flask(
    __name__,
    template_folder=os.path.join(base_path, 'templates'),
    static_folder=os.path.join(base_path, 'static'),
)

def run():
    """Start ``app.exe`` from ``<cwd>/app`` unless a process of that name exists.

    Prints a notice and returns without launching anything when a process
    named ``app.exe`` is already present in the process list.
    """
    target_name = "app.exe"  # compared against the bare process name, not a path
    already_running = any(
        proc.info['name'] == target_name
        for proc in psutil.process_iter(attrs=['name'])
    )
    if already_running:
        print(f"{target_name} is already running.")
        return

    launch_path = os.path.join(os.getcwd(), "app", "app.exe")
    subprocess.Popen([launch_path])

def open_browser():
    """Open the locally served web UI in a new browser window."""
    # Point directly at the local server started by ``app.run`` in this file.
    # The previous literal routed through an unrelated third-party host
    # prefix, so the browser never reached the local server.
    webbrowser.open_new("http://127.0.0.1:5000")

# Initialize AI model
print(f"GPU available: {torch.cuda.is_available()}")
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"

# Local directory holding the model weights and tokenizer files.
model_name = r"C:\Users\nick\DeepSeek-R1-Distill-Qwen-1.5B"
tokenizer = AutoTokenizer.from_pretrained(model_name)
tokenizer.pad_token = tokenizer.eos_token  # reuse the EOS token as padding
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    device_map="auto",
    torch_dtype=torch.bfloat16,
)
# NOTE(review): the model is loaded with device_map="auto" and then moved
# explicitly as well; confirm the explicit move is still wanted.
model = model.to(device)

def _read_plain_text(file_path):
    """Read a text file as UTF-8, dropping a leading byte-order mark if present."""
    # 'utf-8-sig' decodes plain UTF-8 too; it only strips an initial BOM so the
    # marker does not end up as the first character of the returned text.
    with open(file_path, 'r', encoding='utf-8-sig') as f:
        return f.read()


def _read_pdf(file_path):
    """Extract the text of every page of a PDF, one page per line group."""
    reader = PdfReader(file_path)
    # Join pages with a newline so the last word of one page is not fused
    # with the first word of the next.
    return "\n".join(page.extract_text() or "" for page in reader.pages)


def _read_word(file_path):
    """Return the non-blank paragraphs of a Word document, newline-separated."""
    doc = Document(file_path)
    return "\n".join(para.text for para in doc.paragraphs if para.text.strip() != "")


def _read_slides(file_path):
    """Return the text of every shape that exposes ``.text``, newline-separated."""
    prs = Presentation(file_path)
    return "\n".join(
        shape.text
        for slide in prs.slides
        for shape in slide.shapes
        if hasattr(shape, "text")
    )


def _read_spreadsheet(file_path):
    """Render every sheet of a workbook as a titled plain-text table."""
    dfs = pd.read_excel(file_path, sheet_name=None)  # sheet_name=None -> all sheets
    return "\n\n".join(
        f"Sheet: {name}\n{df.to_string(index=False)}" for name, df in dfs.items()
    )


# Lower-cased extension -> extractor. Anything not listed is read as plain text.
# NOTE(review): the legacy extensions (.doc, .ppt) are routed to the same
# readers as before; confirm those libraries can actually open them.
_TEXT_EXTRACTORS = {
    '.txt': _read_plain_text,
    '.pdf': _read_pdf,
    '.doc': _read_word,
    '.docx': _read_word,
    '.ppt': _read_slides,
    '.pptx': _read_slides,
    '.xls': _read_spreadsheet,
    '.xlsx': _read_spreadsheet,
}


def get_file_text(file_path):
    """Extract the textual content of a file based on its extension.

    Args:
        file_path: Path of the file to read.

    Returns:
        The extracted text, or ``None`` when the file could not be read or
        parsed (the error is printed, not raised).
    """
    ext = os.path.splitext(file_path)[1].lower()
    extractor = _TEXT_EXTRACTORS.get(ext, _read_plain_text)
    try:
        return extractor(file_path)
    except Exception as e:
        # Best-effort boundary: callers treat None as "could not process".
        print(f"Error reading file ({ext}): {e}")
        return None

def search_database(query):
    """Find indexed files whose name or type contains ``query``.

    The text is matched literally: ``%`` and ``_`` typed by the user are
    escaped so they are not interpreted as SQL LIKE wildcards.

    Args:
        query: Substring to look for in ``file_name`` or ``file_type``.

    Returns:
        A list of ``(id, file_name, path, file_type)`` tuples.
    """
    # Escape the escape character first, then the two LIKE wildcards.
    escaped = (
        query.replace("\\", "\\\\").replace("%", "\\%").replace("_", "\\_")
    )
    pattern = f"%{escaped}%"

    conn = sqlite3.connect(r"file_database.db")
    try:
        cursor = conn.cursor()
        cursor.execute(
            """SELECT id, file_name, path, file_type FROM files
            WHERE file_name LIKE ? ESCAPE '\\' OR file_type LIKE ? ESCAPE '\\'""",
            (pattern, pattern),
        )
        return cursor.fetchall()
    finally:
        # Always release the connection, even when the query raises.
        conn.close()

@app.route('/')
def index():
    """Render the landing page template."""
    landing_page = render_template('index.html')
    return landing_page

@app.route('/search')
def search():
    """Render the result page for the ``q`` query-string parameter.

    An absent or empty ``q`` skips the database lookup and renders an empty
    result list.
    """
    term = request.args.get('q', '')
    matches = [] if not term else search_database(term)
    return render_template('result.html', results=matches)

@app.route('/open/<path:file_path>')
def open_file(file_path):
    """Open ``file_path`` on the host via ``os.startfile``.

    Returns an empty 204 response on success, or the exception text with
    status 500 when opening fails.
    """
    # NOTE(review): the path comes straight from the request URL and is
    # opened as-is; confirm this endpoint is only reachable locally.
    try:
        os.startfile(file_path)
    except Exception as exc:
        return str(exc), 500
    return "", 204

@app.route('/summary/<path:file_path>')
def summary_file(file_path):
    """Render the summary page for ``file_path``.

    The template receives the full path plus its final component as the
    display name.
    """
    display_name = os.path.basename(file_path)
    return render_template(
        'summary.html',
        file_name=display_name,
        file_path=file_path,
    )

@app.route('/stream-summary', methods=['POST'])
def stream_summary():
    """Stream a model-generated summary of the posted file as plain text.

    Reads the ``file_path`` form field, extracts the file's text with
    ``get_file_text`` and streams the generated summary chunk by chunk.

    Returns:
        A 400 response when no text could be extracted, otherwise a streaming
        ``text/plain`` response. Errors raised during generation are emitted
        in-band as an ``Error: ...`` chunk.
    """
    file_path = request.form['file_path']

    file_text = get_file_text(file_path)
    if not file_text:
        return Response("Error processing file", status=400)

    def generate():
        try:
            prompt = f"请总结以下文本: {file_text}"
            messages = [{"role": "user", "content": prompt}]

            text = tokenizer.apply_chat_template(
                messages,
                tokenize=False,
                add_generation_prompt=True,
            )

            inputs = tokenizer(text, return_tensors="pt").to(device)

            # skip_prompt keeps the echoed prompt (i.e. the whole file text)
            # out of the response; skip_special_tokens is forwarded to
            # tokenizer.decode so control tokens are not shown to the user.
            streamer = TextIteratorStreamer(
                tokenizer,
                skip_prompt=True,
                skip_special_tokens=True,
            )

            generation_kwargs = dict(
                inputs,
                streamer=streamer,
                max_new_tokens=1024,
                temperature=0.7,
                top_p=0.9,
                do_sample=True,
                pad_token_id=tokenizer.eos_token_id,
                eos_token_id=tokenizer.eos_token_id,
            )

            worker_errors = []

            def run_generation():
                # Runs in the worker thread. If generate() raises, the streamer
                # would never receive its end-of-stream signal and the loop
                # below would block forever, so close it explicitly.
                try:
                    model.generate(**generation_kwargs)
                except Exception as exc:
                    worker_errors.append(exc)
                    streamer.end()

            thread = threading.Thread(target=run_generation)
            thread.start()

            # Forward chunks untouched: stripping each chunk removed the
            # spaces and newlines between words, and splitting on '.' broke
            # decimals and abbreviations.
            for new_text in streamer:
                if new_text:
                    yield new_text

            thread.join()

            if worker_errors:
                yield f"Error: {str(worker_errors[0])}"

        except Exception as e:
            yield f"Error: {str(e)}"

    return Response(stream_with_context(generate()), mimetype="text/plain")

if __name__ == '__main__':
    # Launch the companion executable only when no process of that name exists.
    if not any(proc.info['name'] == "app.exe"
               for proc in psutil.process_iter(attrs=['name'])):
        run()
    # Give the server a moment to start before opening the browser.
    threading.Timer(1.5, open_browser).start()
    # The reloader re-executes this module in a child process, which would
    # load the model a second time and open a second browser tab; disable it.
    # NOTE(review): debug=True also enables the interactive debugger; confirm
    # that is intended outside of development.
    app.run(debug=True, use_reloader=False)

summary.html
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>总结</title>
    <link rel="icon" href="{{ url_for('static', filename='img/logo_icon.ico') }}" type="image/x-icon">
    <!-- The opening style tag was missing, so the rules below were rendered as page text. -->
    <style>
        body {
            background: #e3f1fb;
            font-family: "Inter-Regular", sans-serif;
        }

        .container {
            max-width: 1280px;
            margin: 0 auto;
            padding: 20px;
            display: flex;
            flex-direction: column;
            align-items: center;
        }

        .search-container {
            display: flex;
            align-items: center;
            gap: 20px;
            margin-bottom: 30px;
        }

        .search-box {
            background: #ffffff;
            border-radius: 29px;
            width: 400px;
            height: 57px;
            padding: 10px 20px;
        }

        .search-btn {
            background: #3a7fff;
            border-radius: 29px;
            width: 143px;
            height: 57px;
            display: flex;
            align-items: center;
            justify-content: center;
            color: #ffffff;
            font-size: 20px;
            cursor: pointer;
        }

        .logo {
            width: 195px;
            margin-bottom: 20px;
        }

        .file-info {
            background: #ffffff;
            border-radius: 15px;
            width: 100%;
            padding: 20px;
            margin-bottom: 20px;
            display: flex;
            justify-content: space-between;
            align-items: center;
        }

        .summary-container {
            background: #ffffff;
            border-radius: 15px;
            width: 100%;
            min-height: 550px;
            padding: 20px;
        }

        .open-btn {
            background: #3a7fff;
            border-radius: 29px;
            width: 143px;
            height: 57px;
            display: flex;
            align-items: center;
            justify-content: center;
            color: #ffffff;
            font-size: 20px;
            cursor: pointer;
        }

        .streaming-content {
            white-space: pre-wrap;
            padding: 20px;
            border: 1px solid #ccc;
            margin: 20px;
        }
    </style>
</head>
<body>
<div class="container">
    <img class="logo" src="{{ url_for('static', filename='img/logo.svg') }}" alt="Logo" />
    <div class="search-container">
        <input type="text" class="search-box" id="searchBox" placeholder="搜索...">
        <div class="search-btn" onclick="search()">搜索</div>
    </div>
    <div class="file-info">
        <span>{{ file_name }}</span>
        <a class="open-btn" href="{{ url_for('open_file', file_path=file_path) }}">打开</a>
    </div>
    <div class="summary-container">
        <h3>总结:</h3>
        <!-- The class hooks up the .streaming-content rule (pre-wrap keeps the
             line breaks of the streamed text); the id is what the script looks up. -->
        <div id="streaming-content" class="streaming-content"></div>
    </div>
</div>
<script>
    // Handle search functionality: Enter in the search box behaves like the button.
    document.getElementById('searchBox').addEventListener('keypress', function (event) {
        if (event.key === 'Enter') {
            search();
        }
    });

    function search() {
        let query = document.getElementById('searchBox').value;
        if (query.trim() === '') return;
        // Encode the query so characters such as &, # or % survive the URL.
        window.location.href = `/search?q=${encodeURIComponent(query)}`;
    }

    const streamingContent = document.getElementById('streaming-content');

    // Normalise backslashes to forward slashes; tojson emits a correctly
    // quoted and escaped JavaScript string literal.
    const filePath = {{ file_path|replace('\\', '/')|tojson }};

    fetch('/stream-summary', {
        method: 'POST',
        body: new URLSearchParams({ file_path: filePath }),
        headers: { 'Content-Type': 'application/x-www-form-urlencoded' }
    })
        .then(response => {
            const reader = response.body.getReader();
            // One decoder in streaming mode, so a multi-byte UTF-8 character
            // split across two network chunks is decoded correctly.
            const decoder = new TextDecoder();

            function readStream() {
                // Return the promise so read errors reach the .catch below.
                return reader.read().then(({ done, value }) => {
                    if (done) {
                        // Flush any bytes still buffered inside the decoder.
                        streamingContent.textContent += decoder.decode();
                        return;
                    }
                    // Append the new chunk of text to the streaming content.
                    streamingContent.textContent += decoder.decode(value, { stream: true });
                    return readStream(); // Continue reading the stream
                });
            }

            return readStream();
        })
        .catch(error => {
            console.error("Error:", error);
            // Build the node and set textContent so the message is never parsed as HTML.
            const errorBox = document.createElement('div');
            errorBox.className = 'error';
            errorBox.textContent = `Error: ${error.message}`;
            streamingContent.replaceChildren(errorBox);
        });
</script>
</body>
</html>

Langchain Onepager
No ratings yet
Langchain Onepager
1 page
CS FINAL - Pagenumber
No ratings yet
CS FINAL - Pagenumber
31 pages
Cs For Pranav
No ratings yet
Cs For Pranav
29 pages
FK Jayanth
No ratings yet
FK Jayanth
21 pages
Sourcecode
No ratings yet
Sourcecode
16 pages
Sns 1 Design A Simple Web Page
No ratings yet
Sns 1 Design A Simple Web Page
8 pages
Chatbot CA
No ratings yet
Chatbot CA
20 pages
Web Designing File
No ratings yet
Web Designing File
50 pages
Advance Python
No ratings yet
Advance Python
202 pages
App 2
No ratings yet
App 2
10 pages
365careers - AI - Eng - Bootcamp, Ai, 365careers, Udemy
No ratings yet
365careers - AI - Eng - Bootcamp, Ai, 365careers, Udemy
89 pages
Index
No ratings yet
Index
28 pages
Code
No ratings yet
Code
18 pages
WCA Faceplate Analog en
No ratings yet
WCA Faceplate Analog en
71 pages
Trip Planner Example
No ratings yet
Trip Planner Example
7 pages
DR Prompt Bolt
No ratings yet
DR Prompt Bolt
5 pages
Gen Ai 7,8,9,10
No ratings yet
Gen Ai 7,8,9,10
7 pages
Also For The Webpage Code, Could You Style It Up A
No ratings yet
Also For The Webpage Code, Could You Style It Up A
8 pages
01 Functional Requirements CV Projects-3
No ratings yet
01 Functional Requirements CV Projects-3
7 pages
Ai Lab 02
No ratings yet
Ai Lab 02
12 pages
Big Data Front Page
No ratings yet
Big Data Front Page
68 pages
AI驱动的前端开发
No ratings yet
AI驱动的前端开发
13 pages
Data Engineering Concepts #2 - Sending Data Using An API - by Bar Dadon - Dev Genius
No ratings yet
Data Engineering Concepts #2 - Sending Data Using An API - by Bar Dadon - Dev Genius
14 pages
Sans Titre
No ratings yet
Sans Titre
11 pages
Ceragon FibeAir IP-10G IP-10E User Guide 20120601 Rev A.01
No ratings yet
Ceragon FibeAir IP-10G IP-10E User Guide 20120601 Rev A.01
577 pages
Also For The Webpage Code, Could You Style It Up A
No ratings yet
Also For The Webpage Code, Could You Style It Up A
7 pages
Project Report Final
No ratings yet
Project Report Final
16 pages
Zref
No ratings yet
Zref
8 pages
How I Automated My Workflow With AI Agent Teams (NO-CODE)
No ratings yet
How I Automated My Workflow With AI Agent Teams (NO-CODE)
8 pages
Another Hack Test3
No ratings yet
Another Hack Test3
4 pages
Duckduckgo Download
No ratings yet
Duckduckgo Download
3 pages
Assignment 1
No ratings yet
Assignment 1
5 pages
Assignment 2
No ratings yet
Assignment 2
20 pages
Synopsis
No ratings yet
Synopsis
3 pages
AI ML Fullstack Career Roadmap
No ratings yet
AI ML Fullstack Career Roadmap
9 pages
Build A Perplexity Clone in 8min With AI
No ratings yet
Build A Perplexity Clone in 8min With AI
3 pages
AI ML Engineering Topics Updated With 2 Pages
No ratings yet
AI ML Engineering Topics Updated With 2 Pages
6 pages
Assignment
No ratings yet
Assignment
2 pages
Full Process For Coding With AI Coding Assistants
No ratings yet
Full Process For Coding With AI Coding Assistants
9 pages
Index 572
No ratings yet
Index 572
3 pages
Angular Notes PDF
No ratings yet
Angular Notes PDF
3 pages
Library CSE Book
No ratings yet
Library CSE Book
53 pages
Module 4 Lesson 2 Updated
No ratings yet
Module 4 Lesson 2 Updated
24 pages
Web Development
No ratings yet
Web Development
6 pages
1-Object Oriented Programming Development-University of Luton
100% (1)
1-Object Oriented Programming Development-University of Luton
21 pages
A Step by Step Guide To Using GarageBand
No ratings yet
A Step by Step Guide To Using GarageBand
20 pages
Institute (School) Management System - Daffodil 151-40-216
No ratings yet
Institute (School) Management System - Daffodil 151-40-216
55 pages
C Programming 3
No ratings yet
C Programming 3
28 pages
Manual de Intraweb
No ratings yet
Manual de Intraweb
131 pages
04 1 Ufs
No ratings yet
04 1 Ufs
18 pages
Module 16a NTP
No ratings yet
Module 16a NTP
10 pages
BAB 5 Perancangan Output, Input Dan Antaramuka
No ratings yet
BAB 5 Perancangan Output, Input Dan Antaramuka
97 pages
ENCh 03
No ratings yet
ENCh 03
56 pages
Total Station Procedure
No ratings yet
Total Station Procedure
10 pages
ICE360S - Laravel Blog Design Project - April 2024
No ratings yet
ICE360S - Laravel Blog Design Project - April 2024
3 pages
Database
No ratings yet
Database
15 pages
TouchChip TCESC4K Module
No ratings yet
TouchChip TCESC4K Module
2 pages
C Series Quick Guide of Fingerprint T&A
No ratings yet
C Series Quick Guide of Fingerprint T&A
6 pages
Software Project Concept
No ratings yet
Software Project Concept
5 pages
Sitev 3
No ratings yet
Sitev 3
7 pages
JD - GET - Tech
No ratings yet
JD - GET - Tech
3 pages
Bharath Resume
No ratings yet
Bharath Resume
3 pages
DS NetworkSpace2 en
No ratings yet
DS NetworkSpace2 en
3 pages
CELF Part 2
No ratings yet
CELF Part 2
5 pages
Pacemaker Editor Shortcuts Windows
No ratings yet
Pacemaker Editor Shortcuts Windows
2 pages
Essential n8n Playbook
From Everand
Essential n8n Playbook
Leandro Calado
No ratings yet
HTML5 Reference: An Alphabetical Guide
From Everand
HTML5 Reference: An Alphabetical Guide
Jo Foster
No ratings yet
React Portfolio App Development: Increase your online presence and create your personal brand
From Everand
React Portfolio App Development: Increase your online presence and create your personal brand
Abdelfattah Ragab
No ratings yet
Simplifying Data Science With Python
From Everand
Simplifying Data Science With Python
Billy David millican
No ratings yet
Angular Shopping Store: From Scratch to Successful Payment
From Everand
Angular Shopping Store: From Scratch to Successful Payment
Abdelfattah Ragab
No ratings yet
50 Recipes for Programming Node.js
From Everand
50 Recipes for Programming Node.js
Jamie Munro
3/5 (4)
Firebase Storage for Angular: A reliable file upload solution for your applications
From Everand
Firebase Storage for Angular: A reliable file upload solution for your applications
Abdelfattah Ragab
No ratings yet
Angular Generative AI: Building an intelligent CV enhancer with Google Gemini
From Everand
Angular Generative AI: Building an intelligent CV enhancer with Google Gemini
Abdelfattah Ragab
No ratings yet
NgRx SignalStore: An effortless solution for state management
From Everand
NgRx SignalStore: An effortless solution for state management
Abdelfattah Ragab
No ratings yet
Quick Python Guide
From Everand
Quick Python Guide
Coder1
No ratings yet
10 Lessons in Front-end
From Everand
10 Lessons in Front-end
Krasimir Tsonev
2/5 (1)
How to a Developers Guide to 4k: Developer edition, #3
From Everand
How to a Developers Guide to 4k: Developer edition, #3
Xinc Cyberwizard
No ratings yet
Introduction to PHP, Part 4, Second Edition
From Everand
Introduction to PHP, Part 4, Second Edition
Adam Majczak
No ratings yet
Introduction to PHP, Part 2, Second Edition
From Everand
Introduction to PHP, Part 2, Second Edition
Adam Majczak
No ratings yet
Introduction to PHP, Part 5, Second Edition
From Everand
Introduction to PHP, Part 5, Second Edition
Adam Majczak
No ratings yet
Ajax in One Hour, For Beginners, Learn Coding Fast
From Everand
Ajax in One Hour, For Beginners, Learn Coding Fast
Ray Yao
No ratings yet
C++ Functions and tutorial
From Everand
C++ Functions and tutorial
Nino Paiotta
No ratings yet
Mastering JavaScript: The Complete Guide to JavaScript Mastery
From Everand
Mastering JavaScript: The Complete Guide to JavaScript Mastery
Tim Robards
5/5 (1)
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet
Inspiring Powershell Articles
From Everand
Inspiring Powershell Articles
Murat Yildirimoglu
No ratings yet
PHP Interview Questions, Answers, and Explanations: PHP Certification Review: PHP FAQ
From Everand
PHP Interview Questions, Answers, and Explanations: PHP Certification Review: PHP FAQ
equitypress
No ratings yet
UNIX Shell Programming Interview Questions You'll Most Likely Be Asked
From Everand
UNIX Shell Programming Interview Questions You'll Most Likely Be Asked
Vibrant Publishers
No ratings yet

App

Uploaded by

App

Uploaded by

backend code:

from flask import Flask, render_template, request, jsonify, Response,

# Initialize Flask app

elif ext == '.pdf':

elif ext in ['.doc', '.docx']:

elif ext in ['.ppt', '.pptx']:

elif ext in ['.xls', '.xlsx']:

inputs = tokenizer(text, return_tensors="pt").to(device)

return Response(stream_with_context(generate()), mimetype="text/plain")

const streamingContent = document.getElementById('streaming-content');

You might also like