DeepResearchEvaluator

Running on CPU Upgrade

App Files Files Community

DeepResearchEvaluator / backup3.app.py

awacke1

Rename app.py to backup3.app.py

f51a852 verified about 1 month ago

raw

history blame

22.4 kB

	#!/usr/bin/env python3

	import os
	import re
	import glob
	import json
	import base64
	import zipfile
	import random
	import requests
	import openai
	from PIL import Image
	from urllib.parse import quote

	import streamlit as st
	import streamlit.components.v1 as components

	# If you do model inference via huggingface_hub:
	from huggingface_hub import InferenceClient

	# ----------------------------
	# Configurable BASE_URL
	# ----------------------------
	# Root URL of the hosting Space; inject_base_url() prepends it to relative links.
	BASE_URL = "https://huggingface.co/spaces/awacke1/MermaidMarkdownDiagramEditor"

	# Prompt prefixes. PromptPrefix is prepended to URL search queries in main();
	# all three are URL-quoted into the glossary links built by display_glossary_entity(),
	# and PromptPrefix2 is also used by FileSidebar() for its "search" view.
	PromptPrefix = "AI-Search: "
	PromptPrefix2 = "AI-Refine: "
	PromptPrefix3 = "AI-JS: "

	# Sample role-playing glossary, shaped as topic -> game system -> list of titles.
	# display_buttons_with_scores() walks this structure to build its score buttons.
	roleplaying_glossary = {
	    "Core Rulebooks": {
	        "Dungeons and Dragons": [
	            "Player's Handbook",
	            "Dungeon Master's Guide",
	            "Monster Manual",
	        ],
	        "GURPS": [
	            "Basic Set Characters",
	            "Basic Set Campaigns",
	        ],
	    },
	    "Campaigns & Adventures": {
	        "Pathfinder": [
	            "Rise of the Runelords",
	            "Curse of the Crimson Throne",
	        ],
	    },
	}

	# Sample transhumanism glossary, shaped as category -> list of terms.
	# display_content_or_image() searches these terms for a URL-supplied query.
	transhuman_glossary = {
	    "Neural Interfaces": [
	        "Cortex Jack",
	        "Mind-Machine Fusion",
	    ],
	    "Cybernetics": [
	        "Robotic Limbs",
	        "Augmented Eyes",
	    ],
	}

	# Simple function stubs
	def process_text(text):
	    """Placeholder text handler: echo the received text to the page."""
	    st.write(f"process_text called with: {text}")

	def search_arxiv(text):
	    """Placeholder arXiv search: echo the received text to the page."""
	    st.write(f"search_arxiv called with: {text}")

	def SpeechSynthesis(text):
	    """Placeholder speech synthesis: echo the received text to the page."""
	    st.write(f"SpeechSynthesis called with: {text}")

	def process_image(image_file, prompt):
	    """
	    Placeholder image handler.

	    Returns a string naming the image file and the prompt it was given;
	    no image processing is performed.
	    """
	    return f"[process_image placeholder] Processing {image_file} with prompt: {prompt}"

	def process_video(video_file, seconds_per_frame):
	    """Placeholder video handler: echo the file name and sampling interval to the page."""
	    st.write(f"[process_video placeholder] Video: {video_file}, seconds/frame: {seconds_per_frame}")

	# Stub if you have a Hugging Face endpoint
	# NOTE(review): both values are placeholders and nothing in the visible code reads
	# them. If a real endpoint is wired in, load the token from the environment or from
	# Streamlit secrets instead of committing it to the source file.
	API_URL = "https://huggingface-inference-endpoint-placeholder"
	API_KEY = "hf_XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX"

	@st.cache_resource
	def InferenceLLM(prompt):
	    """
	    Placeholder LLM call.

	    Returns a fixed-format string that embeds *prompt*; no model is invoked.
	    The result is cached by Streamlit per distinct prompt.
	    """
	    return f"[InferenceLLM placeholder response to prompt: {prompt}]"

	# ------------------------------------------
	# Glossary & File Utility
	# ------------------------------------------
	@st.cache_resource
	def display_glossary_entity(k):
	    """
	    Render one glossary entity followed by a row of emoji search links.

	    The first four links point back at this app (``/?q=...``), the last three
	    of them tagged with a URL-quoted prompt prefix; the remaining links go to
	    Wikipedia, Google, Bing, YouTube and Twitter searches for the entity.

	    Args:
	        k: The entity name; it is shown verbatim and URL-quoted into each link.
	    """
	    term = quote(k)
	    # Insertion order is the display order of the links.
	    link_targets = {
	        "🚀🌌ArXiv": f"/?q={term}",
	        "🃏Analyst": f"/?q={term}-{quote(PromptPrefix)}",
	        "📚PyCoder": f"/?q={term}-{quote(PromptPrefix2)}",
	        "🔬JSCoder": f"/?q={term}-{quote(PromptPrefix3)}",
	        "📖": f"https://en.wikipedia.org/wiki/{term}",
	        "🔍": f"https://www.google.com/search?q={term}",
	        "🔎": f"https://www.bing.com/search?q={term}",
	        "🎥": f"https://www.youtube.com/results?search_query={term}",
	        "🐦": f"https://twitter.com/search?q={term}",
	    }
	    links_md = ' '.join(f"[{label}]({target})" for label, target in link_targets.items())
	    st.markdown(f"{k} <small>{links_md}</small>", unsafe_allow_html=True)

	def display_content_or_image(query):
	    """
	    Show the first transhuman glossary term containing *query*, else a local image.

	    The glossary is searched case-insensitively by substring. If nothing
	    matches, ``images/<query>.png`` is shown when it exists.

	    Args:
	        query: Search text; main() passes the value of the ``query`` URL parameter.

	    Returns:
	        True if a term or an image was displayed, False otherwise (a warning
	        is shown in that case).
	    """
	    # A blank query is a substring of every term, so it would always "match"
	    # the first glossary entry; treat it as no match instead.
	    if not query or not query.strip():
	        st.warning("No matching content or image found.")
	        return False

	    needle = query.lower()
	    for category, term_list in transhuman_glossary.items():
	        for term in term_list:
	            if needle in term.lower():
	                st.subheader(f"Found in {category}:")
	                st.write(term)
	                return True

	    # The query comes from the URL, so only accept a bare file name here;
	    # anything with a directory component could point outside images/.
	    if os.path.basename(query) == query:
	        image_path = f"images/{query}.png"
	        if os.path.exists(image_path):
	            st.image(image_path, caption=f"Image for {query}")
	            return True

	    st.warning("No matching content or image found.")
	    return False

	def clear_query_params():
	    """
	    Tell the user how to clear the URL parameters.

	    This is a stub: it does not modify the URL, it only shows a warning.
	    main() calls it when the URL carries ``action=clear``.
	    """
	    st.warning("Define a redirect or link without query params if you want to truly clear them.")

	# -----------------------
	# File Handling
	# -----------------------
	def load_file(file_path):
	    """
	    Read a UTF-8 text file and return its contents.

	    Args:
	        file_path: Path of the file to read.

	    Returns:
	        The file's text, or "" when the file cannot be opened or is not
	        valid UTF-8. Callers treat an empty string as "nothing to show".
	    """
	    try:
	        with open(file_path, "r", encoding='utf-8') as f:
	            return f.read()
	    except (OSError, ValueError):
	        # OSError: missing/unreadable file. ValueError: undecodable bytes
	        # (UnicodeDecodeError) or an invalid path string.
	        return ""

	def create_zip_of_files(files):
	    """
	    Write *files* into a zip archive in the current directory.

	    The archive is rebuilt on every call. It is deliberately not cached:
	    a cached result would skip the rebuild for an unchanged file list and
	    keep serving an archive with outdated file contents.

	    Args:
	        files: Paths of the files to add.

	    Returns:
	        The archive's file name.
	    """
	    zip_name = "Arxiv-Paper-Search-QA-RAG-Streamlit-Gradio-AP.zip"
	    with zipfile.ZipFile(zip_name, 'w') as zipf:
	        for file in files:
	            zipf.write(file)
	    return zip_name

	def get_zip_download_link(zip_file):
	    """
	    Build an HTML download link that embeds *zip_file* as a base64 data URI.

	    The file is re-read on every call. It is deliberately not cached: the
	    archive name never changes, so a cache keyed on it would keep returning
	    the bytes of the first archive ever built.

	    Args:
	        zip_file: Path of the archive; also used as the suggested download name.

	    Returns:
	        An ``<a>`` element as a string.
	    """
	    with open(zip_file, 'rb') as f:
	        payload = f.read()
	    b64 = base64.b64encode(payload).decode()
	    return f'<a href="data:application/zip;base64,{b64}" download="{zip_file}">Download All</a>'

	def get_table_download_link(file_path):
	    """
	    Build an HTML download link that embeds one file as a base64 data URI.

	    The file is read as raw bytes, so binary types in the MIME table (such
	    as .wav) work as well as text files.

	    Args:
	        file_path: Path of the file to embed.

	    Returns:
	        An ``<a>`` element as a string, labelled with the file's base name,
	        or '' when the file cannot be read.
	    """
	    mime_map = {
	        '.txt': 'text/plain',
	        '.py': 'text/plain',
	        '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
	        '.csv': 'text/plain',
	        '.htm': 'text/html',
	        '.md': 'text/markdown',
	        '.wav': 'audio/wav'
	    }
	    try:
	        with open(file_path, 'rb') as file:
	            payload = file.read()
	    except OSError:
	        return ''

	    b64 = base64.b64encode(payload).decode()
	    file_name = os.path.basename(file_path)
	    # Match the extension case-insensitively so "NOTES.MD" is still markdown.
	    ext = os.path.splitext(file_name)[1].lower()
	    mime_type = mime_map.get(ext, 'application/octet-stream')
	    return f'<a href="data:{mime_type};base64,{b64}" target="_blank" download="{file_name}">{file_name}</a>'

	def get_file_size(file_path):
	    """Return the size of *file_path* in bytes (raises OSError if it is missing)."""
	    return os.path.getsize(file_path)

	def _remove_if_present(path):
	    """Delete *path*, tolerating a file that has already been removed."""
	    try:
	        os.remove(path)
	    except FileNotFoundError:
	        pass


	def FileSidebar():
	    """
	    Render the sidebar file browser for local .md files and the selected file's view.

	    The sidebar lists every ``*.md`` file in the current directory whose
	    base name has at least five characters. Each row offers: view as
	    markdown, download link, open for editing, "search" view, and delete.
	    "Delete All" and a zip "Download" sit above the list.

	    A Streamlit button is only True during the run triggered by its click.
	    The selected file and action are therefore remembered in
	    ``st.session_state`` so that the buttons inside a view (Save, Re-Code,
	    Run) still find their view on the rerun that their own click causes.
	    """
	    # Only list markdown files whose base name has at least five characters.
	    all_files = [f for f in glob.glob("*.md") if len(os.path.splitext(f)[0]) >= 5]
	    all_files.sort(key=lambda x: (os.path.splitext(x)[1], x), reverse=True)

	    Files1, Files2 = st.sidebar.columns(2)
	    with Files1:
	        if st.button("🗑 Delete All"):
	            for file in all_files:
	                _remove_if_present(file)
	            st.rerun()
	    with Files2:
	        if st.button("⬇️ Download"):
	            zip_file = create_zip_of_files(all_files)
	            st.sidebar.markdown(get_zip_download_link(zip_file), unsafe_allow_html=True)

	    # At most one row button can be True in a given run.
	    clicked_file = ''
	    clicked_action = ''
	    for file in all_files:
	        col1, col2, col3, col4, col5 = st.sidebar.columns([1, 6, 1, 1, 1])
	        with col1:
	            if st.button("🌐", key="md_" + file):
	                clicked_file, clicked_action = file, 'md'
	        with col2:
	            st.markdown(get_table_download_link(file), unsafe_allow_html=True)
	        with col3:
	            if st.button("📂", key="open_" + file):
	                clicked_file, clicked_action = file, 'open'
	        with col4:
	            if st.button("▶️", key="read_" + file):
	                clicked_file, clicked_action = file, 'search'
	        with col5:
	            if st.button("🗑", key="delete_" + file):
	                _remove_if_present(file)
	                st.rerun()

	    freshly_clicked = bool(clicked_action)
	    if freshly_clicked:
	        file_name = clicked_file
	        next_action = clicked_action
	        file_contents = load_file(file_name)
	        st.session_state['next_action'] = next_action
	        st.session_state['sidebar_active_file'] = file_name
	        if next_action == 'open':
	            st.session_state['lastfilename'] = file_name
	            st.session_state['filename'] = file_name
	            st.session_state['filetext'] = file_contents
	    else:
	        # No row button this run: restore the previous selection, but only
	        # while the file is still one of the listed files.
	        file_name = st.session_state.get('sidebar_active_file', '')
	        next_action = st.session_state.get('next_action', '')
	        file_contents = load_file(file_name) if file_name in all_files else ''

	    # Nothing selected, or the selected file is empty/unreadable.
	    if not file_contents:
	        return

	    if next_action == 'open':
	        open1, open2 = st.columns([0.8, 0.2])
	        with open1:
	            file_name_input = st.text_input('File Name:', file_name, key='file_name_input')
	            file_content_area = st.text_area('File Contents:', file_contents, height=300, key='file_content_area')

	            if st.button('💾 Save File'):
	                with open(file_name_input, 'w', encoding='utf-8') as f:
	                    f.write(file_content_area)
	                st.markdown(f'Saved {file_name_input} successfully.')

	    elif next_action == 'search':
	        file_content_area = st.text_area("File Contents:", file_contents, height=500)
	        user_prompt = PromptPrefix2 + file_contents
	        st.markdown(user_prompt)
	        if st.button('🔍Re-Code'):
	            search_arxiv(file_contents)

	    elif next_action == 'md':
	        st.markdown(file_contents)
	        # Speak only on the click that opened the view, not on every rerun.
	        if freshly_clicked:
	            SpeechSynthesis(file_contents)
	        if st.button("🔍Run"):
	            st.write("Running GPT logic placeholder...")

	# ---------------------------
	# Scoring / Glossaries
	# ---------------------------
	# Directory holding one JSON score file per key (written by update_score,
	# read by load_score). It is created at import time, so update_score can
	# open files for writing without creating the directory first.
	score_dir = "scores"
	os.makedirs(score_dir, exist_ok=True)

	def generate_key(label, header, idx):
	    """Return the key string ``"<header>_<label>_<idx>_key"`` for the given parts."""
	    return f"{header}_{label}_{idx}_key"

	def update_score(key, increment=1):
	    """
	    Add *increment* to the stored click count and score for *key*.

	    Each key has its own JSON file ``<score_dir>/<key>.json`` holding
	    ``{"clicks": ..., "score": ...}``. A missing file, or one that cannot be
	    parsed as a JSON object, is treated as zero counts so that a damaged
	    file does not make every later click fail.

	    Args:
	        key: Identifier of the scored item; used as the file name.
	        increment: Amount added to both counters.

	    Returns:
	        The updated score.
	    """
	    score_file = os.path.join(score_dir, f"{key}.json")
	    score_data = {"clicks": 0, "score": 0}
	    try:
	        with open(score_file, "r") as file:
	            stored = json.load(file)
	    except (FileNotFoundError, ValueError):
	        # ValueError covers json.JSONDecodeError and undecodable bytes.
	        stored = None
	    if isinstance(stored, dict):
	        score_data.update(stored)

	    score_data["clicks"] += increment
	    score_data["score"] += increment
	    with open(score_file, "w") as file:
	        json.dump(score_data, file)
	    return score_data["score"]

	def load_score(key):
	    """
	    Return the stored score for *key*.

	    Reads ``<score_dir>/<key>.json``. Returns 0 when the file is missing,
	    cannot be parsed as a JSON object, or has no "score" entry.
	    """
	    file_path = os.path.join(score_dir, f"{key}.json")
	    try:
	        with open(file_path, "r") as file:
	            score_data = json.load(file)
	    except (FileNotFoundError, ValueError):
	        # ValueError covers json.JSONDecodeError and undecodable bytes.
	        return 0
	    if not isinstance(score_data, dict):
	        return 0
	    return score_data.get("score", 0)

	def display_buttons_with_scores(num_columns_text):
	    """
	    Show every roleplaying glossary title as a button that increments its score.

	    One heading is written per topic, then one button per title. The button
	    label ends with the score loaded before the click; a click stores the
	    incremented score and writes a confirmation line with the new value.

	    Args:
	        num_columns_text: Accepted for callers that pass a column count;
	            this function does not use it.
	    """
	    game_emojis = {
	        "Dungeons and Dragons": "🐉",
	        "Call of Cthulhu": "🐙",
	        "GURPS": "🎲",
	        "Pathfinder": "🗺️",
	        "Kindred of the East": "🌅",
	        "Changeling": "🍃",
	    }
	    topic_emojis = {
	        "Core Rulebooks": "📚",
	        "Maps & Settings": "🗺️",
	        "Game Mechanics & Tools": "⚙️",
	        "Monsters & Adversaries": "👹",
	        "Campaigns & Adventures": "📜",
	        "Creatives & Assets": "🎨",
	        "Game Master Resources": "🛠️",
	        "Lore & Background": "📖",
	        "Character Development": "🧍",
	        "Homebrew Content": "🔧",
	        "General Topics": "🌍",
	    }

	    for category, games in roleplaying_glossary.items():
	        category_emoji = topic_emojis.get(category, "🔍")
	        st.markdown(f"## {category_emoji} {category}")
	        for game, terms in games.items():
	            game_emoji = game_emojis.get(game, "🎮")
	            for term in terms:
	                # Strip '?' once, up front, so the score is loaded from the
	                # same file that a click writes to.
	                key = f"{category}_{game}_{term}".replace(' ', '_').lower().replace('?', '')
	                score_val = load_score(key)
	                if st.button(f"{game_emoji} {category} {game} {term} {score_val}", key=key):
	                    newscore = update_score(key)
	                    st.markdown(f"Scored {category} - {game} - {term} -> {newscore}")

	# -------------------------------
	# Image & Video
	# -------------------------------
	def display_images_and_wikipedia_summaries(num_columns=4):
	    """
	    Show every .png in the current directory in a grid, with links and a prompt box.

	    Images are ordered by the length of the file name up to its first dot
	    and placed round-robin into *num_columns* columns. Under each image the
	    glossary links for that name are shown, plus a text input whose value,
	    when non-empty, is passed to process_image() and the result displayed.

	    Args:
	        num_columns: Number of grid columns; must be at least 1.
	    """
	    image_files = [f for f in os.listdir('.') if f.endswith('.png')]
	    if not image_files:
	        st.write("No PNG images found in the current directory.")
	        return

	    image_files_sorted = sorted(image_files, key=lambda x: len(x.split('.')[0]))
	    cols = st.columns(num_columns)

	    for col_index, image_file in enumerate(image_files_sorted):
	        with cols[col_index % num_columns]:
	            # Guard only the open/display step; the context manager closes
	            # the file handle once the image has been handed to Streamlit.
	            try:
	                with Image.open(image_file) as image:
	                    st.image(image, use_column_width=True)
	            except (OSError, ValueError):
	                st.write(f"Could not open {image_file}")
	                continue

	            k = image_file.split('.')[0]
	            display_glossary_entity(k)
	            image_text_input = st.text_input(f"Prompt for {image_file}", key=f"image_prompt_{image_file}")
	            if image_text_input:
	                response = process_image(image_file, image_text_input)
	                st.markdown(response)

	def display_videos_and_links(num_columns=4):
	    """
	    Show every .mp4/.webm in the current directory in a grid, with links and a prompt box.

	    Videos are ordered by the length of the file name up to its first dot
	    and placed round-robin into *num_columns* columns. Under each video the
	    glossary links for that name are shown, plus a text input; a non-empty
	    value triggers process_video() with a fixed 10 seconds per frame.

	    Args:
	        num_columns: Number of grid columns; must be at least 1.
	    """
	    video_files = [f for f in os.listdir('.') if f.endswith(('.mp4', '.webm'))]
	    if not video_files:
	        st.write("No MP4 or WEBM videos found in the current directory.")
	        return

	    video_files_sorted = sorted(video_files, key=lambda x: len(x.split('.')[0]))
	    cols = st.columns(num_columns)
	    seconds_per_frame = 10

	    for col_index, video_file in enumerate(video_files_sorted):
	        with cols[col_index % num_columns]:
	            k = video_file.split('.')[0]
	            # Declare the MIME type that matches the container format.
	            mime_type = 'video/webm' if video_file.endswith('.webm') else 'video/mp4'
	            st.video(video_file, format=mime_type, start_time=0)
	            display_glossary_entity(k)
	            video_text_input = st.text_input(f"Video Prompt for {video_file}", key=f"video_prompt_{video_file}")
	            if video_text_input:
	                try:
	                    process_video(video_file, seconds_per_frame)
	                except ValueError:
	                    st.error("Invalid input for seconds per frame!")

	# --------------------------------
	# MERMAID DIAGRAM
	# --------------------------------
	def generate_mermaid_html(mermaid_code: str) -> str:
	    """
	    Wrap Mermaid source in a standalone HTML page that renders it centered.

	    The page loads Mermaid from the jsDelivr CDN and initializes it with
	    ``startOnLoad``. *mermaid_code* is inserted verbatim into the diagram
	    ``<div>``; it is not HTML-escaped.

	    Args:
	        mermaid_code: Mermaid diagram source.

	    Returns:
	        The complete HTML document as a string.
	    """
	    return f"""
	<html>
	<head>
	<script src="https://cdn.jsdelivr.net/npm/mermaid/dist/mermaid.min.js"></script>
	<style>
	.centered-mermaid {{
	display: flex;
	justify-content: center;
	margin: 20px auto;
	}}
	.mermaid {{
	max-width: 800px;
	}}
	</style>
	</head>
	<body>
	<div class="mermaid centered-mermaid">
	{mermaid_code}
	</div>
	<script>
	mermaid.initialize({{ startOnLoad: true }});
	</script>
	</body>
	</html>
	"""

	def append_model_param(url: str, model_selected: bool) -> str:
	    """
	    Append ``model=1`` to *url* when *model_selected* is true.

	    The parameter is joined with ``&`` if the URL already contains a ``?``,
	    otherwise with ``?``. The URL is returned unchanged when
	    *model_selected* is false.
	    """
	    if not model_selected:
	        return url
	    delimiter = "&" if "?" in url else "?"
	    return f"{url}{delimiter}model=1"

	def inject_base_url(url: str) -> str:
	    """
	    Turn a relative link into an absolute one under BASE_URL.

	    A URL that already starts with ``http://`` or ``https://`` (any case)
	    is returned unchanged; anything else is appended to BASE_URL as-is.
	    The scheme is checked in full so that a relative path which merely
	    begins with the letters "http" still gets the base prepended.
	    """
	    if url.lower().startswith(("http://", "https://")):
	        return url
	    return f"{BASE_URL}{url}"

	# Our default diagram, containing the "click" lines with /?q=...
	# Each `click NODE "/?q=..." TARGET` line attaches a relative link to a node;
	# main() looks for lines containing `click ` and `"/?` in order to rewrite them.
	# This is a plain (non-raw) string, so `\\n` reaches Mermaid as the two
	# characters backslash + n inside the node labels.
	DEFAULT_MERMAID = """
	flowchart LR
	U((User 😎)) -- "Talk 🗣️" --> LLM[LLM Agent 🤖\\nExtract Info]
	click U "/?q=User%20😎" _self
	click LLM "/?q=LLM%20Agent%20Extract%20Info" _blank

	LLM -- "Query 🔍" --> HS[Hybrid Search 🔎\\nVector+NER+Lexical]
	click HS "/?q=Hybrid%20Search%20Vector+NER+Lexical" _blank

	HS -- "Reason 🤔" --> RE[Reasoning Engine 🛠️\\nNeuralNetwork+Medical]
	click RE "/?q=Reasoning%20Engine%20NeuralNetwork+Medical" _blank

	RE -- "Link 📡" --> KG((Knowledge Graph 📚\\nOntology+GAR+RAG))
	click KG "/?q=Knowledge%20Graph%20Ontology+GAR+RAG" _blank
	"""

	# One Mermaid click line with a relative link, split into:
	# (1) `click NODE ` prefix, (2) the "/?..." URL, (3) the rest, e.g. ` _self`.
	_CLICK_LINK_RE = re.compile(r'^(\s*click\s+\S+\s+)"(/\?[^"]*)"(.*)$')


	def _first_query_value(params, name):
	    """Return URL parameter *name* as a string ('' if absent); lists yield their first item."""
	    value = params.get(name)
	    if value is None:
	        return ''
	    if isinstance(value, (list, tuple)):
	        return str(value[0]) if value else ''
	    return str(value)


	def _rewrite_click_links(diagram, model_selected):
	    """Make each relative click link in *diagram* absolute and optionally add model=1."""
	    new_lines = []
	    for line in diagram.strip().split("\n"):
	        match = _CLICK_LINK_RE.match(line)
	        if match is None:
	            # Not a relative click line: keep it as is.
	            new_lines.append(line)
	            continue
	        prefix, old_url, rest = match.groups()
	        new_url = append_model_param(inject_base_url(old_url), model_selected)
	        new_lines.append(f'{prefix}"{new_url}"{rest}')
	    return "\n".join(new_lines)


	def main():
	    """
	    Build the page: URL-parameter handling, Mermaid diagram, editors, galleries, files.

	    In order, the page:
	      1. Reads the ``q``/``query``, ``action`` and ``query`` URL parameters.
	      2. Renders the current Mermaid code with its relative click links
	         rewritten to absolute BASE_URL links (optionally with ``model=1``).
	      3. Shows a Markdown editor with preview next to a Mermaid editor.
	      4. Shows the image and video galleries and the sidebar file browser.
	      5. Ends with a randomly chosen title line.
	    """
	    st.set_page_config(page_title="Mermaid + Clickable Links with Base URL", layout="wide")

	    # ---------------------------------------------
	    # Query Param Parsing (non-experimental)
	    # ---------------------------------------------
	    # st.query_params yields plain strings, so values must not be indexed
	    # with [0] (that would take the first character).
	    query_params = st.query_params
	    q_or_query = _first_query_value(query_params, 'q') or _first_query_value(query_params, 'query')
	    if q_or_query.strip():
	        # If there's a q= or query= param, do some processing
	        search_payload = PromptPrefix + q_or_query
	        st.markdown(search_payload)
	        process_text(search_payload)

	    # If an 'action' param is present
	    action = _first_query_value(query_params, 'action')
	    if action == 'show_message':
	        st.success("Showing a message because 'action=show_message' was found in the URL.")
	    elif action == 'clear':
	        clear_query_params()

	    # If a 'query' param is present, show content or image
	    query_val = _first_query_value(query_params, 'query')
	    if query_val:
	        display_content_or_image(query_val)

	    # ---------------------------------------------
	    # Let user pick if we want ?model=1
	    # ---------------------------------------------
	    st.sidebar.write("## Diagram Link Settings")
	    model_selected = st.sidebar.checkbox("Append ?model=1 to each link?")

	    # ---------------------------------------------
	    # Rebuild the clickable lines in the Mermaid code
	    # ---------------------------------------------
	    # The editable source keeps its relative links; they are rewritten on
	    # every run, so both the editor's changes and the checkbox take effect.
	    if "current_mermaid" not in st.session_state:
	        st.session_state["current_mermaid"] = DEFAULT_MERMAID.strip()
	    mermaid_code = _rewrite_click_links(st.session_state["current_mermaid"], model_selected)

	    # ---------------------------------------------
	    # Render the top-centered Mermaid diagram
	    # ---------------------------------------------
	    st.sidebar.markdown("Mermaid Diagram with Base URL Injection")
	    if mermaid_code.strip():
	        diagram_html = generate_mermaid_html(mermaid_code)
	        components.html(diagram_html, height=400, scrolling=True)

	    # ---------------------------------------------
	    # Two-column interface: Markdown & Mermaid
	    # ---------------------------------------------
	    left_col, right_col = st.columns(2)

	    # --- Left: Markdown Editor
	    with left_col:
	        st.subheader("Markdown Side 📝")
	        if "markdown_text" not in st.session_state:
	            st.session_state["markdown_text"] = "## Hello!\nType some Markdown here.\n"
	        markdown_text = st.text_area(
	            "Edit Markdown:",
	            value=st.session_state["markdown_text"],
	            height=300
	        )
	        st.session_state["markdown_text"] = markdown_text

	        colA, colB = st.columns(2)
	        with colA:
	            if st.button("🔄 Refresh Markdown"):
	                st.write("Markdown content refreshed! 🍿")
	        with colB:
	            if st.button("❌ Clear Markdown"):
	                st.session_state["markdown_text"] = ""
	                st.rerun()

	        st.markdown("---")
	        st.markdown("Preview:")
	        st.markdown(markdown_text)

	    # --- Right: Mermaid Editor
	    with right_col:
	        st.subheader("Mermaid Side 🧜‍♂️")

	        mermaid_input = st.text_area(
	            "Edit Mermaid Code:",
	            value=st.session_state["current_mermaid"],
	            height=300
	        )

	        colC, colD = st.columns(2)
	        with colC:
	            if st.button("🎨 Refresh Diagram"):
	                st.session_state["current_mermaid"] = mermaid_input
	                st.write("Mermaid diagram refreshed! 🌈")
	                st.rerun()
	        with colD:
	            if st.button("❌ Clear Mermaid"):
	                st.session_state["current_mermaid"] = ""
	                st.rerun()

	        st.markdown("---")
	        st.markdown("Mermaid Source:")
	        st.code(mermaid_input, language="python", line_numbers=True)

	    # ---------------------------------------------
	    # Media Galleries
	    # ---------------------------------------------
	    st.markdown("---")
	    st.header("Media Galleries")

	    num_columns_images = st.slider("Choose Number of Image Columns", 1, 15, 5, key="num_columns_images")
	    display_images_and_wikipedia_summaries(num_columns_images)

	    num_columns_video = st.slider("Choose Number of Video Columns", 1, 15, 5, key="num_columns_video")
	    display_videos_and_links(num_columns_video)

	    # (Optionally) Extended text interface
	    showExtendedTextInterface = False
	    if showExtendedTextInterface:
	        # For example:
	        # display_glossary_grid(roleplaying_glossary)
	        # num_columns_text = st.slider("Choose Number of Text Columns", 1, 15, 4)
	        # display_buttons_with_scores(num_columns_text)
	        pass

	    # ---------------------------------------------
	    # File Sidebar
	    # ---------------------------------------------
	    FileSidebar()

	    # ---------------------------------------------
	    # Random Title at the bottom
	    # ---------------------------------------------
	    titles = [
	        "🧠🎭 Semantic Symphonies & Episodic Encores",
	        "🌌🎼 AI Rhythms of Memory Lane",
	        "🎭🎉 Cognitive Crescendos & Neural Harmonies",
	        "🧠🎺 Mnemonic Melodies & Synaptic Grooves",
	        "🎼🎸 Straight Outta Cognition",
	        "🥁🎻 Jazzy Jambalaya of AI Memories",
	        "🏰 Semantic Soul & Episodic Essence",
	        "🥁🎻 The Music Of AI's Mind"
	    ]
	    st.markdown(f"{random.choice(titles)}")


	# Run the app only when this file is executed as the entry script.
	if __name__ == "__main__":
	    main()