Spaces:

build-small-hackathon
/

CodeFlow

Running

Updated README, added tracing capabilities, changed size of flowchart, vendored the animation assets so this meets off the grid.

1433b16 about 9 hours ago

raw

history blame contribute delete

10.8 kB


	from huggingface_hub import hf_hub_download
	from llama_cpp import Llama
	import gradio as gr
	from gradio import Server
	from fastapi.responses import HTMLResponse, PlainTextResponse, FileResponse # frontend + traces + vendored static assets
	import mimetypes
	from typing import Any, cast # to resolve PyLance freaking out over llama-cpp-python in the generate_flowchart function
	from textwrap import dedent
	from pathlib import Path # load the custom frontend from disk
	import re # remove thinking tag from response
	import json, time, uuid # agent-trace logging
	from datetime import datetime, timezone

	# ----- Get Model ----- #
	# Download the UD-Q3_K_XL GGUF quantization from the repo (the filename below is
	# the source of truth for which quantization is used). The returned value is
	# passed straight to llama.cpp as the model path.
	model_path = hf_hub_download(
	repo_id="unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
	filename="Qwen3-Coder-30B-A3B-Instruct-UD-Q3_K_XL.gguf" # fallback: Q2_K_XL
	)

	# Initialize llama.cpp with the local cached path.
	# n_ctx=4096 is the context size requested for the model; the system prompt, the
	# numbered user code and the completion presumably all have to fit in it.
	# NOTE(review): this module-level `llm` is shared by every request — confirm the
	# server does not run generations concurrently.
	llm = Llama(
	model_path=model_path,
	n_ctx=4096,
	n_threads=2
	)

	# ----- Init App ----- #
	# `app` is the object the @app.api / @app.get decorators below register on.
	app = gr.Server(title="Code-to-Flowchart Generator")

	# ----- Agent traces ----- #
	# Each generation appends one JSON line capturing the full LLM call (input code,
	# the model's reasoning, output Mermaid + linemap, token usage, latency).
	# Download the whole log from the running app at /traces .
	MODEL_NAME = "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF:UD-Q3_K_XL"
	TRACE_PATH = Path(__file__).parent / "agent_traces.jsonl"

	def write_trace(record: dict) -> None:
	    """Append *record* to the trace log as one JSON line (best effort).

	    Args:
	        record: JSON-serializable mapping describing one generation.

	    Returns:
	        None. Never raises: tracing must not break generation, so any failure
	        (unserializable value, unwritable file, ...) is logged as a warning
	        and otherwise ignored.
	    """
	    import logging  # function-scope import: keeps the file's import block untouched

	    try:
	        # Serialize first so a bad record cannot leave a half-written line behind.
	        line = json.dumps(record, ensure_ascii=False)
	        with open(TRACE_PATH, "a", encoding="utf-8") as f:
	            f.write(line + "\n")
	    except Exception:
	        # Deliberately broad: this is the boundary that protects generation.
	        # Report the failure instead of hiding it so a dead trace log is noticed.
	        logging.getLogger(__name__).warning(
	            "agent trace not written to %s", TRACE_PATH, exc_info=True
	        )

	# ----- Functions ----- #

	# Cleaning pass that repairs the most common Mermaid label syntax errors.
	def quote_labels(text: str) -> str:
	    """Quote-wrap every ``[...]`` and ``{...}`` node label in Mermaid source.

	    Mermaid node labels can't hold raw code characters, so each label body is
	    wrapped in double quotes. Inside the body, double quotes become single
	    quotes and brackets/braces become Mermaid entity codes (``#91;`` etc.) so
	    they can no longer be read as label delimiters.

	    Args:
	        text: Mermaid diagram source; processed one line at a time.

	    Returns:
	        The source with the label bodies quoted and escaped. Lines without a
	        recognisable label are returned unchanged.
	    """
	    # A label's real closing bracket is followed by a Mermaid connector
	    # (--, -->, -.->, <--), a thick edge (==>), an edge-label pipe, a statement
	    # end (;) or end of line. Operators written after a subscript in their usual
	    # spaced form (== < <= > >= != %) do not satisfy this lookahead, so the `]`
	    # of `nums[i] % 2` is not taken for the end of a label.
	    end = r'(?=\s*(?:[-<][-.>xo]|==[>=xo]|\||;|$))'
	    # The label must directly follow a node id character (lookbehind on \w).
	    square = re.compile(r'(?<=\w)\[(.*?)\]' + end)
	    curly = re.compile(r'(?<=\w)\{(.*?)\}' + end)

	    # One-pass escape table for characters that would break a quoted label.
	    escapes = str.maketrans({
	        '"': "'",
	        '[': '#91;',
	        ']': '#93;',
	        '{': '#123;',
	        '}': '#125;',
	    })

	    out = []
	    for line in text.split('\n'):
	        # Square labels first; their escaped bodies contain no braces, so the
	        # curly pass cannot re-match inside an already quoted label.
	        line = square.sub(lambda m: '["' + m.group(1).translate(escapes) + '"]', line)
	        line = curly.sub(lambda m: '{"' + m.group(1).translate(escapes) + '"}', line)
	        out.append(line)
	    return '\n'.join(out)

	# Parse the model's <linemap> block into {nodeId: [startLine, endLine]}.
	# Tolerant of junk lines; drops any entry whose line(s) fall outside the source.
	def parse_linemap(block: str, num_lines: int) -> dict:
	    """Parse ``NodeId: N`` / ``NodeId: start-end`` lines into a line map.

	    Args:
	        block: Text found between the <linemap> tags.
	        num_lines: Number of lines in the user's source; entries must lie in
	            ``1..num_lines``.

	    Returns:
	        ``{node_id: [start, end]}`` with 1-based inclusive line numbers. A
	        single-line entry yields ``[n, n]``; a reversed range is swapped.
	        Lines that do not match the format, and entries outside the source,
	        are skipped. A later entry for the same node id overwrites an earlier one.
	    """
	    # Optional whitespace is allowed around the id, the colon and the dash.
	    entry = re.compile(r'\s*([A-Za-z]\w*)\s*:\s*(\d+)(?:\s*-\s*(\d+))?\s*$')

	    out: dict = {}
	    for raw in block.strip().splitlines():
	        m = entry.match(raw)
	        if not m:
	            continue  # junk / prose line
	        first = int(m.group(2))
	        last = int(m.group(3)) if m.group(3) else first
	        if first > last:
	            first, last = last, first
	        # first <= last here, so checking the two outer bounds is enough
	        # (this also rejects everything when num_lines is 0).
	        if 1 <= first and last <= num_lines:
	            out[m.group(1)] = [first, last]
	    return out

	@app.api(name="generate_flowchart")
	def generate_flowchart(src_code: str) -> dict:
	    """Turn source code into a Mermaid flowchart plus a node-to-line map.

	    The source is sent to the model with `N| ` line-number prefixes. The reply
	    is expected to hold an optional <thinking> block, the Mermaid graph and a
	    <linemap> block; the thinking and linemap blocks are removed from the
	    diagram text, the linemap is validated against the source length, and the
	    node labels are quote-wrapped. One trace record is appended per call.

	    Args:
	        src_code: The user's source code.

	    Returns:
	        ``{"mermaid": str, "linemap": {node_id: [start_line, end_line]}}``.
	        Both are empty when *src_code* is empty or whitespace-only.
	    """
	    # Nothing to diagram for empty / whitespace-only input.
	    if not src_code.strip():
	        return {"mermaid": "", "linemap": {}}

	    # Generation settings, named once so the call and the trace cannot drift apart.
	    temperature = 0.1  # keep it quite deterministic for now
	    max_tokens = 1024

	    # Number the source lines so the model can cite them in the <linemap> block.
	    src_lines = src_code.splitlines()
	    num_lines = len(src_lines)
	    numbered = "\n".join(f"{i}| {ln}" for i, ln in enumerate(src_lines, 1))

	    # Set system prompt.
	    # NOTE(review): the few-shot labels below (`val > 10`, `Return 'Active'`)
	    # contain the raw operators/quotes that constraint 4 forbids — consider
	    # paraphrasing them so the example agrees with the rules.
	    system_prompt = dedent("""
	        ## Role/Persona
	        You are a senior staff software architect and compiler engineer specializing in visual control-flow mapping. Your philosophy is pure utility: you translate raw execution logic into highly accurate, scannable, structural diagrams without any conversational filler, meta-commentary, or stylistic fluff.

	        ## Context/Objective
	        The user will provide source code files or logic snippets. Your sole objective is to parse the syntax and output a corresponding, valid Mermaid.js flowchart graph. This graph will be rendered natively in a production UI to help developers audit execution paths at a glance.

	        ## Strict Constraints
	        <constraints>
	        1. OUTPUT FORMAT: Output valid, raw Mermaid.js syntax, immediately followed by the required <linemap> block (constraint 5). Nothing else.
	        2. NO MARKDOWN FENCING: Do not wrap the output in ```mermaid or ``` blocks. Start directly with the Mermaid graph definition, for example: graph TD.
	        3. NO PROSE: Do not include introductory text, explanations, or concluding remarks. If the code cannot be parsed, output an isolated error node.
	        4. NODE NAMING: Paraphrase conditions into plain words — never put raw code, operators, quotes, parentheses, or square brackets/subscripts inside labels (write Index in bounds?, not i < len(nums); write Element is even?, not nums[i] % 2 == 0)
	        5. SOURCE MAP: The user's code is prefixed with `N| ` line numbers (these are references, never copy the `N| ` prefix into a label). After the diagram, output a <linemap> block: one `NodeId: N` per node, where N is the 1-based source line that node represents (use `NodeId: start-end` for a multi-line construct). Omit purely structural Start/End nodes that correspond to no source line.
	        </constraints>

	        <banned_vocabulary>
	        - Here is the flowchart
	        - ```mermaid
	        - ```
	        - Note:
	        - Explanation:
	        - In this diagram
	        - As requested
	        </banned_vocabulary>

	        ## Response Workflow
	        Before outputting the final diagram syntax, perform structural parsing inside a hidden <thinking> tag according to these steps:
	        1. Identify all conditional branches, including if/else, loops, including for/while, and termination points, including return/throw.
	        2. Map out the execution flow nodes chronologically.
	        3. Verify that every opening bracket and node label matching syntax, including [ ], ( ), and { }, is perfectly balanced and closed according to Mermaid specifications.
	        4. Ensure no markdown formatting tags leak past the closing </thinking> tag.

	        ## Few-Shot Examples

	        Input:
	        1| def check_status(val):
	        2|     if val > 10:
	        3|         return "Active"
	        4|     else:
	        5|         return "Inactive"

	        Output:
	        <thinking>
	        1. Control structures: One conditional check, two return branches.
	        2. Nodes: A Start, B Conditional, C Active return, D Inactive return.
	        3. Source lines: def is line 1, the if is line 2, Active return is line 3, Inactive return is line 5.
	        </thinking>
	        graph TD
	        A[Start: check_status] --> B{val > 10}
	        B -- True --> C[Return 'Active']
	        B -- False --> D[Return 'Inactive']
	        <linemap>
	        A: 1
	        B: 2
	        C: 3
	        D: 5
	        </linemap>
	    """).strip()

	    # Reset the cache per request so no cross-request bleeding
	    llm.reset()

	    # Casting else PyLance gets mad
	    t0 = time.perf_counter()
	    response = cast(Any, llm.create_chat_completion(
	        messages=[
	            {"role": "system", "content": system_prompt},
	            {"role": "user", "content": numbered},
	        ],
	        temperature=temperature,
	        max_tokens=max_tokens,
	        stream=False,
	    ))
	    latency_ms = round((time.perf_counter() - t0) * 1000)

	    # Guard against a missing/None content field so the regex passes below
	    # always receive a string.
	    raw = response["choices"][0]["message"]["content"] or ""
	    usage = response.get("usage", {}) or {}

	    # Capture the model's hidden reasoning for the trace, then strip the tags
	    think = re.search(r'<thinking>(.*?)</thinking>', raw, flags=re.DOTALL)
	    reasoning = think.group(1).strip() if think else ""
	    content = re.sub(r'<thinking>.*?</thinking>', '', raw, flags=re.DOTALL)

	    # Extract + strip the node→line map, then validate it against the source length
	    linemap: dict = {}
	    lm = re.search(r'<linemap>(.*?)</linemap>', content, flags=re.DOTALL)
	    if lm:
	        linemap = parse_linemap(lm.group(1), num_lines)
	        content = content[:lm.start()] + content[lm.end():]

	    # Quote-wrap each node label and escape any leaked code characters
	    mermaid = quote_labels(content).strip()  # and remove excess whitespace

	    # ----- Agent trace (append-only JSONL; downloadable at /traces) -----
	    write_trace({
	        "id": uuid.uuid4().hex,
	        "ts": datetime.now(timezone.utc).isoformat(),
	        "event": "generate_flowchart",
	        "model": MODEL_NAME,
	        # n_ctx mirrors the value the module-level Llama instance is created with
	        "params": {"temperature": temperature, "max_tokens": max_tokens, "n_ctx": 4096},
	        "input": {"src_code": src_code, "num_lines": num_lines},
	        "reasoning": reasoning,
	        "output": {"raw": raw, "mermaid": mermaid, "linemap": linemap},
	        "usage": {
	            "prompt_tokens": usage.get("prompt_tokens"),
	            "completion_tokens": usage.get("completion_tokens"),
	            "total_tokens": usage.get("total_tokens"),
	        },
	        "latency_ms": latency_ms,
	        "status": "ok",
	    })

	    return {"mermaid": mermaid, "linemap": linemap}

	# ----- Custom Frontend ----- #
	# Served from frontend.html so the same file can be opened directly in a
	# browser (file://) to preview the UI without loading the model.
	# The file is read once, when this module is executed, from the directory that
	# contains this script; the resulting string is what the "/" route returns.
	index_html = (Path(__file__).parent / "frontend.html").read_text(encoding="utf-8")

	# Serve the custom HTML page.
	# "/" takes precedence over the default Blocks UI.
	@app.get("/")
	def index():
	    """Return the frontend page that was loaded into ``index_html``."""
	    page = HTMLResponse(index_html)
	    return page

	# Serve the vendored frontend assets (Mermaid, CodeMirror bundle, Gradio client,
	# fonts) locally so the app needs NO external CDN/API at runtime.
	# STATIC_DIR is resolved to an absolute path once, so request paths can be
	# compared against it for containment.
	STATIC_DIR = (Path(__file__).parent / "static").resolve()
	# Register the content types to report for .js and .woff2 files explicitly
	# instead of relying on whatever the host's MIME table contains.
	mimetypes.add_type("text/javascript", ".js")
	mimetypes.add_type("font/woff2", ".woff2")

	@app.get("/static/{fname:path}")
	def static_files(fname: str):
	    """Serve one vendored asset from STATIC_DIR.

	    Args:
	        fname: Path below /static/ taken from the request URL (untrusted).

	    Returns:
	        A FileResponse for an existing regular file inside STATIC_DIR, with a
	        content type guessed from the file name (falling back to
	        application/octet-stream); otherwise a plain-text 404.
	    """
	    try:
	        fp = (STATIC_DIR / fname).resolve()
	    except (OSError, ValueError):
	        # e.g. an embedded NUL byte in the requested path
	        return PlainTextResponse("not found", status_code=404)
	    # Contain to STATIC_DIR (no path traversal) and require a real file.
	    # is_relative_to compares path components, so it does not depend on the
	    # platform's separator the way a "/"-based string prefix test does.
	    if not fp.is_relative_to(STATIC_DIR) or not fp.is_file():
	        return PlainTextResponse("not found", status_code=404)
	    mt, _ = mimetypes.guess_type(str(fp))
	    return FileResponse(fp, media_type=mt or "application/octet-stream")

	# Download the agent traces appended to the trace file (one JSON object per line).
	# curl https://<your-space>/traces > agent_traces.jsonl
	# NOTE(review): each trace record includes the submitted source code, and this
	# route has no access check in this file — confirm that exposure is intended.
	@app.get("/traces")
	def traces():
	    """Return the whole trace log as a downloadable NDJSON attachment.

	    The body is empty when the trace file does not exist yet.
	    """
	    if TRACE_PATH.exists():
	        body = TRACE_PATH.read_text(encoding="utf-8")
	    else:
	        body = ""
	    download_headers = {"Content-Disposition": 'attachment; filename="agent_traces.jsonl"'}
	    return PlainTextResponse(
	        body,
	        media_type="application/x-ndjson",
	        headers=download_headers,
	    )

	# Start serving. This runs at import time, after every route above is registered.
	app.launch(share=False) # no external gradio.live tunnel — fully self-hosted