Spaces:

junaid17
/

Cortex-Coder

Sleeping

App Files Files Community

Cortex-Coder / scripts /main.py

junaid17

Upload 7 files

eff58d2 verified 18 days ago

raw

history blame contribute delete

8.89 kB

	from langgraph.checkpoint.memory import MemorySaver
	from langgraph.graph.message import add_messages
	from scripts.load_model import get_model
	from typing import TypedDict, Literal, Optional, Annotated
	from langgraph.graph import StateGraph, END
	from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage
	from scripts.prompts import (
	GENERAL_CHAT_SYSTEM_PROMPT,
	CODE_AGENT_SYSTEM_PROMPT,
	REPAIR_SYSTEM_PROMPT
	)

	# =========================================================
	# LLM
	# =========================================================
	# Module-wide model object obtained from scripts.load_model.get_model().
	# Its `invoke` method is called by the general-chat, code-generation and
	# repair nodes defined in this module.
	llm = get_model()


	# =========================================================
	# STATE
	# =========================================================
	class ChatState(TypedDict):
	# State schema handed to StateGraph; every node in this module receives it
	# and returns a dict holding only the keys it wants to update.
	#
	# user_input: conversation messages, annotated with LangGraph's
	# add_messages reducer (presumably merges new messages into the stored
	# list -- confirm against the LangGraph docs). get_last_user_message reads
	# the final element.
	user_input: Annotated[list[BaseMessage], add_messages]
	# intent: written by classify_intent, read by route_intent.
	intent: Optional[Literal["coding", "general_chat"]]
	# task_type: written by classify_task, read by generate_code and route_output.
	task_type: Optional[Literal["code_generation", "debugging", "explanation"]]
	# language: written by detect_language, read by generate_code and repair_code.
	language: Optional[Literal["python", "javascript", "cpp", "sql", "java", "unknown"]]
	# generated_output: latest model reply, written by handle_general_chat,
	# generate_code and repair_code.
	generated_output: Optional[str]
	# is_code: written by classify_output, read by route_output.
	is_code: Optional[bool]
	# retry_count: starts at 0 in stream_chat_response, is incremented by
	# repair_code, and route_output stops repairing once it reaches 2.
	retry_count: int


	# =========================================================
	# HELPERS
	# =========================================================
	def get_last_user_message(state: ChatState) -> str:
	    """Return the content of the newest message held in the state.

	    Args:
	        state: Graph state; only ``state["user_input"]`` is read.

	    Returns:
	        The ``content`` attribute of the final message, or ``""`` when the
	        message list is empty.
	    """
	    history = state["user_input"]
	    return history[-1].content if history else ""


	# =========================================================
	# INTENT CLASSIFIER
	# =========================================================
	def classify_intent(state: ChatState):
	    """Label the latest user message as a coding request or general chat.

	    The lowercased message is scanned for a fixed list of coding keywords.
	    A keyword only counts when it touches a word boundary on at least one
	    side. Inflections and compounds such as "debugging", "apis", "mysql"
	    or "javascript" therefore still match, while a keyword buried in the
	    middle of an unrelated word ("api" in "capital", "script" in
	    "description") no longer sends a general question down the coding
	    branch.

	    Args:
	        state: Graph state; only the last entry of ``user_input`` is read.

	    Returns:
	        A partial state update: ``{"intent": "coding"}`` or
	        ``{"intent": "general_chat"}``.
	    """
	    import re  # function-scope import keeps this block self-contained

	    query = get_last_user_message(state).lower()

	    coding_keywords = [
	        "code", "python", "javascript", "java", "c++", "sql",
	        "bug", "debug", "fix", "function", "algorithm",
	        "class", "implement", "build", "api", "query",
	        "optimize", "refactor", "script", "program",
	    ]

	    # re.escape is required because "c++" contains regex metacharacters.
	    alternatives = "|".join(re.escape(word) for word in coding_keywords)
	    # Match a keyword that starts a word OR ends a word; mid-word hits are ignored.
	    keyword_pattern = rf"\b(?:{alternatives})|(?:{alternatives})\b"

	    intent = "coding" if re.search(keyword_pattern, query) else "general_chat"

	    return {"intent": intent}


	def route_intent(state: ChatState):
	    """Choose the branch label that follows intent classification.

	    Returns ``"general_chat"`` only when ``state["intent"]`` equals that
	    exact value; any other value (including ``None``) yields ``"coding"``.
	    """
	    return "general_chat" if state["intent"] == "general_chat" else "coding"


	# =========================================================
	# GENERAL CHAT
	# =========================================================
	def handle_general_chat(state: ChatState):
	    """Answer a non-coding message with the general-chat system prompt.

	    Only the latest user message is sent to the model, preceded by
	    ``GENERAL_CHAT_SYSTEM_PROMPT``.

	    Returns:
	        A partial state update whose ``generated_output`` is the content of
	        the model's reply.
	    """
	    user_text = get_last_user_message(state)
	    conversation = [
	        SystemMessage(content=GENERAL_CHAT_SYSTEM_PROMPT),
	        HumanMessage(content=user_text),
	    ]
	    reply = llm.invoke(conversation)
	    return {"generated_output": reply.content}


	# =========================================================
	# TASK CLASSIFIER
	# =========================================================
	def classify_task(state: ChatState):
	    """Bucket the latest user message into a coding task type.

	    Debugging phrases are checked first, then explanation phrases; when
	    neither group appears in the lowercased message the task is treated as
	    code generation.

	    Returns:
	        A partial state update ``{"task_type": ...}`` with one of
	        ``"debugging"``, ``"explanation"`` or ``"code_generation"``.
	    """
	    text = get_last_user_message(state).lower()

	    debug_phrases = (
	        "fix", "debug", "error", "broken",
	        "issue", "not working", "exception", "traceback",
	    )
	    explain_phrases = (
	        "explain", "what is", "how does", "why", "difference between",
	    )

	    def mentions(phrases):
	        # Plain substring containment, same as a chain of `in` checks.
	        return any(phrase in text for phrase in phrases)

	    if mentions(debug_phrases):
	        return {"task_type": "debugging"}
	    if mentions(explain_phrases):
	        return {"task_type": "explanation"}
	    return {"task_type": "code_generation"}


	# =========================================================
	# LANGUAGE DETECTOR
	# =========================================================
	def detect_language(state: ChatState):
	    """Guess which programming language the latest user message is about.

	    Detection runs in two passes over the lowercased message:

	    1. Explicit language names ("python", "javascript"/"js", "c++", "java",
	       "sql"). A name the user wrote wins over any syntax hint, so Java
	       code containing ``import `` is no longer reported as Python when
	       the message says "java". "js" must be a whole word so that "json"
	       does not count as JavaScript.
	    2. Syntax fingerprints, used only when no name was found. Markers that
	       are also everyday English ("function ", "let ", "select ",
	       "update ", "delete ", "insert ", "join ") are matched only in a
	       code-like shape, e.g. ``function name(`` or ``update t set``.

	    Within each pass the languages are tried in the order python,
	    javascript, cpp, java, sql; the first hit wins.

	    Args:
	        state: Graph state; only the last entry of ``user_input`` is read.

	    Returns:
	        A partial state update ``{"language": ...}`` holding one of
	        ``"python"``, ``"javascript"``, ``"cpp"``, ``"java"``, ``"sql"`` or
	        ``"unknown"``.
	    """
	    import re  # function-scope import keeps this block self-contained

	    query = get_last_user_message(state).lower()

	    # Pass 1: names. "javascript" is listed before "java" because the
	    # latter is a prefix of the former.
	    name_patterns = (
	        ("python", (r"python",)),
	        ("javascript", (r"javascript", r"\bjs\b")),
	        ("cpp", (r"c\+\+",)),
	        ("java", (r"java",)),
	        ("sql", (r"sql",)),
	    )

	    # Pass 2: syntax fingerprints.
	    syntax_patterns = (
	        ("python", (r"def ", r"import ", r"print\(")),
	        ("javascript", (
	            r"console\.log",
	            # `function name(` or anonymous `function (`, not "function to ..."
	            r"\bfunction\b\s*[\w$]*\s*\(",
	            # `const x =` / `let {a, b} =`, not "let me know"
	            r"\b(?:const|let)\s+(?:[\w$]+|[\[{][^=\n]*[\]}])\s*=",
	        )),
	        ("cpp", (r"#include", r"std::", r"\bcout\b")),
	        ("java", (r"public class", r"system\.out")),
	        ("sql", (
	            r"\bselect\b.+?\bfrom\b",
	            r"\binsert\s+into\b",
	            r"\bupdate\s+\S+\s+set\b",
	            r"\bdelete\s+from\b",
	            r"\bjoin\b[^;]*?\bon\b[^;]*?=",
	        )),
	    )

	    for lang, patterns in name_patterns + syntax_patterns:
	        # DOTALL lets the SELECT ... FROM pattern span multiple lines.
	        if any(re.search(pattern, query, flags=re.DOTALL) for pattern in patterns):
	            return {"language": lang}

	    return {"language": "unknown"}


	# =========================================================
	# GENERATOR
	# =========================================================
	def generate_code(state: ChatState):
	    """Ask the model to fulfil the coding request.

	    The user message is wrapped together with the previously detected
	    ``task_type`` and ``language`` and sent after
	    ``CODE_AGENT_SYSTEM_PROMPT``.

	    Returns:
	        A partial state update whose ``generated_output`` is the content of
	        the model's reply.
	    """
	    query = get_last_user_message(state)
	    task, language = state["task_type"], state["language"]

	    # The literal below is sent verbatim; its line layout is part of the prompt.
	    user_prompt = f"""
	Task Type: {task}
	Requested Language: {language}

	User Request:
	{query}
	"""

	    conversation = [
	        SystemMessage(content=CODE_AGENT_SYSTEM_PROMPT),
	        HumanMessage(content=user_prompt),
	    ]
	    reply = llm.invoke(conversation)
	    return {"generated_output": reply.content}


	# =========================================================
	# OUTPUT CLASSIFIER
	# =========================================================
	def classify_output(state: ChatState):
	    """Flag whether the generated output looks like source code.

	    The output (treated as ``""`` when missing or empty) is lowercased and
	    searched for a fixed set of code markers; a single hit is enough.

	    Returns:
	        A partial state update ``{"is_code": True}`` or
	        ``{"is_code": False}``.
	    """
	    raw = state["generated_output"]
	    text = raw.lower() if raw else ""

	    markers = (
	        "def ", "class ", "function ", "const ", "let ",
	        "#include", "std::", "public class", "system.out",
	        "select ", "insert ", "update ", "delete ",
	        "console.log", "print(", "fn ",
	    )

	    for marker in markers:
	        if marker in text:
	            return {"is_code": True}
	    return {"is_code": False}


	# =========================================================
	# ROUTER
	# =========================================================
	def route_output(state: ChatState):
	    """Decide whether the generated output is final or needs a repair pass.

	    The output is accepted (``"final"``) when the task is an explanation,
	    when it was flagged as code, or when two repair attempts have already
	    been made; otherwise ``"repair"`` is returned.
	    """
	    # `or` short-circuits, so the keys are read in the same order as a
	    # sequence of early-return checks would read them.
	    accepted = (
	        state["task_type"] == "explanation"
	        or state["is_code"]
	        or state["retry_count"] >= 2
	    )
	    return "final" if accepted else "repair"


	# =========================================================
	# REPAIR
	# =========================================================
	def repair_code(state: ChatState):
	    """Ask the model to turn a non-code reply into executable code.

	    Sends the previous output and the requested language after
	    ``REPAIR_SYSTEM_PROMPT``.

	    Returns:
	        A partial state update with the new ``generated_output`` and
	        ``retry_count`` increased by one.
	    """
	    bad_output = state["generated_output"] or ""
	    language = state["language"]

	    # The literal below is sent verbatim; its line layout is part of the prompt.
	    repair_request = f"""
	The previous response was expected to be executable code but was not.

	Requested language:
	{language}

	Bad output:
	{bad_output}

	Return ONLY executable code.
	No explanation.
	No markdown.
	"""

	    conversation = [
	        SystemMessage(content=REPAIR_SYSTEM_PROMPT),
	        HumanMessage(content=repair_request),
	    ]
	    reply = llm.invoke(conversation)

	    return {
	        "generated_output": reply.content,
	        "retry_count": state["retry_count"] + 1,
	    }


	# =========================================================
	# GRAPH
	# =========================================================
	checkpointer = MemorySaver()
	builder = StateGraph(ChatState)

	# Register each node under the name the edges below refer to.
	for _node_name, _node_handler in (
	    ("classify_intent", classify_intent),
	    ("general_chat", handle_general_chat),
	    ("classify_task", classify_task),
	    ("detect_language", detect_language),
	    ("generate_code", generate_code),
	    ("classify_output", classify_output),
	    ("repair", repair_code),
	):
	    builder.add_node(_node_name, _node_handler)

	builder.set_entry_point("classify_intent")

	# Branch on intent: general chat ends the run, coding enters the pipeline.
	builder.add_conditional_edges(
	    "classify_intent",
	    route_intent,
	    {"general_chat": "general_chat", "coding": "classify_task"},
	)
	builder.add_edge("general_chat", END)

	# Linear part of the coding pipeline.
	for _source, _target in (
	    ("classify_task", "detect_language"),
	    ("detect_language", "generate_code"),
	    ("generate_code", "classify_output"),
	):
	    builder.add_edge(_source, _target)

	# After classification either finish or loop through the repair node.
	builder.add_conditional_edges(
	    "classify_output",
	    route_output,
	    {"final": END, "repair": "repair"},
	)
	builder.add_edge("repair", "classify_output")

	# Compiled with the checkpointer so state can be looked up by thread_id later.
	graph = builder.compile(checkpointer=checkpointer)


	# =========================================================
	# STREAM
	# =========================================================
	def stream_chat_response(user_message: str, thread_id: str):
	    """Run the graph for one user message and yield its streamed chunks.

	    Args:
	        user_message: Text wrapped in a ``HumanMessage`` as the new input.
	        thread_id: Identifier placed under ``configurable.thread_id`` in the
	            run config.

	    Yields:
	        Each item produced by ``graph.stream`` with ``stream_mode="messages"``,
	        passed through unchanged.
	    """
	    run_config = {"configurable": {"thread_id": thread_id}}

	    # Every per-turn field starts blank; retry_count starts at 0.
	    fresh_state = dict(
	        user_input=[HumanMessage(content=user_message)],
	        intent=None,
	        task_type=None,
	        language=None,
	        generated_output=None,
	        is_code=None,
	        retry_count=0,
	    )

	    yield from graph.stream(fresh_state, config=run_config, stream_mode="messages")


	def get_chat_metadata(thread_id: str):
	    """Return the classification fields stored for a conversation thread.

	    Args:
	        thread_id: Identifier placed under ``configurable.thread_id`` when
	            asking the graph for its state.

	    Returns:
	        A dict with the keys ``intent``, ``task_type``, ``language``,
	        ``is_code`` and ``retry_count``; a key absent from the stored values
	        maps to ``None``.
	    """
	    snapshot = graph.get_state({"configurable": {"thread_id": thread_id}})
	    stored = snapshot.values

	    reported_keys = ("intent", "task_type", "language", "is_code", "retry_count")
	    return {key: stored.get(key) for key in reported_keys}