Spaces:
Building
Building
from http.server import HTTPServer, SimpleHTTPRequestHandler | |
# from pyngrok import ngrok | |
import os | |
from mistralai.client import MistralClient | |
from mistralai.models.chat_completion import ChatMessage | |
import json | |
# Mistral AI setup | |
api_key = os.getenv("MISTRAL_API_KEY") | |
if not api_key: | |
raise ValueError("MISTRAL_API_KEY environment variable not set") | |
model = "mistral-tiny" | |
client = MistralClient(api_key=api_key) | |
def generate_goals(input_var): | |
messages = [ | |
ChatMessage(role="user", content=f"Generate 5 specific, industry relevant goals for {input_var} using Python and Pandas in exam data analysis. Each goal should include a brief name and a one-sentence description of the task or skill.") | |
] | |
try: | |
response = client.chat(model=model, messages=messages) | |
return response.choices[0].message.content | |
except Exception as e: | |
return f"An error occurred: {str(e)}" | |
html_content = """ | |
<!DOCTYPE html> | |
<html lang="en"> | |
<head> | |
<meta charset="UTF-8"> | |
<meta name="viewport" content="width=device-width, initial-scale=1.0"> | |
<title>Exam Data Analysis Goals Generator</title> | |
<script src="https://d3js.org/d3.v7.min.js"></script> | |
<style> | |
#visualization { width: 100%; height: 600px; border: 1px solid #ccc; } | |
#generatedGoals { margin-top: 20px; padding: 10px; border: 1px solid #ccc; } | |
</style> | |
</head> | |
<body> | |
<h1>Exam Data Analysis Goals Generator</h1> | |
<div id="visualization"></div> | |
<div id="generatedGoals"></div> | |
<script> | |
const width = 1200; | |
const height = 800; | |
const goals = [ | |
{ id: 1, x: 100, y: 400, name: "Automate Data Import", description: "Develop scripts to automate exam data extraction from various sources (CSV, Excel, databases) using Pandas read_* functions." }, | |
{ id: 2, x: 200, y: 300, name: "Data Cleaning", description: "Implement robust data cleaning processes to handle missing values, outliers, and inconsistencies in exam data using Pandas methods like dropna(), fillna(), and apply()." }, | |
{ id: 3, x: 300, y: 200, name: "Data Transformation", description: "Utilize Pandas for complex data transformations such as pivoting exam results, melting question-wise scores, and creating derived features for analysis." }, | |
{ id: 4, x: 400, y: 300, name: "Statistical Analysis", description: "Develop functions to automate statistical analysis of exam results, including descriptive statistics, hypothesis testing, and correlation analysis using Pandas and SciPy." }, | |
{ id: 5, x: 500, y: 400, name: "Performance Metrics", description: "Create custom functions to calculate industry-standard exam performance metrics like item difficulty, discrimination index, and reliability coefficients using Pandas operations." }, | |
{ id: 6, x: 200, y: 500, name: "Data Filtering", description: "Implement advanced filtering techniques to segment exam data based on various criteria (e.g., demographic info, score ranges) using boolean indexing and query() method in Pandas." }, | |
{ id: 7, x: 300, y: 600, name: "Reporting Automation", description: "Develop automated reporting systems that use Pandas groupby() and agg() functions to generate summary statistics and performance reports for different exam cohorts." }, | |
{ id: 8, x: 400, y: 500, name: "Data Visualization", description: "Create interactive dashboards for exam data visualization using Pandas with Plotly or Bokeh, allowing stakeholders to explore results dynamically." }, | |
{ id: 9, x: 500, y: 600, name: "Time Series Analysis", description: "Implement time series analysis techniques using Pandas datetime functionality to track and forecast exam performance trends over multiple test administrations." }, | |
{ id: 10, x: 300, y: 400, name: "Data Integration", description: "Develop processes to merge exam data with other relevant datasets (e.g., student information systems, learning management systems) using Pandas merge() and join() operations." }, | |
{ id: 11, x: 600, y: 300, name: "Performance Optimization", description: "Improve the efficiency of Pandas operations on large exam datasets by utilizing techniques like chunking, multiprocessing, and query optimization." }, | |
{ id: 12, x: 700, y: 400, name: "Machine Learning Integration", description: "Integrate machine learning models with Pandas for predictive analytics, such as predicting exam success or identifying at-risk students based on historical data." }, | |
{ id: 13, x: 800, y: 500, name: "Custom Indexing", description: "Implement custom indexing strategies in Pandas to efficiently handle hierarchical exam data structures and improve data access patterns." }, | |
{ id: 14, x: 900, y: 400, name: "Data Anonymization", description: "Develop Pandas-based workflows to anonymize sensitive exam data, ensuring compliance with privacy regulations while maintaining data utility for analysis." }, | |
{ id: 15, x: 1000, y: 300, name: "Exam Item Analysis", description: "Create specialized functions using Pandas to perform detailed item analysis, including distractor analysis and reliability calculations for individual exam questions." }, | |
{ id: 16, x: 600, y: 500, name: "Longitudinal Analysis", description: "Implement Pandas-based methods for tracking student performance across multiple exams over time, identifying learning trends and progress patterns." }, | |
{ id: 17, x: 700, y: 600, name: "Adaptive Testing Analysis", description: "Develop analysis pipelines using Pandas to evaluate and optimize adaptive testing algorithms, including item selection strategies and scoring methods." }, | |
{ id: 18, x: 800, y: 700, name: "Exam Equating", description: "Create Pandas workflows to perform exam equating, ensuring comparability of scores across different versions or administrations of an exam." }, | |
{ id: 19, x: 900, y: 600, name: "Response Time Analysis", description: "Utilize Pandas to analyze exam response times, identifying patterns that may indicate guessing, test-taking strategies, or item difficulty." }, | |
{ id: 20, x: 1000, y: 500, name: "Collaborative Filtering", description: "Implement collaborative filtering techniques using Pandas to recommend study materials or practice questions based on exam performance patterns." }, | |
{ id: 21, x: 400, y: 700, name: "Exam Fraud Detection", description: "Develop anomaly detection algorithms using Pandas to identify potential exam fraud or unusual response patterns in large-scale testing programs." }, | |
{ id: 22, x: 500, y: 800, name: "Standard Setting", description: "Create Pandas-based tools to assist in standard setting processes, analyzing expert judgments and examinee data to establish performance standards." }, | |
{ id: 23, x: 600, y: 700, name: "Automated Reporting", description: "Implement automated report generation using Pandas and libraries like Jinja2 to create customized, data-driven exam reports for various stakeholders." }, | |
{ id: 24, x: 700, y: 800, name: "Cross-validation", description: "Develop cross-validation frameworks using Pandas to assess the reliability and generalizability of predictive models in educational assessment contexts." }, | |
{ id: 25, x: 800, y: 300, name: "API Integration", description: "Create Pandas-based interfaces to integrate exam data analysis workflows with external APIs, facilitating real-time data exchange and reporting." }, | |
{ id: 26, x: 900, y: 200, name: "Natural Language Processing", description: "Implement NLP techniques using Pandas and libraries like NLTK to analyze free-text responses in exams, enabling automated scoring and content analysis." }, | |
{ id: 27, x: 1000, y: 100, name: "Exam Blueprint Analysis", description: "Develop Pandas workflows to analyze exam blueprints, ensuring content coverage and alignment with learning objectives across multiple test forms." }, | |
{ id: 28, x: 100, y: 600, name: "Differential Item Functioning", description: "Implement statistical methods using Pandas to detect and analyze differential item functioning (DIF) in exams, ensuring fairness across different demographic groups." }, | |
{ id: 29, x: 200, y: 700, name: "Automated Feedback Generation", description: "Create Pandas-based systems to generate personalized feedback for test-takers based on their exam performance and identified areas for improvement." }, | |
{ id: 30, x: 300, y: 800, name: "Exam Security Analysis", description: "Develop analytical tools using Pandas to assess and enhance exam security, including analysis of item exposure rates and detection of potential security breaches." } | |
]; | |
const connections = [ | |
{ source: 1, target: 2 }, | |
{ source: 2, target: 3 }, | |
{ source: 3, target: 4 }, | |
{ source: 4, target: 5 }, | |
{ source: 5, target: 7 }, | |
{ source: 6, target: 7 }, | |
{ source: 7, target: 8 }, | |
{ source: 8, target: 9 }, | |
{ source: 9, target: 16 }, | |
{ source: 10, target: 13 }, | |
{ source: 11, target: 12 }, | |
{ source: 12, target: 20 }, | |
{ source: 13, target: 16 }, | |
{ source: 14, target: 21 }, | |
{ source: 15, target: 17 }, | |
{ source: 16, target: 18 }, | |
{ source: 17, target: 19 }, | |
{ source: 18, target: 22 }, | |
{ source: 19, target: 21 }, | |
{ source: 20, target: 29 }, | |
{ source: 21, target: 30 }, | |
{ source: 22, target: 23 }, | |
{ source: 23, target: 25 }, | |
{ source: 24, target: 12 }, | |
{ source: 25, target: 23 }, | |
{ source: 26, target: 15 }, | |
{ source: 27, target: 15 }, | |
{ source: 28, target: 22 }, | |
{ source: 29, target: 23 }, | |
{ source: 30, target: 21 }, | |
// Additional connections for more interconnectivity | |
{ source: 1, target: 10 }, | |
{ source: 2, target: 6 }, | |
{ source: 3, target: 13 }, | |
{ source: 4, target: 15 }, | |
{ source: 5, target: 28 }, | |
{ source: 8, target: 23 }, | |
{ source: 11, target: 25 }, | |
{ source: 14, target: 30 }, | |
{ source: 24, target: 17 }, | |
{ source: 26, target: 29 } | |
]; | |
const svg = d3.select("#visualization") | |
.append("svg") | |
.attr("width", width) | |
.attr("height", height); | |
const simulation = d3.forceSimulation(goals) | |
.force("link", d3.forceLink(connections).id(d => d.id)) | |
.force("charge", d3.forceManyBody().strength(-400)) | |
.force("center", d3.forceCenter(width / 2, height / 2)); | |
const link = svg.append("g") | |
.selectAll("line") | |
.data(connections) | |
.enter().append("line") | |
.attr("stroke", "#999") | |
.attr("stroke-opacity", 0.6); | |
const node = svg.append("g") | |
.selectAll("circle") | |
.data(goals) | |
.enter().append("circle") | |
.attr("r", 10) | |
.attr("fill", d => d.color || "#69b3a2") | |
.call(d3.drag() | |
.on("start", dragstarted) | |
.on("drag", dragged) | |
.on("end", dragended)); | |
const text = svg.append("g") | |
.selectAll("text") | |
.data(goals) | |
.enter().append("text") | |
.text(d => d.name) | |
.attr("font-size", "12px") | |
.attr("dx", 12) | |
.attr("dy", 4); | |
node.on("click", async function(event, d) { | |
const response = await fetch('/generate_goals', { | |
method: 'POST', | |
headers: { 'Content-Type': 'application/json' }, | |
body: JSON.stringify({ input_var: d.name }) | |
}); | |
const data = await response.json(); | |
document.getElementById("generatedGoals").innerHTML = `<h2>Generated Goals for ${d.name}</h2><pre>${data.goals}</pre>`; | |
}); | |
simulation.on("tick", () => { | |
link | |
.attr("x1", d => d.source.x) | |
.attr("y1", d => d.source.y) | |
.attr("x2", d => d.target.x) | |
.attr("y2", d => d.target.y); | |
node | |
.attr("cx", d => d.x) | |
.attr("cy", d => d.y); | |
text | |
.attr("x", d => d.x) | |
.attr("y", d => d.y); | |
}); | |
function dragstarted(event) { | |
if (!event.active) simulation.alphaTarget(0.3).restart(); | |
event.subject.fx = event.subject.x; | |
event.subject.fy = event.subject.y; | |
} | |
function dragged(event) { | |
event.subject.fx = event.x; | |
event.subject.fy = event.y; | |
} | |
function dragended(event) { | |
if (!event.active) simulation.alphaTarget(0); | |
event.subject.fx = null; | |
event.subject.fy = null; | |
} | |
</script> | |
</body> | |
</html> | |
""" | |
class MyHandler(SimpleHTTPRequestHandler): | |
def do_GET(self): | |
self.send_response(200) | |
self.send_header('Content-type', 'text/html') | |
self.end_headers() | |
self.wfile.write(html_content.encode()) | |
def do_POST(self): | |
if self.path == '/generate_goals': | |
content_length = int(self.headers['Content-Length']) | |
post_data = self.rfile.read(content_length) | |
data = json.loads(post_data.decode('utf-8')) | |
input_var = data['input_var'] | |
goals = generate_goals(input_var) | |
self.send_response(200) | |
self.send_header('Content-type', 'application/json') | |
self.end_headers() | |
self.wfile.write(json.dumps({'goals': goals}).encode()) | |
else: | |
self.send_error(404) | |
if __name__ == '__main__': | |
port = 7860 | |
server = HTTPServer(('', port), MyHandler) | |
# public_url = ngrok.connect(port).public_url | |
# print(f" * ngrok tunnel \"{public_url}\" -> \"http://127.0.0.1:{port}\"") | |
server.serve_forever() |