Spaces:

CoreyMorris
/

MMLU-by-task-Leaderboard

Runtime error

MMLU-by-task-Leaderboard / test_details_data_processing.py

Corey Morris

WIP. Updated download file. Can now download all files. Need to integrate that code to loop through all files to download or combine files first into a single dataframe and then save that

0a77c60 over 1 year ago

raw

history blame

3.49 kB

	import unittest
	from details_data_processor import DetailsDataProcessor
	import pandas as pd
	import requests
	import os

	class TestDetailsDataProcessor(unittest.TestCase):

	def setUp(self):
	self.processor = DetailsDataProcessor()

	# check that the result is a pandas dataframe
	def test_process_data(self):
	pass
	# data = self.processor.data
	# self.assertIsInstance(data, pd.DataFrame)

	def test_download_file(self):
	DetailsDataProcessor.download_file('https://www.google.com', 'test_file_please_remove')
	self.assertTrue(os.path.exists('test.html'))
	os.remove('test.html')

	# queries_harness is in the url
	def test_download_file_queries(self):
	file_path_with_error = 'results/shaohang/Sparse0.5_OPT-1.3/results_2023-07-19T19:10:31.005235.json'
	url = self.processor.build_url(file_path_with_error)
	DetailsDataProcessor.download_file(url, 'test_file_please_remove')

	# details harness is in the url
	def test_download_file_details(self):
	file_path = 'results/v2ray/LLaMA-2-Wizard-70B-QLoRA/results_2023-08-18T07:09:43.451689.json'
	url = self.processor.build_url(file_path)
	DetailsDataProcessor.download_file(url, 'test_file_please_remove')


	def test_build_url(self):
	test_cases = [
	('results/64bits/LexPodLM-13B/results_2023-07-25T13:41:51.227672.json',
	'https://huggingface.co/datasets/open-llm-leaderboard/details/resolve/main/64bits/LexPodLM-13B/details_harness%7ChendrycksTest-moral_scenarios%7C5_2023-07-25T13%3A41%3A51.227672.json'),
	('results/AlpinDale/pygmalion-instruct/results_2023-08-17T11:20:15.687659.json',
	'https://huggingface.co/datasets/open-llm-leaderboard/details/resolve/main/AlpinDale/pygmalion-instruct/details_harness%7ChendrycksTest-moral_scenarios%7C5_2023-08-17T11%3A20%3A15.687659.json')
	]

	for file_path, expected in test_cases:
	assert self.processor.build_url(file_path) == expected, f"Test failed for file_path: {file_path}"

	def test_pipeline(self):
	df = self.processor.pipeline()
	print(100 * "****")
	print(df)
	self.assertIsInstance(df, pd.DataFrame)

	def test_find_files(self):
	directory = 'results'
	pattern = 'results*.json'
	files = self.processor._find_files(directory, pattern)
	# breakpoint()
	# print(files)
	self.assertIsInstance(files, list)

	def test_build_url_harness_types(self):
	test_cases = [
	('results/shaohang/Sparse0.5_OPT-1.3/results_2023-07-19T19:10:31.005235.json', 'details',
	'https://huggingface.co/datasets/open-llm-leaderboard/details/resolve/main/shaohang/Sparse0.5_OPT-1.3/details_harness%7ChendrycksTest-moral_scenarios%7C5_2023-07-19T19%3A10%3A31.005235.json'),
	('results/shaohang/Sparse0.5_OPT-1.3/results_2023-07-19T19:10:31.005235.json', 'queries',
	'https://huggingface.co/datasets/open-llm-leaderboard/details/resolve/main/shaohang/Sparse0.5_OPT-1.3/queries_harness%7ChendrycksTest-moral_scenarios%7C5_2023-07-19T19%3A10%3A31.005235.json')
	]

	for file_path, harness_type, expected in test_cases:
	self.assertEqual(self.processor.build_url(file_path, harness_type), expected,
	f"Test failed for file_path: {file_path}, harness_type: {harness_type}")



	if __name__ == '__main__':
	unittest.main()