MMLU-by-task-Leaderboard / save_for_regression.py
Corey Morris
script to save dataframe to a file only if there are no uncommitted files
7a88af3
raw
history blame
1.49 kB
# when run
# checks if there is uncommitted code
# if there is uncommitted code, ti retuns an error
# if there is no uncommitted code, it saves the dataframe as a parquet file with the commit hash in the name
import pytest
import pandas as pd
from result_data_processor import ResultDataProcessor
import os
import subprocess
def has_uncommitted_changes(repo_path):
try:
# Change to the repository directory
original_path = os.getcwd()
os.chdir(repo_path)
# Run the git status command
result = subprocess.run(['git', 'status', '--porcelain'], stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
# Check the result
if result.returncode != 0:
print(f"Error checking git status: {result.stderr}")
return False
# If the output is empty, there are no uncommitted changes
return bool(result.stdout.strip())
finally:
# Change back to the original directory
os.chdir(original_path)
if __name__ == '__main__':
if has_uncommitted_changes('.'):
print("There are uncommitted changes")
else:
print("There are no uncommitted changes")
df_current = ResultDataProcessor().data
last_commit = os.popen('git rev-parse HEAD').read().strip()
print(last_commit)
# save the current output to a file
df_current.to_parquet(f'output_{last_commit}.parquet', index=True)
print("Saved output to file")