Skip to content

Commit 5f12b44

Browse files
authored
feat: Dynamically find and use sample submission file in eval tests (microsoft#542)
1 parent f22bc2d commit 5f12b44

File tree

1 file changed

+21
-6
lines changed

1 file changed

+21
-6
lines changed

rdagent/components/coder/data_science/workflow/eval_tests/submission_check.txt

Lines changed: 21 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,16 +1,31 @@
11
from pathlib import Path
22
import pandas as pd
33

4+
# Find sample submission file dynamically
5+
input_dir = Path("/kaggle/input")
6+
sample_submission_files = list(input_dir.glob("*sample_submission*.csv"))
7+
8+
if not sample_submission_files:
9+
print("Error: No sample submission file found in /kaggle/input/")
10+
exit(1)
11+
12+
# Use first matching file
13+
sample_submission_name = sample_submission_files[0].name
14+
SAMPLE_SUBMISSION_PATH = str(sample_submission_files[0])
15+
print(f"Using sample submission file: {sample_submission_name}")
16+
417
# Check if the sample submission file exists
5-
if not Path("/kaggle/input/sample_submission.csv").exists():
18+
if not Path(SAMPLE_SUBMISSION_PATH).exists():
19+
print(f"Error: {sample_submission_name} not found at {SAMPLE_SUBMISSION_PATH}")
620
exit(0)
721

8-
sample_submission = pd.read_csv('/kaggle/input/sample_submission.csv')
22+
23+
sample_submission = pd.read_csv(SAMPLE_SUBMISSION_PATH)
924
our_submission = pd.read_csv('submission.csv')
1025

1126
success = True
1227
# Print the columns of the sample submission file
13-
print("Columns in sample_submission.csv:", sample_submission.columns)
28+
print(f"Columns in {sample_submission_name}:", sample_submission.columns)
1429
print("Columns in our_submission.csv:", our_submission.columns)
1530

1631
for col in sample_submission.columns:
@@ -19,7 +34,7 @@ for col in sample_submission.columns:
1934
print(f'Column {col} not found in submission.csv')
2035

2136
if success:
22-
print('submission.csv\'s columns aligns with sample_submission.csv .')
37+
print(f'submission.csv\'s columns aligns with {sample_submission_name} .')
2338

2439

2540
# Print the first 5 rows of the two submission files, with columns separated by commas.
@@ -35,7 +50,7 @@ def print_first_rows(file_path, file_name, num_rows=5):
3550
except FileNotFoundError:
3651
print(f"Error: {file_name} not found.")
3752

38-
print_first_rows('/kaggle/input/sample_submission.csv', 'sample_submission.csv')
53+
print_first_rows(SAMPLE_SUBMISSION_PATH, sample_submission_name)
3954
print_first_rows('submission.csv', 'submission.csv')
4055

41-
print("\nPlease Checked the content of the submission file(submission.csv should align with sample_submission.csv). ")
56+
print(f"\nPlease Checked the content of the submission file(submission.csv should align with {sample_submission_name}). ")

0 commit comments

Comments (0)