| | |
"""
Simple smoke test covering data loading, GPU monitoring and tevatron argument
imports; it does not download any models.
"""
| |
|
| | import sys |
| | import os |
| | sys.path.append('src') |
| |
|
def test_data_only(data_path="data/the_vault/DOC_VAULT_train.tsv", nrows=5):
    """Smoke-test data loading, the GPU monitor and tevatron argument imports.

    The stages run in the order listed above and the function stops at the
    first one that raises. Progress is reported with ``print``.

    Args:
        data_path: Tab-separated file to sample. A relative path is resolved
            against the current working directory. The default is the path
            this script has always read.
        nrows: Number of rows to read from ``data_path``.

    Returns:
        True when every stage completed, False when any stage raised. On
        failure the error message is printed and the traceback is written
        via ``traceback.print_exc()``.
    """
    import traceback

    try:
        # Each dependency is imported at the stage that needs it, so the
        # progress output shows how far the run got when an import fails and
        # data loading is still exercised when tevatron is unavailable.
        print("Testing data loading...")
        import pandas as pd

        df = pd.read_csv(data_path, sep='\t', nrows=nrows)
        print(f"Loaded {len(df)} samples")
        print(f"Columns: {list(df.columns)}")

        print("Testing GPU monitor...")
        from tevatron.utils.gpu_monitor import GPUMemoryMonitor

        monitor = GPUMemoryMonitor(memory_threshold=0.8, check_interval=10)
        stats = monitor.get_memory_stats()
        print(f"GPU monitor initialized: {stats}")

        print("Testing tevatron imports...")
        # Imported only to prove that the names resolve; they are not used.
        from tevatron.arguments import GLENP1ModelArguments, GLENP1DataArguments  # noqa: F401
        print("Arguments imported successfully")

        print("Basic functionality test PASSED!")
        return True

    except Exception as e:
        # Script-level boundary: report any failure and turn it into a
        # boolean so the caller can map it to an exit status.
        print(f"Test failed: {e}")
        traceback.print_exc()
        return False


# The name matches pytest's ``test_*`` pattern, but this function reports its
# outcome through the return value rather than assertions, so pytest cannot
# interpret the result. Opt out of collection; run the file as a script.
test_data_only.__test__ = False
| |
|
if __name__ == "__main__":
    # Script entry point: exit with status 0 when the smoke test reports
    # success and 1 otherwise.
    exit_code = 0 if test_data_only() else 1
    sys.exit(exit_code)
| |
|