File size: 579 Bytes
2ed2129
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
from course_search.search_system.data_pipeline import DataPipeline
import logging

def test_pipeline():
    """Run the data pipeline end to end and print a short summary of its output.

    Creates a ``DataPipeline``, calls ``run_pipeline`` with
    ``save_path='data/courses_with_embeddings.pkl'``, and then prints:

    * the result's ``info()`` summary,
    * the ``title`` and ``description`` of the first row,
    * the ``shape`` of the first row's ``embeddings`` value.

    The result is assumed to be a pandas DataFrame (it is used via ``.info()``
    and ``.iloc``) -- confirm against ``DataPipeline.run_pipeline``.

    Returns:
        None. This is a manual smoke test; everything is reported on stdout.
    """
    pipeline = DataPipeline()

    # Run pipeline and save results
    df = pipeline.run_pipeline(save_path='data/courses_with_embeddings.pkl')

    # Print results
    print("\nDataFrame Info:")
    # DataFrame.info() writes its report to stdout itself and returns None,
    # so wrapping it in print() would append a stray "None" line.
    df.info()

    # The first row is used as the sample; positional access with iloc[0]
    # fails if the pipeline produced no rows.
    first_row = df.iloc[0]
    print("\nSample Course:")
    print(first_row[['title', 'description']].to_dict())
    print("\nSample Embedding Shape:", first_row['embeddings'].shape)

# Script entry point: only runs when this file is executed directly,
# not when it is imported as a module.
if __name__ == "__main__":
    # Configure the root logger at INFO level before the pipeline runs so
    # INFO-level log records emitted during the run are shown.
    logging.basicConfig(level=logging.INFO)
    test_pipeline()