File size: 787 Bytes
f83431c
 
320450f
f83431c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
import pandas as pd

# Load the full data dump from its parquet file using the pyarrow engine.
parquet_file = 'data/data_dump_ai_assingment.parquet'
df = pd.read_parquet(parquet_file, engine='pyarrow')

# Setting 3 campaigns aside as testing examples for the final models.
campaign_ids = [8, 123, 256]
# `isin` already yields a boolean mask, so no `== True` comparison is needed.
# `.copy()` gives the held-out frame its own data, independent of `df`.
df_final_testing = df[df['campaign_id'].isin(campaign_ids)].copy()

def get_unique_lead_ids(df: pd.DataFrame, campaign_id) -> list:
    """Return the distinct lead ids that belong to one campaign.

    Args:
        df: Frame with ``campaign_id`` and ``lead_id`` columns.
        campaign_id: Value matched against the ``campaign_id`` column.

    Returns:
        The unique ``lead_id`` values of the matching rows, in order of
        first appearance; an empty list when no row matches.
    """
    # Filter the frame that was passed in. Reading a module-level frame here
    # would silently ignore the `df` argument.
    campaign_rows = df[df['campaign_id'] == campaign_id]
    return list(campaign_rows['lead_id'].unique())

# Collect the unique lead ids of each held-out campaign, rendered as strings.
leads_8 = [str(lead) for lead in get_unique_lead_ids(df_final_testing, 8)]
leads_123 = [str(lead) for lead in get_unique_lead_ids(df_final_testing, 123)]
leads_256 = [str(lead) for lead in get_unique_lead_ids(df_final_testing, 256)]