# Import libraries
import pandas as pd
import jellyfish
# Read both input datasets. pandas loads empty cells as NaN (a float).
df1 = pd.read_csv('data1.csv')
df2 = pd.read_csv('data2.csv')

# Create the join column in each dataset: the Soundex code of column 'data1'
# (first dataset) and column 'data3' (second dataset).
# na_action='ignore' keeps missing values as NaN instead of handing them to
# jellyfish.soundex, which expects a string and would otherwise raise.
df1['soundex'] = df1['data1'].map(jellyfish.soundex, na_action='ignore')
df2['soundex'] = df2['data3'].map(jellyfish.soundex, na_action='ignore')

# Merge both datasets (inner join) on the Soundex code. Rows without a code
# are excluded first: pandas matches null keys against each other, which
# would pair up every row that has a missing value on both sides.
df = pd.merge(
    df1.dropna(subset=['soundex']),
    df2.dropna(subset=['soundex']),
    on=['soundex'],
)

# Export the joined result to CSV without the positional index column.
df.to_csv('joined_data.csv', encoding='utf-8', index=False)