Я использую индексирование через .loc и булеву маску, которую создаёт метод .isin:
import pandas as pd
# Load the complete recipe data set. DataFrame.size is the total number of
# cells (rows x columns), not the row count.
original_df = pd.read_csv('recipeData.csv', encoding='latin-1')
print(original_df.size)  # 1698803

# Styles to keep, written as one comma-separated string and split into a list.
styles_list = "American IPA, American Pale Ale, Saison, American Light Lager, American Amber Ale".split(', ')

# Build a boolean mask that is True wherever the row's 'Style' value is one of
# the wanted styles, then select those rows with .loc.
style_mask = original_df['Style'].isin(styles_list)
new_df = original_df.loc[style_mask]
print(new_df.size)  # 608419