from table_utils import encode_table
import pandas as pd


# Ad-hoc inspection script: load the parquet file at `file_path` into a
# DataFrame, then print a preview of it followed by its row count.
file_path = 'data/processed_data/formula/qwen/multihiertt/train.parquet'
df = pd.read_parquet(file_path)

# Preview: the leading rows as returned by DataFrame.head() with its default.
preview = df.head()
print(preview)

# Total number of rows in the loaded frame.
row_count = len(df)
print(row_count)

# Optional manual checks, left disabled. Uncomment to inspect a single record.
# NOTE(review): these assume the frame has 'question', 'answer' and 'table'
# columns and that encode_table accepts the keyword arguments below -- confirm
# against the dataset and table_utils before relying on them.
# print(df.columns)
# idx = 10
# print(df['question'].iloc[idx])
# print(df['answer'].iloc[idx])
# print(encode_table(df['table'].iloc[idx], with_address=True, remove_break_in_cell=True))

