downsized samples to max of 10k
This commit is contained in:
parent
6a31e8fa7f
commit
b06dad23af
|
@@ -13,7 +13,7 @@ class UpscaleDataset(Dataset):
|
|||
combined_df = pd.DataFrame()
|
||||
for parquet_file in parquet_files:
|
||||
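# Load only the two image columns and keep the first rows of each file (the file is read in full before head() truncates it; no chunked reading happens here)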
|
||||
df = pd.read_parquet(parquet_file, columns=['image_512', 'image_1024']).head(10000)
|
||||
df = pd.read_parquet(parquet_file, columns=['image_512', 'image_1024']).head(5000)
|
||||
combined_df = pd.concat([combined_df, df], ignore_index=True)
|
||||
|
||||
# Validate data format
|
||||
|
|
Loading…
Reference in New Issue