aprender-train 0.29.0

Training & Optimization library with autograd, LoRA, quantization, and model merging
1
2
3
4
5
6
7
8
9
10
11
12
import pandas as pd
import numpy as np

# Create data where features is a list of floats (simulating a vector)
# The example parquet_data.yaml expects columns [features, label]
data = {
    'features': [np.random.rand(10).tolist() for _ in range(100)],
    'label': np.random.randint(0, 2, 100)
}
df = pd.DataFrame(data)
df.to_parquet('data/train.parquet')
print("Successfully created data/train.parquet")