# Python example: load a CSV dataset and split it into training and test sets.
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
# Load the data.
df = pd.read_csv('your_data.csv')

# Preview the first few rows.
print(df.head())

# Assume the dataset has a target variable 'target' and some feature
# variables 'feature1', 'feature2', ...
X = df[['feature1', 'feature2']]
y = df['target']

# Split the data into training and test sets.
# test_size=0.2 holds out 20% of the rows for testing; the fixed random_state
# makes the shuffle (and therefore the split) reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)