philipphager/example.py

## example.py
# Dependencies to install. Pandas for dataframes, pyarrow to support the .parquet file format.
# pip install pandas
# pip install pyarrow

# Load a downloaded dataset from file:
train_df = pd.read_parquet("mslr_train.parquet")
train_df.head()

# The dataset contains 136 features per query-document (columns starting with 'feature_*')
# E.g. one way to select all columns starting with 'feature_'
train_df.filter(regex="^feature_", axis=1).head()

# The field query_id signals which query-document vectors belong to the same search query.
train_df["query_id"].head()

# The relevance column contains the human expert judgments how relevant each document was for the current query (scale 0 - 4)
train_df["relevance"].head()
	# Dependencies to install. Pandas for dataframes, pyarrow to support the .parquet file format.
	# pip install pandas
	# pip install pyarrow

	# Load a downloaded dataset from file:
	train_df = pd.read_parquet("mslr_train.parquet")
	train_df.head()

	# The dataset contains 136 features per query-document (columns starting with 'feature_*')
	# E.g. one way to select all columns starting with 'feature_'
	train_df.filter(regex="^feature_", axis=1).head()

	# The field query_id signals which query-document vectors belong to the same search query.
	train_df["query_id"].head()

	# The relevance column contains the human expert judgments how relevant each document was for the current query (scale 0 - 4)
	train_df["relevance"].head()