Overview¶
In this competition, your goal is to design a recommender system that suggests news articles to users. The performance of your recommender system will be assessed using a simulation environment.
At each timestep, the simulation environment randomly selects an active user with a given `user_id`. Once you receive this `user_id`, your recommender system must generate a slate (a list of 5 distinct `item_id`s to recommend to the current user) and pass it to the environment. The environment then uses its internal information to determine which item the user will choose from the recommended list (with some degree of stochasticity), or whether the user chooses no item due to a lack of interest.
Each user has a latent patience value (invisible to your recommender system), which slightly increases when an item is chosen and drastically decreases when no item is chosen in a round. If a user's patience drops below 0, or the user runs out of the time budget (2000 timesteps), the user leaves the environment. The chosen `item_id` (or `-1` if no item is chosen) and whether the current user stays (`True`) or leaves (`False`) are returned as the result of recommending a slate of items. After the current user's response is generated, a new user (if any) is randomly selected for recommendations in the next timestep.
Your recommender system should continue recommending items to the current user at each timestep as long as there are still active users in the environment. The simulation process terminates after all users have left the system.
Your goal is to maximize the session length of each user. The session length is defined as the number of timesteps a user interacts with your recommender system before leaving the environment. A session length score for each user, normalized to the range 0 ~ 1, is provided by the simulation environment after the simulation process completes.
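The exact normalization formula is internal to the environment, but the random-baseline scores shown later (about 0.0025 for sessions lasting a handful of timesteps, against a 2000-timestep horizon) are consistent with a simple `session_length / HORIZON` scaling. A hedged sketch of that assumption:

```python
HORIZON = 2000  # per-user time budget, as stated above

def normalized_score(session_length: int, horizon: int = HORIZON) -> float:
    """Hypothetical normalization: score = session_length / horizon.

    The environment's actual formula is hidden; this is only a plausible
    reading consistent with the baseline scores shown later in the notebook.
    """
    return session_length / horizon
```

Under this reading, a user who survives the full horizon scores 1.0, and a user who leaves after 5 timesteps scores 0.0025.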
import os
import random
import numpy as np
import pandas as pd
from tqdm import tqdm
from evaluation.environment import TrainingEnvironment, TestingEnvironment
# Official hyperparameters for this competition (do not modify)
N_TRAIN_USERS = 1000
N_TEST_USERS = 2000
N_ITEMS = 209527
HORIZON = 2000
TEST_EPISODES = 5
SLATE_SIZE = 5
Datasets¶
In this competition, we won't provide a substantial user-item interaction dataset. Instead, only limited historical interaction information (3 clicked items per user) is available. To train your recommender system effectively, you will need a recommender policy that interacts with the training environment to collect additional interaction data.
We will introduce the side-information datasets provided in the following sections.
# Dataset paths
USER_DATA = os.path.join('dataset', 'user_data.json')
ITEM_DATA = os.path.join('dataset', 'item_data.json')
# Output file path
OUTPUT_PATH = os.path.join('output', 'output.csv')
User Data¶
In the training environment, there are a total of 1000 users identified by IDs ranging from 0 to 999. For the testing environment, there are 2000 users with IDs ranging from 0 to 1999. The testing environment includes the same 1000 users found in the training environment (user 0 to user 999), and an additional 1000 new users (user 1000 to user 1999) are introduced.
For all 2000 users, we provide you with the past 3 clicked item IDs of each user. Let's examine the user dataset.
df_user = pd.read_json(USER_DATA, lines=True)
df_user
| | user_id | history |
|---|---|---|
| 0 | 0 | [42558, 65272, 13353] |
| 1 | 1 | [146057, 195688, 143652] |
| 2 | 2 | [67551, 85247, 33714] |
| 3 | 3 | [116097, 192703, 103229] |
| 4 | 4 | [68756, 140123, 135289] |
| ... | ... | ... |
| 1995 | 1995 | [95090, 131393, 130239] |
| 1996 | 1996 | [2360, 147130, 8145] |
| 1997 | 1997 | [99794, 138694, 157888] |
| 1998 | 1998 | [55561, 60372, 51442] |
| 1999 | 1999 | [125409, 77906, 124792] |
2000 rows × 2 columns
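A natural first step with this table is to flatten each 3-item history into individual (user, item) interaction pairs, for example with `pandas.DataFrame.explode`. A minimal sketch on a toy version of the data (the two rows mirror the first rows shown above):

```python
import pandas as pd

# Toy stand-in for df_user; the real frame has 2000 rows
df_user = pd.DataFrame({
    'user_id': [0, 1],
    'history': [[42558, 65272, 13353], [146057, 195688, 143652]],
})

# One row per (user, clicked item) pair
interactions = (
    df_user.explode('history')
           .rename(columns={'history': 'item_id'})
           .reset_index(drop=True)
)
```

This long format is what most collaborative-filtering or sequence models expect, and rows collected from the environment later can be appended to it in the same shape.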
Item Data¶
Both the training and testing environments share a common candidate pool of 209527 items. As side information for these items, we provide text descriptions of each news article. The item dataset is derived from the News Category Dataset. It's important to note that you should only use the dataset provided by us; utilizing the original dataset, which contains extra information, will be considered cheating. Let's explore the item dataset.
df_item = pd.read_json(ITEM_DATA, lines=True)
df_item
| | item_id | headline | short_description |
|---|---|---|---|
| 0 | 0 | Over 4 Million Americans Roll Up Sleeves For O... | Health experts said it is too early to predict... |
| 1 | 1 | American Airlines Flyer Charged, Banned For Li... | He was subdued by passengers and crew when he ... |
| 2 | 2 | 23 Of The Funniest Tweets About Cats And Dogs ... | "Until you have a dog you don't understand wha... |
| 3 | 3 | The Funniest Tweets From Parents This Week (Se... | "Accidentally put grown-up toothpaste on my to... |
| 4 | 4 | Woman Who Called Cops On Black Bird-Watcher Lo... | Amy Cooper accused investment firm Franklin Te... |
| ... | ... | ... | ... |
| 209522 | 209522 | RIM CEO Thorsten Heins' 'Significant' Plans Fo... | Verizon Wireless and AT&T are already promotin... |
| 209523 | 209523 | Maria Sharapova Stunned By Victoria Azarenka I... | Afterward, Azarenka, more effusive with the pr... |
| 209524 | 209524 | Giants Over Patriots, Jets Over Colts Among M... | Leading up to Super Bowl XLVI, the most talked... |
| 209525 | 209525 | Aldon Smith Arrested: 49ers Linebacker Busted ... | CORRECTION: An earlier version of this story i... |
| 209526 | 209526 | Dwight Howard Rips Teammates After Magic Loss ... | The five-time all-star center tore into his te... |
209527 rows × 3 columns
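Since the only item side information is text, a simple starting point is to embed each article by concatenating its headline and short description and vectorizing the result, for instance with scikit-learn's `TfidfVectorizer` (assuming scikit-learn is available in your setup; a pretrained text encoder is also allowed per the rules below). A sketch on a toy corpus:

```python
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer

# Toy stand-in for df_item; the real frame has 209527 rows
df_item = pd.DataFrame({
    'headline': ['Over 4 Million Americans Roll Up Sleeves',
                 'American Airlines Flyer Charged, Banned'],
    'short_description': ['Health experts said it is too early to predict',
                          'He was subdued by passengers and crew'],
})

# One text document per item
texts = (df_item['headline'] + ' ' + df_item['short_description']).tolist()

# Sparse TF-IDF item features; swap in a pretrained encoder for dense vectors
vectorizer = TfidfVectorizer(max_features=50_000)
item_features = vectorizer.fit_transform(texts)
```

The resulting row vectors can back a content-based policy (e.g. recommending items most similar to a user's history) or serve as input features to a learned model.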
Simulation Environments¶
We offer two simulation environments in this competition: `TrainingEnvironment` and `TestingEnvironment`. The only distinction between the two is the number of users: 1000 for training and 2000 for testing. All public methods behave the same in both environments since they share the same base class.
Important Note: Ensure that you collect interaction data only by accessing the environment through the designated public methods listed below. Directly accessing or modifying any file or code in the `evaluation` directory, or retrieving internal attributes and states of the environment (including all attributes / methods starting with an underscore `_`), will be considered cheating.
Environment Public Methods¶
Note that both `TrainingEnvironment` and `TestingEnvironment` share the same set of public methods.
function `reset`¶
`reset() → None`
Reset the environment to its initial parameters and states.
function `has_next_state`¶
`has_next_state() → bool`
Verify whether the next state exists. The next state is considered to exist if there is at least one user still present in the environment.
Returns:
`True` if the next state exists, `False` otherwise.
function `get_state`¶
`get_state() → int`
Get the current state (the user ID of the current user).
Returns:
`int`: The user ID of the current user, or `-1` if there are no active users in the environment.
function `get_response`¶
`get_response(slate: list) → tuple[int, bool]`
Send the recommended slate (list of 5 distinct item IDs) and get the response from the current user. The internal user state will be updated according to the response, and a random user will be selected to be the next user (next state).
Args:
`slate` (`list[int]`): A list of 5 distinct item IDs to be recommended.
Returns:
`tuple[int, bool]`: The first entry is the item ID chosen by the user, or `-1` if the user chooses no item. The second entry indicates whether the user is still in the environment after this interaction round: `True` if the user stays, `False` if the user leaves.
Raises:
`AssertionError`: If the slate length is not 5, if the slate contains duplicate or out-of-range item IDs, or if there are no active users in the environment.
function `get_score`¶
`get_score() → list[float]`
Get the normalized session length score (0 ~ 1) for each user.
Returns:
`list[float]`: A list containing the normalized session length score for each user.
Training¶
The implementation of the recommender algorithm is left to you. If you're in need of ideas, you can refer to the Recommender Systems Tutorial notebook in Lecture 16. Here, we'll just provide some example use cases of the public methods.
Hint: If you're looking for inspiration, consider starting by collecting interaction data from the environment using your initial recommender policy. Afterward, improve your model with this data, and iterate through this collect-then-train loop.
Important Note: Ensure that you save your model weights after training. You will need to load a set of model weights trained exclusively on the training environment at the beginning of each test episode.
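The collect-then-train loop from the hint can be sketched as a function over the public methods above. The real notebook uses `TrainingEnvironment`; here a stub environment stands in so the sketch is self-contained, and `collect_episode` / `random_policy` are placeholder names:

```python
import random

class StubEnv:
    """Toy stand-in for TrainingEnvironment (same public interface)."""
    def __init__(self, steps=10):
        self.steps = steps
        self.t = 0
    def reset(self):
        self.t = 0
    def has_next_state(self):
        return self.t < self.steps
    def get_state(self):
        return 0  # single fake user
    def get_response(self, slate):
        assert len(slate) == len(set(slate)) == 5
        self.t += 1
        return random.choice(slate + [-1]), self.t < self.steps

def collect_episode(env, policy):
    """Run one episode, logging (user_id, slate, clicked_id) tuples."""
    logs = []
    env.reset()
    while env.has_next_state():
        user_id = env.get_state()
        slate = policy(user_id)
        clicked_id, stays = env.get_response(slate)
        logs.append((user_id, slate, clicked_id))
    return logs

# Example: one episode under a random policy; retrain on `logs`, repeat
random_policy = lambda user_id: random.sample(range(100), k=5)
logs = collect_episode(StubEnv(), random_policy)
```

After each collection pass you would fit or fine-tune your model on `logs`, swap the improved model in as the policy, and iterate.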
# Initialize the training environment
train_env = TrainingEnvironment()
# Reset the training environment (this can be useful when you have finished one episode of simulation and do not want to re-initialize a new environment)
train_env.reset()
# Check if there exist any active users in the environment
env_has_next_state = train_env.has_next_state()
print(f'There are {"still some" if env_has_next_state else "no"} active users in the training environment.')
# Get the current user ID
user_id = train_env.get_state()
print(f'The current user is user {user_id}.')
# Get the response of recommending the slate to the current user
slate = [0, 1, 2, 3, 4]
clicked_id, in_environment = train_env.get_response(slate)
print(f'The click result of recommending {slate} to user {user_id} is {f"item {clicked_id}" if clicked_id != -1 else f"{clicked_id} (no click)"}.')
print(f'User {user_id} {"is still in" if in_environment else "leaves"} the environment.')
# Get the normalized session length score of all users
train_score = train_env.get_score()
df_train_score = pd.DataFrame([[user_id, score] for user_id, score in enumerate(train_score)], columns=['user_id', 'avg_score'])
df_train_score
There are still some active users in the training environment. The current user is user 412. The click result of recommending [0, 1, 2, 3, 4] to user 412 is -1 (no click). User 412 is still in the environment.
| | user_id | avg_score |
|---|---|---|
| 0 | 0 | 0.0 |
| 1 | 1 | 0.0 |
| 2 | 2 | 0.0 |
| 3 | 3 | 0.0 |
| 4 | 4 | 0.0 |
| ... | ... | ... |
| 995 | 995 | 0.0 |
| 996 | 996 | 0.0 |
| 997 | 997 | 0.0 |
| 998 | 998 | 0.0 |
| 999 | 999 | 0.0 |
1000 rows × 2 columns
Testing¶
While testing, you are allowed to update your model. However, please adhere to the following rules:
- Follow the testing template provided below. Modify only the sections marked as `[TODO]`, and carefully follow the instructions specified in each `[TODO]` section. Modifying other sections or not adhering to the instructions is strictly forbidden.
- Limit model updates to one testing episode. During testing-time updates, follow these steps: (a) Load your model weights trained exclusively on the training environment. (b) Run the testing environment and update your model with the data collected during the testing process. (c) Obtain the score for this testing episode and delete your model weights, since they now contain some testing information. You should not save model weights trained on the testing environment for use in another testing episode; doing so will be regarded as cheating.
- Due to the randomness in the user decision process, run the testing process 5 times and calculate the average session length for each user as the final score. This part has been covered for you.
- After completing the testing process, remember to submit the generated `output.csv` file to the Kaggle competition.
We will illustrate the testing process with a pure random recommender below.
# Initialize the testing environment
test_env = TestingEnvironment()
scores = []
# The item_ids here is for the random recommender
item_ids = [i for i in range(N_ITEMS)]
# Repeat the testing process 5 times
for _ in range(TEST_EPISODES):

    # [TODO] Load your model weights here (at the beginning of each testing episode)
    # [TODO] Code for loading your model weights...

    # Start the testing process
    with tqdm(desc='Testing') as pbar:

        # Run as long as there exist some active users
        while test_env.has_next_state():

            # Get the current user id
            cur_user = test_env.get_state()

            # [TODO] Employ your recommendation policy to generate a slate of 5 distinct items
            # [TODO] Code for generating the recommended slate...
            # Here we provide a simple random implementation
            slate = random.sample(item_ids, k=SLATE_SIZE)

            # Get the response of the slate from the environment
            clicked_id, in_environment = test_env.get_response(slate)

            # [TODO] Update your model here (optional)
            # [TODO] You can update your model at each step, or perform a batched update after some interval
            # [TODO] Code for updating your model...

            # Update the progress indicator
            pbar.update(1)

    # Record the score of this testing episode
    scores.append(test_env.get_score())

    # Reset the testing environment
    test_env.reset()

    # [TODO] Delete or reset your model weights here (at the end of each testing episode)
    # [TODO] Code for deleting your model weights...
# Calculate the average scores
avg_scores = [np.average(score) for score in zip(*scores)]
# Generate a DataFrame to output the result in a .csv file
df_result = pd.DataFrame([[user_id, avg_score] for user_id, avg_score in enumerate(avg_scores)], columns=['user_id', 'avg_score'])
df_result.to_csv(OUTPUT_PATH, index=False)
df_result
Testing: 10233it [00:19, 526.52it/s] Testing: 10293it [00:19, 541.22it/s] Testing: 10285it [00:19, 531.14it/s] Testing: 10244it [00:19, 533.77it/s] Testing: 10224it [00:19, 533.37it/s]
| | user_id | avg_score |
|---|---|---|
| 0 | 0 | 0.0025 |
| 1 | 1 | 0.0027 |
| 2 | 2 | 0.0025 |
| 3 | 3 | 0.0025 |
| 4 | 4 | 0.0025 |
| ... | ... | ... |
| 1995 | 1995 | 0.0027 |
| 1996 | 1996 | 0.0025 |
| 1997 | 1997 | 0.0025 |
| 1998 | 1998 | 0.0025 |
| 1999 | 1999 | 0.0025 |
2000 rows × 2 columns
Scoring¶
- Ranking on the private leaderboard of the Kaggle competition. (80%)
- Report. (20%)
How is the Score For Ranking Calculated:¶
We will calculate the MAE (Mean Absolute Error) between your submitted `output.csv` and a "ground truth" of all 1s. Lower is better.
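Concretely, since every ground-truth value is 1 and all scores lie in [0, 1], the MAE reduces to 1 minus the mean of your submitted `avg_score` column, so maximizing average session length directly minimizes the ranking metric:

```python
import numpy as np

# Toy avg_score column; real values come from output.csv
avg_scores = np.array([0.0025, 0.0027, 0.0025])

# MAE against a ground truth of all ones
mae = np.abs(avg_scores - 1.0).mean()

# Equivalent form, since every score lies in [0, 1]
assert np.isclose(mae, 1.0 - avg_scores.mean())
```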
Your Report Should Contain:¶
- Models you have tried during the competition. Briefly describe the main idea of the model and the reason why you chose that model.
- List the experiments you have done. For instance, data collecting, utilizing the user / item datasets, hyperparameters tuning, training process, and so on.
- Discussions, lessons learned, or anything else worth mentioning.
- Ensure your report notebook contains your training and testing code. We will re-run your code if we find your score on Kaggle suspicious.
Please name your report DL_comp4_{Your Team name}_report.ipynb and submit it to the eeclass system before the deadline.
What You Can Do¶
- Implement any recommender models.
- Collect data through accessing the public methods provided by the environments (i.e. methods listed in the Environment Public Methods section) and train your model.
- Use the provided user history data (`dataset/user_data.json`) and item text description data (`dataset/item_data.json`) as auxiliary data to aid your model training.
- Update the model during one testing episode while following the rules mentioned in the Testing section.
- Use a pretrained text encoder if you need text embeddings for the item text descriptions. (This is the only part of this competition where you may use a pretrained model.)
What You CAN NOT Do¶
- Use any dataset other than the provided ones. Using the original News Category Dataset is also prohibited.
- Use any pretrained recommender models.
- Plagiarize other teams' work.
- Hack our simulation environments. Any attempt to access or modify the data files in the `evaluation` directory, modify the source code of the environments, access or modify private attributes and methods (i.e. methods and attributes not listed in the Environment Public Methods section), not follow the rules in the Testing section, or any other forbidden action mentioned earlier in this notebook will be regarded as cheating.
Competition Timeline¶
- 2024/01/08 (Mon): Competition launched.
- 2024/01/15 (Mon) 08:00 (TW): Competition deadline.
- 2024/01/16 (Tue) 12:00 (TW): Report deadline.
- 2024/01/16 (Tue) 15:30 (TW): Top-3 teams sharing.
References¶
- Misra, Rishabh. "News Category Dataset." arXiv preprint arXiv:2209.11429 (2022).
- Misra, Rishabh and Jigyasa Grover. "Sculpting Data for ML: The first act of Machine Learning." ISBN 9798585463570 (2021).