# test.yml
---
# Experiment configuration: dataset inputs, preprocessing, splitting,
# models, evaluation and report output.
#
# NOTE(review): the original indentation of this file was lost, so the
# nesting below was reconstructed from the key names. Confirm it against
# the schema expected by the code that loads this file.
experiment:
  dataset:
    name: ml-100k

    # Item dataset (mandatory; must provide at least item_id).
    item:
      path: datasets/ml-100k/processed/item.csv
      # Feature columns besides item_id to be used.
      extra_features: [movie_year, movie_title]

    # User dataset (mandatory; must provide at least user_id).
    user:
      path: datasets/ml-100k/processed/user.csv
      # Feature columns besides user_id to be used.
      extra_features: [gender, occupation]

    # Ratings dataset (mandatory; at least [user_id, item_id, rating]).
    ratings:
      path: datasets/ml-100k/processed/rating.csv
      timestamp: true

    # NOTE(review): `enrich` is assumed to be nested under `dataset`;
    # it may instead belong directly under `experiment` - confirm.
    enrich:
      map_path: datasets/ml-100k/processed/map.csv
      enrich_path: datasets/ml-100k/processed/enriched.csv
      remove_unmatched: false
      properties: [subject, director]

  preprocess:
    # - method: filter_by_rating
    #   parameters:
    #     threshold: 20
    # - method: binarize
    #   parameters:
    #     threshold: 4
    - method: filter_kcore
      parameters:
        k: 20
        iterations: 1
        target: user  # user or rating

  split:
    seed: 42

    # Disabled alternative: random_by_ratio at global level.
    # test:
    #   method: random_by_ratio
    #   level: global
    #   p: 0.2
    # validation:
    #   method: random_by_ratio
    #   level: global
    #   p: 0.2

    # Disabled alternative: timestamp_by_ratio at user level.
    # test:
    #   method: timestamp_by_ratio
    #   level: user
    #   p: 0.1
    # validation:
    #   level: user
    #   method: timestamp_by_ratio
    #   p: 0.2

    # Disabled alternative: fixed_timestamp.
    # test:
    #   method: fixed_timestamp
    #   # type: global_level
    #   timestamp: 890000000
    # validation:
    #   method: fixed_timestamp
    #   timestamp: 880000000

    # Active split: k_fold with k = 2 at user level.
    test:
      method: k_fold
      k: 2
      level: "user"

  models:
    - name: deepwalk_based
      config:
        save_weights: true
      # NOTE(review): `parameters` is assumed to be a sibling of `config`
      # (not nested inside it) - confirm.
      parameters:
        walk_len: 10
        p: 1.0
        q: 1.0
        n_walks: 50
        embedding_size: 64
        epochs: 1

  evaluation:
    k: 5
    relevance_threshold: 0
    metrics: [MAP, nDCG]

  report:
    # NOTE(review): the file name contains "k10" while evaluation.k is 5;
    # confirm the output name is the intended one.
    file: "experiment_results/ml100k_enriched/runk10.csv"