Skip to content

Commit

Permalink
[Modelzoo] Change prefetch setting in data processing. (DeepRec-AI#212)
Browse files Browse the repository at this point in the history
Signed-off-by: Duyi-Wang <[email protected]>
  • Loading branch information
Duyi-Wang authored May 11, 2022
1 parent 08fc710 commit 61020d2
Show file tree
Hide file tree
Showing 6 changed files with 6 additions and 12 deletions.
3 changes: 1 addition & 2 deletions modelzoo/DIEN/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -640,11 +640,10 @@ def parse_csv(value, neg_value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # set seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv,
num_parallel_calls=tf.data.experimental.AUTOTUNE)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down
3 changes: 1 addition & 2 deletions modelzoo/DIN/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -467,11 +467,10 @@ def parse_csv(value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # set seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv,
num_parallel_calls=tf.data.experimental.AUTOTUNE)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down
3 changes: 1 addition & 2 deletions modelzoo/DLRM/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -315,10 +315,9 @@ def parse_csv(value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # set seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv, num_parallel_calls=28)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down
3 changes: 1 addition & 2 deletions modelzoo/DSSM/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -291,10 +291,9 @@ def parse_csv(value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # fix seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv, num_parallel_calls=28)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down
3 changes: 1 addition & 2 deletions modelzoo/DeepFM/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -275,10 +275,9 @@ def parse_csv(value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # fix seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv, num_parallel_calls=28)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down
3 changes: 1 addition & 2 deletions modelzoo/WDL/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -318,10 +318,9 @@ def parse_csv(value):
dataset = dataset.shuffle(buffer_size=20000,
seed=args.seed) # fix seed for reproducing
dataset = dataset.repeat(num_epochs)
-dataset = dataset.prefetch(batch_size)
dataset = dataset.batch(batch_size)
dataset = dataset.map(parse_csv, num_parallel_calls=28)
-dataset = dataset.prefetch(1)
+dataset = dataset.prefetch(2)
return dataset


Expand Down

0 comments on commit 61020d2

Please sign in to comment.