Support various block sizes & Change default block size to 16 (#38)
This commit is contained in:
@@ -268,6 +268,7 @@ if __name__ == '__main__':
 f'{model_name}-tp{args.tensor_parallel_size}',
 sample_dir,
 'cacheflow',
+f'block{args.block_size}',
 f'req-rate-{args.request_rate}',
 f'seed{args.seed}',
 f'duration-{args.duration}',
Reference in New Issue
Block a user