-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathexplore_hwu64.py
22 lines (19 loc) · 1.24 KB
/
explore_hwu64.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# Created by xunannancy at 2024/03/04
from explore_banking77 import save_labels, retrieve_labels_sbert_train_examples, prepare_data_sparse_retrieval, \
construct_dataset
from dataset_utilities import label_check
if __name__ == '__main__':
    # Driver for the HWU64 dataset. It reuses the helpers written for
    # BANKING77 and runs them in three stages: label export/check, per-setting
    # label retrieval + sparse-retrieval preparation, and dataset construction
    # for every split.
    parent = 'HWU64'
    model_name = 'gtr-t5-xl'
    few_shot_settings = ['train_5', 'train_10']

    # Stage 1: export the label set, then run the label check on it.
    save_labels(dataset=parent)
    label_check(dataset=parent)

    # Stage 2: one retrieval pass and one sparse-retrieval preparation per
    # few-shot setting.
    for few_shot in few_shot_settings:
        # The same tag names the retrieval source and, prefixed with
        # 'combined_', the nickname of the prepared label set.
        source_tag = f'{few_shot}_{model_name}_-1examples'
        retrieve_labels_sbert_train_examples(
            dataset=parent,
            setting=few_shot,
            batch_examples=5,
            model_name=model_name,
        )
        # Only a single word budget is used at the moment.
        for word_budget in (100,):
            prepare_data_sparse_retrieval(
                num_words=word_budget,
                with_text=True,
                source_list=[source_tag],
                nickname=f'combined_{source_tag}',
                dataset=parent,
            )

    # Stage 3: build every split once per label nickname produced in stage 2.
    label_nicknames = [
        f'combined_{few_shot}_{model_name}_-1examples'
        for few_shot in few_shot_settings
    ]
    for split in ['train_5', 'train_10', 'valid', 'train', 'test']:
        for nickname in label_nicknames:
            # Only the with_question_flag=False variant is built; the original
            # author left [True, False] as a commented-out alternative.
            for ask_question in (False,):
                construct_dataset(
                    dataset=split,
                    label_nickname=nickname,
                    parent_dataset=parent,
                    with_question_flag=ask_question,
                )