blip2_triviaqa_viquae / config_kwargs.json
usr256864's picture
Upload 3 files
0de94d5 verified
{
"monitor_metric": "eval_exact_match",
"trainer_kwargs": {
"class_name": "RA_Reader"
},
"trainee_kwargs": {
"class_name": "Encoder_Generator",
"loss": {
"class_name": "NLLLoss"
},
"freeze_prefixes": [],
"use_image": true,
"quantize": false,
"codebook_kwargs": {
"class_name": "GroupedResidualVQ",
"decay": 0.5,
"commitment_weight": 1,
"dim": 1280,
"codebook_size": 1024,
"num_quantizers": 128,
"groups": 8,
"sample_codebook_temp": 0.0,
"learnable_codebook": false,
"use_cosine_sim": false,
"shared_codebook": false,
"kmeans_init": false
}
},
"data_module_kwargs": {
"class_name": "multi_modal_DataModule",
"data_processor": {
"class_name": "viquae_data_processor",
"dataset_path": "../../all_data/",
"kb_path": "../../all_data/passages/",
"entity_kb_path": "../../all_data/kb/"
},
"relevant_indices_key": "BM25_provenance_indices",
"irrelevant_indices_key": "BM25_irrelevant_indices",
"input_key": "input",
"passage_key": "passage",
"dataloader_kwargs": {
"num_workers": 6,
"prefetch_factor": 2
},
"image_processor_kwargs": {
"class_name": "ImageFormatter",
"feature_extractor_kwargs": {
"class_name": "CLIPFeatureExtractor",
"pretrained_model_name_or_path": "clip-vit-base-patch32_FE"
}
}
},
"answer_generator_kwargs": {
"class_name": "Blip2ForConditionalGeneration",
"checkpoint_name": "answer_generator",
"checkpoint": "saved_models/blip2_triviaqa/answer_generator/pytorch_model.bin",
"title_key": "wikipedia_title",
"column": "my_DPR_few_shot",
"pretrained_model_name_or_path": "/home/data/meerqat/my_transformers_cache/blip2",
"k_train": 5,
"k_test": 5,
"k_entities": 3,
"rag_training": false,
"rag": false,
"generator_only": true,
"entity_prompt": false,
"beam_search": true,
"best_answer": false,
"best_entity": false,
"tokenizer_kwargs": {
"class_name": "Blip2Processor",
"pretrained_model_name_or_path": "blip2_processor"
},
"image_processor_kwargs": {
"class_name": "ImageFormatter",
"feature_extractor_kwargs": {
"class_name": "Blip2Processor",
"pretrained_model_name_or_path": "blip2_processor"
}
},
"inference_path": "saved_models/blip2_triviaqa_viquae/answer_generator"
}
}