# vision/m4/evaluation/tasks/__init__.py (651 lines of code) (raw):
from m4.evaluation.tasks.base import (
BaseTask,
BaseTaskClassification,
BaseTaskImageCaptioning,
BaseTaskImageCaptionMatching,
BaseTaskOpenEndedVQA,
Predictor,
)
from m4.models.idefics.evaluation_captioning_in_context_idefics import (
CocoIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
CocoNewSplitsIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
CocoSampleIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenIdeficsImageCaptioningInContextTextGenMetrics,
Flickr30kNewSplitsIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
IIIT5KIdeficsImageCaptioningInContextExactMatch,
IIIT5KSampleIdeficsImageCaptioningInContextExactMatch,
NoCapsIdeficsImageCaptioningInContextTextGenMetrics,
NoCapsNewSplitsIdeficsImageCaptioningInContextTextGenMetrics,
NoCapsSampleIdeficsImageCaptioningInContextTextGenMetrics,
TextCapsIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsIdeficsImageCaptioningInContextTextGenMetrics,
TextCapsNewSplitsIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleIdeficsImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleIdeficsImageCaptioningInContextTextGenMetrics,
)
from m4.models.idefics.evaluation_classification_in_context_idefics import (
Caltech101IdeficsClassificationInContextMeanPerClassAccWithKLAndEntropy,
Caltech101SampleIdeficsClassificationInContextMeanPerClassAccWithKLAndEntropy,
Cifar10DummyIdeficsClassificationInContextAccWithKLAndEntropy,
Cifar10IdeficsClassificationInContextAccWithKLAndEntropy,
Cifar10SampleIdeficsClassificationInContextAccWithKLAndEntropy,
Cifar100IdeficsClassificationInContextAccWithKLAndEntropy,
Cifar100SampleIdeficsClassificationInContextAccWithKLAndEntropy,
ClevrIdeficsClassificationInContextAccWithKLAndEntropy,
ClevrNewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
ClevrSampleIdeficsClassificationInContextAccWithKLAndEntropy,
DTDIdeficsClassificationInContextAccWithKLAndEntropy,
DTDSampleIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceAgeIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceAgeNewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceAgeSampleIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceGenderIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceGenderNewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceGenderSampleIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceRaceIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceRaceNewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
FairFaceRaceSampleIdeficsClassificationInContextAccWithKLAndEntropy,
Food101IdeficsClassificationInContextAccWithKLAndEntropy,
Food101SampleIdeficsClassificationInContextAccWithKLAndEntropy,
HatefulMemesIdeficsClassificationInContextAccWithKLAndEntropyROCAUC,
HatefulMemesNewSplitsIdeficsClassificationInContextAccWithKLAndEntropyROCAUC,
IIIT5KIdeficsClassificationInContextAccWithKLAndEntropy,
IIIT5KSampleIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits1kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits5kSupportIdeficsClassificationInContextAccWithKLAndEntropy,
ImageNet1kSampleIdeficsClassificationInContextAccWithKLAndEntropy,
MMBenchNewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
NLVR2NewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
NLVR2SampleIdeficsClassificationInContextAccWithKLAndEntropy,
OxfordPetsIdeficsClassificationInContextMeanPerClassAccWithKLAndEntropy,
OxfordPetsSampleIdeficsClassificationInContextMeanPerClassAccWithKLAndEntropy,
RenderedSST2IdeficsClassificationInContextAccWithKLAndEntropy,
RenderedSST2NewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
RenderedSST2SampleIdeficsClassificationInContextAccWithKLAndEntropy,
ScienceQAIdeficsClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsIdeficsClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsOldSetupIdeficsClassificationInContextAccWithKLAndEntropy,
ScienceQASampleIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDAllIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDInstanceAttributesIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDInstanceIdentityIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDInstanceInteractionIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDInstanceLocationIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDInstancesCountingIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDSceneUnderstandingIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDSpatialRelationIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDTextUnderstandingIdeficsClassificationInContextAccWithKLAndEntropy,
SEEDVisualReasoningIdeficsClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kIdeficsClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kSampleIdeficsClassificationInContextAccWithKLAndEntropy,
SNLIVEImageOnlySampleIdeficsClassificationInContextAccWithKLAndEntropy,
SNLIVEImagePremiseSampleIdeficsClassificationInContextAccWithKLAndEntropy,
StanfordCarsIdeficsClassificationInContextAccWithKLAndEntropy,
StanfordCarsSampleIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddAttIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddObjIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceAttIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceObjIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceRelIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapAttIdeficsClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapObjIdeficsClassificationInContextAccWithKLAndEntropy,
SUN397IdeficsClassificationInContextAccWithKLAndEntropy,
SUN397SampleIdeficsClassificationInContextAccWithKLAndEntropy,
VisDialNewSplitsIdeficsClassificationInContextNDCG,
)
from m4.models.idefics.evaluation_classification_vqa_in_context_idefics import (
VQAv2IdeficsClassificationVQAInContextAcc,
VQAv2SampleIdeficsClassificationVQAInContextAcc,
)
from m4.models.idefics.evaluation_image_caption_matching_idefics import (
WinogroundIdeficsImageCaptionMatchingAccWithKLAndEntropy,
)
from m4.models.idefics.evaluation_open_ended_vqa_in_context_idefics import (
AdVQAIdeficsOpenEndedVQAInContextAcc,
AdVQASampleIdeficsOpenEndedVQAInContextAcc,
OKVQAIdeficsOpenEndedVQAInContextAcc,
OKVQANewSplitsIdeficsOpenEndedVQAInContextAcc,
OKVQASampleIdeficsOpenEndedVQAInContextAcc,
TextVQAIdeficsOpenEndedVQAInContextAcc,
TextVQANewSplitsIdeficsOpenEndedVQAInContextAcc,
TextVQASampleIdeficsOpenEndedVQAInContextAcc,
VizWizIdeficsOpenEndedVQAInContextAcc,
VizWizNewSplitsIdeficsOpenEndedVQAInContextAcc,
VizWizSampleIdeficsOpenEndedVQAInContextAcc,
VQAv2DummyIdeficsOpenEndedVQAInContextAcc,
VQAv2IdeficsOpenEndedVQAInContextAcc,
VQAv2NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part0NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part1NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part2NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part3NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part4NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2Part5NewSplitsIdeficsOpenEndedVQAInContextAcc,
VQAv2SampleIdeficsOpenEndedVQAInContextAcc,
)
from m4.models.idefics.evaluation_perplexity_in_context_idefics import (
Cm4IdeficsPerplexityInContextMaxSeLen512,
Cm4IdeficsPerplexityInContextMaxSeLen1024,
Cm4SampleIdeficsPerplexityInContextMaxSeLen512,
Cm4SampleIdeficsPerplexityInContextMaxSeLen1024,
CocoIdeficsPerplexityInContext,
CocoSampleIdeficsPerplexityInContext,
CommonGenIdeficsPerplexityInContext,
EnWikiIdeficsPerplexityInContextMaxSeLen512,
EnWikiIdeficsPerplexityInContextMaxSeLen1024,
EnWikiSampleIdeficsPerplexityInContextMaxSeLen512,
EnWikiSampleIdeficsPerplexityInContextMaxSeLen1024,
IIIT5KIdeficsPerplexityInContext,
IIIT5KSampleIdeficsPerplexityInContext,
MiniGPTCaptionsIdeficsPerplexityInContext,
NoCapsIdeficsPerplexityInContext,
NoCapsSampleIdeficsPerplexityInContext,
TextCapsIdeficsPerplexityInContext,
TextCapsSampleIdeficsPerplexityInContext,
)
from m4.models.vgpt2.evaluation_captioning_in_context_vgpt2 import (
CocoSampleVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
CocoVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVgpt2ImageCaptioningInContextTextGenMetrics,
IIIT5KSampleVgpt2ImageCaptioningInContextExactMatch,
IIIT5KVgpt2ImageCaptioningInContextExactMatch,
NoCapsSampleVgpt2ImageCaptioningInContextTextGenMetrics,
NoCapsVgpt2ImageCaptioningInContextTextGenMetrics,
TextCapsSampleVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleVgpt2ImageCaptioningInContextTextGenMetrics,
TextCapsVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsVgpt2ImageCaptioningInContextTextGenMetrics,
)
from m4.models.vgpt2.evaluation_classification_in_context_vgpt2 import (
Caltech101SampleVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
Caltech101Vgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
Cifar10DummyVgpt2ClassificationInContextAccWithKLAndEntropy,
Cifar10SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
Cifar10Vgpt2ClassificationInContextAccWithKLAndEntropy,
Cifar100SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
Cifar100Vgpt2ClassificationInContextAccWithKLAndEntropy,
ClevrSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
ClevrVgpt2ClassificationInContextAccWithKLAndEntropy,
DTDSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
DTDVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceAgeSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceAgeVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceGenderSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceGenderVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceRaceSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
FairFaceRaceVgpt2ClassificationInContextAccWithKLAndEntropy,
Food101SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
Food101Vgpt2ClassificationInContextAccWithKLAndEntropy,
HatefulMemesVgpt2ClassificationInContextAccWithKLAndEntropyROCAUC,
IIIT5KSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
IIIT5KVgpt2ClassificationInContextAccWithKLAndEntropy,
ImageNet1kSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
ImageNet1kVgpt2ClassificationInContextAccWithKLAndEntropy,
NLVR2NewSplitsVgpt2ClassificationInContextAccWithKLAndEntropy,
NLVR2SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
OxfordPetsSampleVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
OxfordPetsVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
RenderedSST2SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
RenderedSST2Vgpt2ClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsVgpt2ClassificationInContextAccWithKLAndEntropy,
ScienceQASampleVgpt2ClassificationInContextAccWithKLAndEntropy,
ScienceQAVgpt2ClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kVgpt2ClassificationInContextAccWithKLAndEntropy,
SNLIVEImageOnlySampleVgpt2ClassificationInContextAccWithKLAndEntropy,
SNLIVEImagePremiseSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
StanfordCarsSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
StanfordCarsVgpt2ClassificationInContextAccWithKLAndEntropy,
SUN397SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
SUN397Vgpt2ClassificationInContextAccWithKLAndEntropy,
)
from m4.models.vgpt2.evaluation_classification_vqa_in_context_vgpt2 import (
VQAv2SampleVgpt2ClassificationVQAInContextAcc,
VQAv2Vgpt2ClassificationVQAInContextAcc,
)
from m4.models.vgpt2.evaluation_image_caption_matching_vgpt2 import (
WinogroundVgpt2ImageCaptionMatchingAccWithKLAndEntropy,
)
from m4.models.vgpt2.evaluation_open_ended_vqa_in_context_vgpt2 import (
AdVQASampleVgpt2OpenEndedVQAInContextAcc,
AdVQAVgpt2OpenEndedVQAInContextAcc,
OKVQASampleVgpt2OpenEndedVQAInContextAcc,
OKVQAVgpt2OpenEndedVQAInContextAcc,
TextVQASampleVgpt2OpenEndedVQAInContextAcc,
TextVQAVgpt2OpenEndedVQAInContextAcc,
VQAv2SampleVgpt2OpenEndedVQAInContextAcc,
VQAv2Vgpt2OpenEndedVQAInContextAcc,
)
from m4.models.vgpt2.evaluation_perplexity_in_context_vgpt2 import (
CocoSampleVgpt2PerplexityInContext,
CocoVgpt2PerplexityInContext,
CommonGenVgpt2PerplexityInContext,
IIIT5KSampleVgpt2PerplexityInContext,
IIIT5KVgpt2PerplexityInContext,
MiniGPTCaptionsVgpt2PerplexityInContext,
NoCapsSampleVgpt2PerplexityInContext,
NoCapsVgpt2PerplexityInContext,
TextCapsSampleVgpt2PerplexityInContext,
TextCapsVgpt2PerplexityInContext,
)
from m4.models.vllama3.evaluation_captioning_in_context_vllama3 import (
CocoNewSplitsVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
CocoSampleVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
CocoVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVLlama3ImageCaptioningInContextTextGenMetrics,
Flickr30kNewSplitsVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
IIIT5KSampleVLlama3ImageCaptioningInContextExactMatch,
IIIT5KVLlama3ImageCaptioningInContextExactMatch,
NoCapsNewSplitsVLlama3ImageCaptioningInContextTextGenMetrics,
NoCapsSampleVLlama3ImageCaptioningInContextTextGenMetrics,
NoCapsVLlama3ImageCaptioningInContextTextGenMetrics,
TextCapsNewSplitsVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleVLlama3ImageCaptioningInContextTextGenMetrics,
TextCapsVLlama3ImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsVLlama3ImageCaptioningInContextTextGenMetrics,
)
from m4.models.vllama3.evaluation_classification_in_context_vllama3 import (
AI2DChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
AI2DLetterLabelChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
AI2DNoLetterLabelChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
Caltech101SampleVLlama3ClassificationInContextMeanPerClassAccWithKLAndEntropy,
Caltech101VLlama3ClassificationInContextMeanPerClassAccWithKLAndEntropy,
Cifar10DummyVLlama3ClassificationInContextAccWithKLAndEntropy,
Cifar10SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
Cifar10VLlama3ClassificationInContextAccWithKLAndEntropy,
Cifar100SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
Cifar100VLlama3ClassificationInContextAccWithKLAndEntropy,
ClevrChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
ClevrNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
ClevrSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
ClevrVLlama3ClassificationInContextAccWithKLAndEntropy,
DTDSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
DTDVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceAgeNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceAgeSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceAgeVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceGenderNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceGenderSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceGenderVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceRaceNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceRaceSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
FairFaceRaceVLlama3ClassificationInContextAccWithKLAndEntropy,
Food101SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
Food101VLlama3ClassificationInContextAccWithKLAndEntropy,
HatefulMemesNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropyROCAUC,
HatefulMemesVLlama3ClassificationInContextAccWithKLAndEntropyROCAUC,
IIIT5KSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
IIIT5KVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits1kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits5kSupportVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
ImageNet1kVLlama3ClassificationInContextAccWithKLAndEntropy,
MathVistaMCQChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
MMBenchChatbotValDedupVLlama3ClassificationInContextAccWithKLAndEntropy,
MMBenchChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
MMBenchNewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
MMMUMCQChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
MMMUMCQMultipleImagesChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
MMMUMCQSingleImageChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
MMStarChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
NLVR2NewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
NLVR2SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
OxfordPetsSampleVLlama3ClassificationInContextMeanPerClassAccWithKLAndEntropy,
OxfordPetsVLlama3ClassificationInContextMeanPerClassAccWithKLAndEntropy,
POPEChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
QBenchChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
RavenChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
RenderedSST2NewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
RenderedSST2SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
RenderedSST2VLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQAImgChatbotgNoMCQVLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQAImgChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsOldSetupVLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsVLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQASampleVLlama3ClassificationInContextAccWithKLAndEntropy,
ScienceQAVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDAllVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDImgChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDInstanceAttributesVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDInstanceIdentityVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDInstanceInteractionVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDInstanceLocationVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDInstancesCountingVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDSceneUnderstandingVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDSpatialRelationVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDTextUnderstandingVLlama3ClassificationInContextAccWithKLAndEntropy,
SEEDVisualReasoningVLlama3ClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kVLlama3ClassificationInContextAccWithKLAndEntropy,
SNLIVEImageOnlySampleVLlama3ClassificationInContextAccWithKLAndEntropy,
SNLIVEImagePremiseSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
StanfordCarsSampleVLlama3ClassificationInContextAccWithKLAndEntropy,
StanfordCarsVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddAttVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddObjVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceAttVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceObjVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceRelVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapAttVLlama3ClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapObjVLlama3ClassificationInContextAccWithKLAndEntropy,
SUN397SampleVLlama3ClassificationInContextAccWithKLAndEntropy,
SUN397VLlama3ClassificationInContextAccWithKLAndEntropy,
VisDialNewSplitsVLlama3ClassificationInContextNDCG,
VSRChatbotVLlama3ClassificationInContextAccWithKLAndEntropy,
)
from m4.models.vllama3.evaluation_open_ended_vqa_in_context_vllama3 import (
AdVQASampleVLlama3OpenEndedVQAInContextAcc,
AdVQAVLlama3OpenEndedVQAInContextAcc,
ChartQAChatbotVLlama3OpenEndedVQAInContextAcc,
DocVQAChatbotVLlama3OpenEndedVQAInContextAnls,
DocVQASampleVLlama3OpenEndedVQAInContextAnls,
DocVQAVLlama3OpenEndedVQAInContextAnls,
GQAChatbotVLlama3OpenEndedVQAInContextAcc,
LLaVAWildChatbotVLlama3OpenEndedVQAInContextAcc,
MathVistaOpenEndedChatbotVLlama3OpenEndedVQAInContextAcc,
MathVistaVLlama3OpenEndedVQAInContextAcc,
MMMUOpenEndedChatbotVLlama3OpenEndedVQAInContextAcc,
MMMUOpenEndedSingleImageChatbotVLlama3OpenEndedVQAInContextAcc,
MMMUVLlama3OpenEndedVQAInContextAcc,
MMVETChatbotVLlama3OpenEndedVQAInContextAcc,
OKVQAChatbotVLlama3OpenEndedVQAInContextAcc,
OKVQANewSplitsVLlama3OpenEndedVQAInContextAcc,
OKVQASampleVLlama3OpenEndedVQAInContextAcc,
OKVQAVLlama3OpenEndedVQAInContextAcc,
TextVQAChatbotVLlama3OpenEndedVQAInContextAcc,
TextVQANewSplitsVLlama3OpenEndedVQAInContextAcc,
TextVQASampleVLlama3OpenEndedVQAInContextAcc,
TextVQAVLlama3OpenEndedVQAInContextAcc,
VizWizNewSplitsVLlama3OpenEndedVQAInContextAcc,
VizWizSampleVLlama3OpenEndedVQAInContextAcc,
VizWizVLlama3OpenEndedVQAInContextAcc,
VQAv2ChatbotVLlama3OpenEndedVQAInContextAcc,
VQAv2DummyVLlama3OpenEndedVQAInContextAcc,
VQAv2NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part0NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part1NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part2NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part3NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part4NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2Part5NewSplitsVLlama3OpenEndedVQAInContextAcc,
VQAv2SampleVLlama3OpenEndedVQAInContextAcc,
VQAv2VLlama3OpenEndedVQAInContextAcc,
)
from m4.models.vmistral.evaluation_captioning_in_context_vmistral import (
CocoNewSplitsVMistralImageCaptioningInContextBleuCiderMeteorRouge,
CocoSampleVMistralImageCaptioningInContextBleuCiderMeteorRouge,
CocoVMistralImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVMistralImageCaptioningInContextBleuCiderMeteorRouge,
CommonGenVMistralImageCaptioningInContextTextGenMetrics,
Flickr30kNewSplitsVMistralImageCaptioningInContextBleuCiderMeteorRouge,
IIIT5KSampleVMistralImageCaptioningInContextExactMatch,
IIIT5KVMistralImageCaptioningInContextExactMatch,
NoCapsNewSplitsVMistralImageCaptioningInContextTextGenMetrics,
NoCapsSampleVMistralImageCaptioningInContextTextGenMetrics,
NoCapsVMistralImageCaptioningInContextTextGenMetrics,
TextCapsNewSplitsVMistralImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleVMistralImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsSampleVMistralImageCaptioningInContextTextGenMetrics,
TextCapsVMistralImageCaptioningInContextBleuCiderMeteorRouge,
TextCapsVMistralImageCaptioningInContextTextGenMetrics,
)
from m4.models.vmistral.evaluation_classification_in_context_vmistral import (
Caltech101SampleVMistralClassificationInContextMeanPerClassAccWithKLAndEntropy,
Caltech101VMistralClassificationInContextMeanPerClassAccWithKLAndEntropy,
Cifar10DummyVMistralClassificationInContextAccWithKLAndEntropy,
Cifar10SampleVMistralClassificationInContextAccWithKLAndEntropy,
Cifar10VMistralClassificationInContextAccWithKLAndEntropy,
Cifar100SampleVMistralClassificationInContextAccWithKLAndEntropy,
Cifar100VMistralClassificationInContextAccWithKLAndEntropy,
ClevrChatbotVMistralClassificationInContextAccWithKLAndEntropy,
ClevrNewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
ClevrSampleVMistralClassificationInContextAccWithKLAndEntropy,
ClevrVMistralClassificationInContextAccWithKLAndEntropy,
DTDSampleVMistralClassificationInContextAccWithKLAndEntropy,
DTDVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceAgeNewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceAgeSampleVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceAgeVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceGenderNewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceGenderSampleVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceGenderVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceRaceNewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceRaceSampleVMistralClassificationInContextAccWithKLAndEntropy,
FairFaceRaceVMistralClassificationInContextAccWithKLAndEntropy,
Food101SampleVMistralClassificationInContextAccWithKLAndEntropy,
Food101VMistralClassificationInContextAccWithKLAndEntropy,
HatefulMemesNewSplitsVMistralClassificationInContextAccWithKLAndEntropyROCAUC,
HatefulMemesVMistralClassificationInContextAccWithKLAndEntropyROCAUC,
IIIT5KSampleVMistralClassificationInContextAccWithKLAndEntropy,
IIIT5KVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kNewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart0NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart1NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart2NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart3NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart4NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits1kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kPart5NewSplits5kSupportVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kSampleVMistralClassificationInContextAccWithKLAndEntropy,
ImageNet1kVMistralClassificationInContextAccWithKLAndEntropy,
MathVistaMCQChatbotVMistralClassificationInContextAccWithKLAndEntropy,
MMBenchChatbotValDedupVMistralClassificationInContextAccWithKLAndEntropy,
MMBenchChatbotVMistralClassificationInContextAccWithKLAndEntropy,
MMBenchNewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
MMMUMCQChatbotVMistralClassificationInContextAccWithKLAndEntropy,
NLVR2NewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
NLVR2SampleVMistralClassificationInContextAccWithKLAndEntropy,
OxfordPetsSampleVMistralClassificationInContextMeanPerClassAccWithKLAndEntropy,
OxfordPetsVMistralClassificationInContextMeanPerClassAccWithKLAndEntropy,
POPEChatbotVMistralClassificationInContextAccWithKLAndEntropy,
QBenchChatbotVMistralClassificationInContextAccWithKLAndEntropy,
RavenChatbotVMistralClassificationInContextAccWithKLAndEntropy,
RenderedSST2NewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
RenderedSST2SampleVMistralClassificationInContextAccWithKLAndEntropy,
RenderedSST2VMistralClassificationInContextAccWithKLAndEntropy,
ScienceQAImgChatbotgNoMCQVMistralClassificationInContextAccWithKLAndEntropy,
ScienceQAImgChatbotVMistralClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsOldSetupVMistralClassificationInContextAccWithKLAndEntropy,
ScienceQANewSplitsVMistralClassificationInContextAccWithKLAndEntropy,
ScienceQASampleVMistralClassificationInContextAccWithKLAndEntropy,
ScienceQAVMistralClassificationInContextAccWithKLAndEntropy,
SEEDAllVMistralClassificationInContextAccWithKLAndEntropy,
SEEDImgChatbotVMistralClassificationInContextAccWithKLAndEntropy,
SEEDInstanceAttributesVMistralClassificationInContextAccWithKLAndEntropy,
SEEDInstanceIdentityVMistralClassificationInContextAccWithKLAndEntropy,
SEEDInstanceInteractionVMistralClassificationInContextAccWithKLAndEntropy,
SEEDInstanceLocationVMistralClassificationInContextAccWithKLAndEntropy,
SEEDInstancesCountingVMistralClassificationInContextAccWithKLAndEntropy,
SEEDSceneUnderstandingVMistralClassificationInContextAccWithKLAndEntropy,
SEEDSpatialRelationVMistralClassificationInContextAccWithKLAndEntropy,
SEEDTextUnderstandingVMistralClassificationInContextAccWithKLAndEntropy,
SEEDVisualReasoningVMistralClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kSampleVMistralClassificationInContextAccWithKLAndEntropy,
SimpleImageNet1kVMistralClassificationInContextAccWithKLAndEntropy,
SNLIVEImageOnlySampleVMistralClassificationInContextAccWithKLAndEntropy,
SNLIVEImagePremiseSampleVMistralClassificationInContextAccWithKLAndEntropy,
StanfordCarsSampleVMistralClassificationInContextAccWithKLAndEntropy,
StanfordCarsVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddAttVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeAddObjVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceAttVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceObjVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeReplaceRelVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapAttVMistralClassificationInContextAccWithKLAndEntropy,
SugarCrepeSwapObjVMistralClassificationInContextAccWithKLAndEntropy,
SUN397SampleVMistralClassificationInContextAccWithKLAndEntropy,
SUN397VMistralClassificationInContextAccWithKLAndEntropy,
VisDialNewSplitsVMistralClassificationInContextNDCG,
VSRChatbotVMistralClassificationInContextAccWithKLAndEntropy,
)
from m4.models.vmistral.evaluation_classification_vqa_in_context_vmistral import (
VQAv2SampleVMistralClassificationVQAInContextAcc,
VQAv2VMistralClassificationVQAInContextAcc,
)
from m4.models.vmistral.evaluation_image_caption_matching_vmistral import (
WinogroundVMistralImageCaptionMatchingAccWithKLAndEntropy,
)
from m4.models.vmistral.evaluation_open_ended_vqa_in_context_vmistral import (
AdVQASampleVMistralOpenEndedVQAInContextAcc,
AdVQAVMistralOpenEndedVQAInContextAcc,
ChartQAChatbotVMistralOpenEndedVQAInContextAcc,
DocVQAChatbotVMistralOpenEndedVQAInContextAnls,
DocVQASampleVMistralOpenEndedVQAInContextAnls,
DocVQAVMistralOpenEndedVQAInContextAnls,
GQAChatbotVMistralOpenEndedVQAInContextAcc,
LLaVAWildChatbotVMistralOpenEndedVQAInContextAcc,
MathVistaOpenEndedChatbotVMistralOpenEndedVQAInContextAcc,
MathVistaVMistralOpenEndedVQAInContextAcc,
MMMUOpenEndedChatbotVMistralOpenEndedVQAInContextAcc,
MMMUVMistralOpenEndedVQAInContextAcc,
MMVETChatbotVMistralOpenEndedVQAInContextAcc,
OKVQAChatbotVMistralOpenEndedVQAInContextAcc,
OKVQANewSplitsVMistralOpenEndedVQAInContextAcc,
OKVQASampleVMistralOpenEndedVQAInContextAcc,
OKVQAVMistralOpenEndedVQAInContextAcc,
TextVQAChatbotVMistralOpenEndedVQAInContextAcc,
TextVQANewSplitsVMistralOpenEndedVQAInContextAcc,
TextVQASampleVMistralOpenEndedVQAInContextAcc,
TextVQAVMistralOpenEndedVQAInContextAcc,
VizWizNewSplitsVMistralOpenEndedVQAInContextAcc,
VizWizSampleVMistralOpenEndedVQAInContextAcc,
VizWizVMistralOpenEndedVQAInContextAcc,
VQAv2ChatbotVMistralOpenEndedVQAInContextAcc,
VQAv2DummyVMistralOpenEndedVQAInContextAcc,
VQAv2NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part0NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part1NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part2NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part3NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part4NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2Part5NewSplitsVMistralOpenEndedVQAInContextAcc,
VQAv2SampleVMistralOpenEndedVQAInContextAcc,
VQAv2VMistralOpenEndedVQAInContextAcc,
)
from m4.models.vmistral.evaluation_perplexity_in_context_vmistral import (
Cm4SampleVMistralPerplexityInContextMaxSeLen512,
Cm4SampleVMistralPerplexityInContextMaxSeLen1024,
Cm4VMistralPerplexityInContextMaxSeLen512,
Cm4VMistralPerplexityInContextMaxSeLen1024,
CocoSampleVMistralPerplexityInContext,
CocoVMistralPerplexityInContext,
CommonGenVMistralPerplexityInContext,
EnWikiSampleVMistralPerplexityInContextMaxSeLen512,
EnWikiSampleVMistralPerplexityInContextMaxSeLen1024,
EnWikiVMistralPerplexityInContextMaxSeLen512,
EnWikiVMistralPerplexityInContextMaxSeLen1024,
IIIT5KSampleVMistralPerplexityInContext,
IIIT5KVMistralPerplexityInContext,
MiniGPTCaptionsVMistralPerplexityInContext,
NoCapsSampleVMistralPerplexityInContext,
NoCapsVMistralPerplexityInContext,
TextCapsSampleVMistralPerplexityInContext,
TextCapsVMistralPerplexityInContext,
)
# Needed for the tests
# Registry of VGPT2 evaluation task classes, grouped by the predictor that
# runs them. Only `Predictor.in_contexter` is populated here.
# Each task class appears exactly once: a repeated entry would be visited
# twice by anything iterating this list.
VGPT2_TASKS = {
    Predictor.in_contexter: [
        Caltech101Vgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
        Cifar10Vgpt2ClassificationInContextAccWithKLAndEntropy,
        Cifar100Vgpt2ClassificationInContextAccWithKLAndEntropy,
        ClevrVgpt2ClassificationInContextAccWithKLAndEntropy,
        DTDVgpt2ClassificationInContextAccWithKLAndEntropy,
        Food101Vgpt2ClassificationInContextAccWithKLAndEntropy,
        HatefulMemesVgpt2ClassificationInContextAccWithKLAndEntropyROCAUC,
        ImageNet1kVgpt2ClassificationInContextAccWithKLAndEntropy,
        OxfordPetsVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
        RenderedSST2Vgpt2ClassificationInContextAccWithKLAndEntropy,
        StanfordCarsVgpt2ClassificationInContextAccWithKLAndEntropy,
        SUN397Vgpt2ClassificationInContextAccWithKLAndEntropy,
        VQAv2Vgpt2OpenEndedVQAInContextAcc,
        OKVQAVgpt2OpenEndedVQAInContextAcc,
        TextVQAVgpt2OpenEndedVQAInContextAcc,
        AdVQAVgpt2OpenEndedVQAInContextAcc,
        ScienceQAVgpt2ClassificationInContextAccWithKLAndEntropy,
        ScienceQANewSplitsVgpt2ClassificationInContextAccWithKLAndEntropy,
        VQAv2Vgpt2ClassificationVQAInContextAcc,
        TextCapsVgpt2ImageCaptioningInContextTextGenMetrics,
        TextCapsVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
        CommonGenVgpt2ImageCaptioningInContextTextGenMetrics,
        CommonGenVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
        FairFaceAgeVgpt2ClassificationInContextAccWithKLAndEntropy,
        FairFaceGenderVgpt2ClassificationInContextAccWithKLAndEntropy,
        FairFaceRaceVgpt2ClassificationInContextAccWithKLAndEntropy,
        NoCapsVgpt2ImageCaptioningInContextTextGenMetrics,
        CocoVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
        IIIT5KVgpt2ClassificationInContextAccWithKLAndEntropy,
        IIIT5KVgpt2ImageCaptioningInContextExactMatch,
        SimpleImageNet1kVgpt2ClassificationInContextAccWithKLAndEntropy,
    ],
}
# Registry of VGPT2 evaluation task classes used for the "sample" runs,
# grouped by the predictor that runs them. Only `Predictor.in_contexter` is
# populated here.
# Each task class appears exactly once: a repeated entry would be visited
# twice by anything iterating this list.
VGPT2_SAMPLE_TASKS = {
    Predictor.in_contexter: [
        Caltech101SampleVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
        Cifar10SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        Cifar100SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        ClevrSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        DTDSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        Food101SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        ImageNet1kSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        OxfordPetsSampleVgpt2ClassificationInContextMeanPerClassAccWithKLAndEntropy,
        RenderedSST2SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        StanfordCarsSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        SUN397SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        VQAv2SampleVgpt2OpenEndedVQAInContextAcc,
        OKVQASampleVgpt2OpenEndedVQAInContextAcc,
        TextVQASampleVgpt2OpenEndedVQAInContextAcc,
        AdVQASampleVgpt2OpenEndedVQAInContextAcc,
        ScienceQASampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        VQAv2SampleVgpt2ClassificationVQAInContextAcc,
        FairFaceAgeSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        FairFaceGenderSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        FairFaceRaceSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        TextCapsSampleVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
        SNLIVEImageOnlySampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        SNLIVEImagePremiseSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        NLVR2SampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        # NOTE(review): the only entry here without a "Sample" infix -- confirm
        # it is meant to be in the sample registry.
        NLVR2NewSplitsVgpt2ClassificationInContextAccWithKLAndEntropy,
        TextCapsSampleVgpt2ImageCaptioningInContextTextGenMetrics,
        NoCapsSampleVgpt2ImageCaptioningInContextTextGenMetrics,
        CocoSampleVgpt2ImageCaptioningInContextBleuCiderMeteorRouge,
        IIIT5KSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
        IIIT5KSampleVgpt2ImageCaptioningInContextExactMatch,
        SimpleImageNet1kSampleVgpt2ClassificationInContextAccWithKLAndEntropy,
    ],
}