from typing import Sequence, Union

import torch.nn as nn

from allenact.base_abstractions.preprocessor import Preprocessor
from allenact.utils.experiment_utils import Builder, TrainingPipeline
from allenact_plugins.clip_plugin.clip_preprocessors import (
    ClipViTPreprocessor,
    NaivePreprocessor
)
from projects.plugins.ithor_plugin.ithor_sensors import (
    GoalObjectTypeThorSensor,
    RGBSensorThor,
)
from projects.object_navigation.baseline_configs.clip.zeroshot_mixins import (
    CLIPViTGRUActorCriticMixin
)
from projects.object_navigation.baseline_configs.ithor.objectnav_ithor_base import (
    ObjectNaviThorMultiMDPsBaseConfig
)
from projects.object_navigation.baseline_configs.navigation_base import ObjectNavPPOMixin


class ObjectNaviThorClipViTRGBPPOExperimentConfig(ObjectNaviThorMultiMDPsBaseConfig):
    """A CLIP ViT object-navigation experiment configuration for iTHOR with
    RGB input.

    The configuration wires an RGB sensor (normalized with the CLIP ViT
    preprocessor statistics) and a goal-object-type sensor into a
    ``CLIPViTGRUActorCriticMixin``, passing along a set of prompt
    checkpoints, a prompt-combination mode and an optional source model.
    """

    CLIP_MODEL_TYPE = "ViT-B/32"
    # Disabled alternative noise settings, kept for reference:
    # NOISE_STD = 0.02
    # SEMANTIC_NOISE = (0.0, True, "../logs/PROMPTS/10promptcls/checkpoints/text_features_best.pth", 0.996)
    NOISE_STD = 0.0

    SENSORS = [
        RGBSensorThor(
            height=ObjectNaviThorMultiMDPsBaseConfig.SCREEN_SIZE,
            width=ObjectNaviThorMultiMDPsBaseConfig.SCREEN_SIZE,
            use_resnet_normalization=True,
            # Normalize with the CLIP statistics exposed by the ViT preprocessor.
            mean=ClipViTPreprocessor.CLIP_RGB_MEANS,
            stdev=ClipViTPreprocessor.CLIP_RGB_STDS,
            uuid="rgb_lowres",
        ),
        GoalObjectTypeThorSensor(
            object_types=ObjectNaviThorMultiMDPsBaseConfig.TARGET_TYPES,
        ),
    ]

    # Prompt checkpoint paths, relative to the working directory, handed to
    # the model mixin as ``prompt``.
    PROMPT = (
        "../logs/PROMPTS/BRIGHTNESS/checkpoints/contrastive__latest.pth",
        "../logs/PROMPTS/CONTRAST/checkpoints/contrastive__latest.pth",
        "../logs/PROMPTS/SATURATION/checkpoints/contrastive__latest.pth",
        "../logs/PROMPTS/HUE/checkpoints/contrastive__latest.pth",

        "../logs/PROMPTS/FOV_39-59/checkpoints/comparative_action_byol_latest.pth",
        "../logs/PROMPTS/FOV_69-89/checkpoints/comparative_action_byol_latest.pth",
        "../logs/PROMPTS/FOV_99-139/checkpoints/comparative_action_byol_latest.pth",

        "../logs/PROMPTS/LOOK/checkpoints/comparative_action_byol_latest.pth",
        "../logs/PROMPTS/ROTATE/checkpoints/comparative_action_byol_latest.pth",
        "../logs/PROMPTS/STEPSIZE/checkpoints/comparative_action_byol_latest.pth",
    )
    # Available prompt-combination modes; only the first entry is passed to
    # the model mixin in ``__init__``.
    MULTI_P_MODE = [
        ("ATTEMPT", "WEIGHTED", "AVG"),
        ("SESoM", "WEIGHTED", "AVG"),
    ]
    META_MODE = True
    # Pair of source-model checkpoints passed as ``source_model``; the first
    # slot is currently ``None`` (its previous value is kept commented out).
    SOURCE_MODEL = (
        # "/home/meohee/MMRL/allenact/storage/MAIN-EXP/ConPE/checkpoints/PromptATTNCLIPViTGRU-DDPPO-MDPs/2023-04-26_14-40-02/exp_PromptATTNCLIPViTGRU-DDPPO-MDPs__stage_00__steps_000002000000.pt",
        None,
        "/home/meohee/MMRL/allenact/storage/MAIN-EXP/EMBCLIP/checkpoints/ViTGRU-DDPPO-MDPs/2023-04-26_02-28-35/exp_ViTGRU-DDPPO-MDPs__stage_00__steps_000002500000.pt",
    )

    def __init__(self, **kwargs):
        """Set the per-domain factors and build the preprocessing/model mixin.

        Args:
            **kwargs: Forwarded unchanged to the base configuration's
                ``__init__``.
        """
        super().__init__(**kwargs)

        #### Domain defined by domain factors ####
        # Each list has one entry per domain; presumably index i across all
        # lists describes domain i -- TODO confirm against the base config.
        self.STEP_SIZE = [0.1, 0.15, 0.25, 0.35]
        self.ROTATION_DEGREES = [90.0, 60.0, 30.0, 10.0]
        self.VISIBILITY_DISTANCE = [1.0, 1.0, 1.0, 1.0]
        # NOTE(review): the 4-tuples look like (brightness, contrast,
        # saturation, hue) given the prompt names above -- confirm. ``None``
        # presumably means "no lighting change".
        self.LIGHTING_VALUE = [
            (0.2, 0.9, 1.5, -0.4),
            (1.1, 1.0, 1.5, -0.1),
            None,
            (2.0, 1.5, 2, 0.4),
        ]
        self.HORIZONTAL_FIELD_OF_VIEW = [59, 69, 79, 99]
        self.LOOK_DEGREES = [40, 10, 30, 20]
        # Disabled alternative domain sets, kept for reference:
        # self.STEP_SIZE =                [0.25, 0.25, 0.25, 0.25, 0.25]
        # self.ROTATION_DEGREES =         [30.0, 30.0, 30.0, 30.0, 30.0]
        # self.VISIBILITY_DISTANCE =      [1.0 , 1.0, 1.0, 1.0, 1.0]
        # self.LIGHTING_VALUE =           [(0.2, None, None, None), (None, 3.4, None, None), (None, None, 0.5, None), (None, None, None, 0.4), None]
        # self.HORIZONTAL_FIELD_OF_VIEW = [79, 79, 79, 79, 139]
        # self.LOOK_DEGREES =             [30, 30, 30, 30, 30]
        # self.STEP_SIZE =             [0.25, 0.3, 0.05, 0.35]
        # self.ROTATION_DEGREES =      [30, 10, 90, 5]
        # self.VISIBILITY_DISTANCE =   [1.0, 1.0 , 1.0, 1.0]
        # self.LIGHTING_VALUE =        [None, (1.7, 1.4, 1.5, 0.3), (0.4, 1.2, 1.7, 0.0), (0.6, 1.3, 1.8, 0.2)]
        # self.HORIZONTAL_FIELD_OF_VIEW = [79, 89, 59, 129]
        # self.LOOK_DEGREES = [30, 15, 5, 10]
        # candidate 1
        # self.STEP_SIZE =             [0.25]
        # self.ROTATION_DEGREES =      [30.0]
        # self.VISIBILITY_DISTANCE =   [1.0]
        # self.LIGHTING_VALUE =        [None]
        # self.HORIZONTAL_FIELD_OF_VIEW = [79]
        # self.LOOK_DEGREES = [30.0]
        ##########################################
        # Not read in this file; presumably consumed by the base config.
        self.DATA_GEN = False

        self.preprocessing_and_model = CLIPViTGRUActorCriticMixin(
            sensors=self.SENSORS,
            clip_model_type=self.CLIP_MODEL_TYPE,
            screen_size=self.SCREEN_SIZE,
            goal_sensor_type=GoalObjectTypeThorSensor,
            pool=False,
            pooling_type='',
            target_types=self.TARGET_TYPES,
            prompt=self.PROMPT,
            # Only the first configured combination mode is used.
            multi_p_mode=self.MULTI_P_MODE[0],
            meta_mode=self.META_MODE,
            noise_std=self.NOISE_STD,
            source_model=self.SOURCE_MODEL,
        )

    def training_pipeline(self, **kwargs) -> TrainingPipeline:
        """Return the PPO training pipeline built by ``ObjectNavPPOMixin``.

        No auxiliary losses and a single belief are requested. ``kwargs`` is
        accepted for interface compatibility but is not forwarded.
        """
        return ObjectNavPPOMixin.training_pipeline(
            auxiliary_uuids=[],
            multiple_beliefs=False,
            advance_scene_rollout_period=self.ADVANCE_SCENE_ROLLOUT_PERIOD,
        )

    def preprocessors(self) -> Sequence[Union[Preprocessor, Builder[Preprocessor]]]:
        """Return the preprocessors supplied by the model mixin."""
        return self.preprocessing_and_model.preprocessors()

    def create_model(self, **kwargs) -> nn.Module:
        """Create the actor-critic model via the model mixin.

        Args:
            **kwargs: Forwarded to the mixin's ``create_model`` together with
                the number of actions in ``self.ACTION_SPACE``.
        """
        return self.preprocessing_and_model.create_model(
            num_actions=self.ACTION_SPACE.n, **kwargs
        )

    @classmethod
    def tag(cls) -> str:
        """Return the experiment tag string.

        Declared as a classmethod (the signature already used ``cls``) so it
        can be called on the class as well as on an instance.
        """
        return "PromptATTNCLIPViTGRU-DDPPO-MDPs"
# file name: objectnav_ithor_rgb_clip_vit32_pcomps_gru_ddppo_mdps