Spaces:
Running
Running
from typing import List | |
from data.dataloader import build_dataloader | |
# from methods.elasticdnn.api.online_model import ElasticDNN_OnlineModel | |
from methods.elasticdnn.api.online_model_v2 import ElasticDNN_OnlineModel | |
import torch | |
import sys | |
from torch import nn | |
from methods.elasticdnn.api.model import ElasticDNN_OfflineSegFMModel, ElasticDNN_OfflineSegMDModel | |
from methods.elasticdnn.api.algs.md_pretraining_wo_fbs import ElasticDNN_MDPretrainingWoFBSAlg | |
from methods.elasticdnn.model.base import ElasticDNNUtil | |
from methods.elasticdnn.pipeline.offline.fm_to_md.base import FM_to_MD_Util | |
from methods.elasticdnn.pipeline.offline.fm_to_md.vit import FM_to_MD_ViT_Util | |
from methods.elasticdnn.pipeline.offline.fm_lora.base import FMLoRA_Util | |
from methods.elasticdnn.pipeline.offline.fm_lora.vit import FMLoRA_ViT_Util | |
from methods.elasticdnn.model.vit import ElasticViTUtil | |
from utils.common.file import ensure_dir | |
from utils.dl.common.model import LayerActivation, get_module, get_parameter | |
from utils.common.exp import save_models_dict_for_init, get_res_save_dir | |
from data import build_scenario | |
from utils.dl.common.loss import CrossEntropyLossSoft | |
import torch.nn.functional as F | |
from utils.dl.common.env import create_tbwriter | |
import os | |
from utils.common.log import logger | |
from utils.common.data_record import write_json | |
# from methods.shot.shot import OnlineShotModel | |
from methods.gem.gem_el_bert import GEMAlg | |
import tqdm | |
from methods.feat_align.mmd import mmd_rbf | |
from experiments.utils.elasticfm_da import init_online_model, elasticfm_da | |
device = 'cuda' | |
app_name = 'secls' | |
sd_sparsity = 0.8 | |
settings = { | |
'involve_fm': True | |
} | |
scenario = build_scenario( | |
source_datasets_name=['HL5Domains-ApexAD2600Progressive', 'HL5Domains-CanonG3', 'HL5Domains-CreativeLabsNomadJukeboxZenXtra40GB', | |
'HL5Domains-NikonCoolpix4300', 'HL5Domains-Nokia6610'], | |
target_datasets_order=['Liu3Domains-Computer', 'Liu3Domains-Router', 'Liu3Domains-Speaker', | |
'Ding9Domains-DiaperChamp', 'Ding9Domains-Norton', 'Ding9Domains-LinksysRouter', | |
'Ding9Domains-MicroMP3', 'Ding9Domains-Nokia6600', 'Ding9Domains-CanonPowerShotSD500', | |
'Ding9Domains-ipod', 'Ding9Domains-HitachiRouter', 'Ding9Domains-CanonS100', | |
'SemEval-Laptop', 'SemEval-Rest'] * 2 + ['Liu3Domains-Computer', 'Liu3Domains-Router'], | |
da_mode='close_set', | |
data_dirs={ | |
**{k: f'/data/zql/datasets/nlp_asc_19_domains/dat/absa/Bing5Domains/asc/{k.split("-")[1]}' | |
for k in ['HL5Domains-ApexAD2600Progressive', 'HL5Domains-CanonG3', 'HL5Domains-CreativeLabsNomadJukeboxZenXtra40GB', | |
'HL5Domains-NikonCoolpix4300', 'HL5Domains-Nokia6610']}, | |
**{k: f'/data/zql/datasets/nlp_asc_19_domains/dat/absa/Bing3Domains/asc/{k.split("-")[1]}' | |
for k in ['Liu3Domains-Computer', 'Liu3Domains-Router', 'Liu3Domains-Speaker']}, | |
**{k: f'/data/zql/datasets/nlp_asc_19_domains/dat/absa/Bing9Domains/asc/{k.split("-")[1]}' | |
for k in ['Ding9Domains-DiaperChamp', 'Ding9Domains-Norton', 'Ding9Domains-LinksysRouter', | |
'Ding9Domains-MicroMP3', 'Ding9Domains-Nokia6600', 'Ding9Domains-CanonPowerShotSD500', | |
'Ding9Domains-ipod', 'Ding9Domains-HitachiRouter', 'Ding9Domains-CanonS100']}, | |
**{k: f'/data/zql/datasets/nlp_asc_19_domains/dat/absa/XuSemEval/asc/14/{k.split("-")[1].lower()}' | |
for k in ['SemEval-Laptop', 'SemEval-Rest']}, | |
}, | |
) | |
from experiments.elasticdnn.bert_base.online.se_cls_cl.model import ElasticDNN_SeClsOnlineModel | |
elasticfm_model = ElasticDNN_SeClsOnlineModel('secls', init_online_model( | |
'experiments/elasticdnn/bert_base/offline/fm_to_md/se_cls/results/secls_md_w_fbs_index.py/20230704/999994-085209-logic_verify/models/fm_best.pt', | |
'experiments/elasticdnn/bert_base/offline/fm_to_md/se_cls/results/secls_md_w_fbs_index.py/20230704/999994-085209-logic_verify/models/md_best.pt', | |
'cls', __file__ | |
), device, { | |
'md_to_fm_alpha': 0.2, | |
'fm_to_md_alpha': 0.2 | |
}) | |
da_alg = GEMAlg | |
from experiments.elasticdnn.bert_base.online.se_cls_cl.model import SeClsOnlineGEMModel | |
da_model = SeClsOnlineGEMModel | |
da_alg_hyp = { | |
'train_batch_size': 16, | |
'val_batch_size': 64, | |
'num_workers': 8, | |
'optimizer': 'AdamW', | |
'optimizer_args': {'lr': 1e-4, 'betas': [0.9, 0.999], 'weight_decay': 0.01}, | |
'scheduler': '', | |
'scheduler_args': {}, | |
'num_iters': 100, | |
'val_freq': 20, | |
'n_memories': 16, | |
'n_inputs': 3 * 224 * 224, | |
'margin': 0.5, | |
'num_my_iters': 0, | |
'sd_sparsity': 0.7 | |
} | |
elasticfm_da( | |
[app_name], | |
[scenario], | |
[elasticfm_model], | |
[da_alg], | |
[da_alg_hyp], | |
[da_model], | |
device, | |
settings, | |
__file__, | |
sys.argv[1] | |
) | |