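# NOTE: the text "Spaces: Running Running" was page-header residue captured together
# with this script; it is not part of the program and is kept only as this comment.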
from typing import List | |
from data.dataloader import build_dataloader | |
# from methods.elasticdnn.api.online_model import ElasticDNN_OnlineModel | |
from methods.elasticdnn.api.online_model_v2 import ElasticDNN_OnlineModel | |
import torch | |
import sys | |
from torch import nn | |
from methods.elasticdnn.api.model import ElasticDNN_OfflineSegFMModel, ElasticDNN_OfflineSegMDModel | |
from methods.elasticdnn.api.algs.md_pretraining_wo_fbs import ElasticDNN_MDPretrainingWoFBSAlg | |
from methods.elasticdnn.model.base import ElasticDNNUtil | |
from methods.elasticdnn.pipeline.offline.fm_to_md.base import FM_to_MD_Util | |
from methods.elasticdnn.pipeline.offline.fm_to_md.vit import FM_to_MD_ViT_Util | |
from methods.elasticdnn.pipeline.offline.fm_lora.base import FMLoRA_Util | |
from methods.elasticdnn.pipeline.offline.fm_lora.vit import FMLoRA_ViT_Util | |
from methods.elasticdnn.model.vit import ElasticViTUtil | |
from utils.common.file import ensure_dir | |
from utils.dl.common.model import LayerActivation, get_module, get_parameter | |
from utils.common.exp import save_models_dict_for_init, get_res_save_dir | |
from data import build_scenario | |
from utils.dl.common.loss import CrossEntropyLossSoft | |
import torch.nn.functional as F | |
from utils.dl.common.env import create_tbwriter | |
import os | |
from utils.common.log import logger | |
from utils.common.data_record import write_json | |
# from methods.shot.shot import OnlineShotModel | |
from methods.feat_align.main import OnlineFeatAlignModel, FeatAlignAlg | |
import tqdm | |
from methods.feat_align.mmd import mmd_rbf | |
from experiments.utils.elasticfm_da import init_online_model, elasticfm_da | |
# ---------------------------------------------------------------------------
# Run-wide constants for this experiment script.
# ---------------------------------------------------------------------------

# Device string handed to the online model constructor and to elasticfm_da.
device = 'cuda'

# Application name; passed to elasticfm_da as a one-element list.
app_name = 'pos'

# NOTE(review): this value is not referenced anywhere else in the visible script;
# the hyper-parameter dict da_alg_hyp uses the literal 0.7 for its own
# 'sd_sparsity' entry. Confirm which of the two values is intended.
sd_sparsity = 0.8

# Extra settings forwarded unchanged to elasticfm_da.
settings = {
    'involve_fm': True,
}
# ---------------------------------------------------------------------------
# Scenario: source datasets, the order in which target datasets are visited,
# and the on-disk directory of every dataset.
#
# Each dataset family is listed exactly once; the ordering arguments and the
# data_dirs keys are both derived from these lists so they cannot drift apart.
# ---------------------------------------------------------------------------

# Suffix carried by every dataset name passed to build_scenario.
_TOKEN_CLS_SUFFIX = '-TokenCls'
# Directory under which each corpus family keeps its per-domain folders.
_ABSA_ROOT = '/data/zql/datasets/nlp_asc_19_domains/dat/absa'


def _token_cls_names(domains):
    """Return the given names with the '-TokenCls' suffix appended, order kept."""
    return [domain + _TOKEN_CLS_SUFFIX for domain in domains]


def _domain_dirs(dataset_names, family_dir, lowercase=False):
    """Map each dataset name to '<_ABSA_ROOT>/<family_dir>/<domain>'.

    The domain is the second '-'-separated field of the dataset name
    (e.g. 'CanonG3' for 'HL5Domains-CanonG3-TokenCls'). With lowercase=True
    the domain is lower-cased before it is placed in the path.
    """
    dirs = {}
    for dataset_name in dataset_names:
        domain = dataset_name.split('-')[1]
        if lowercase:
            domain = domain.lower()
        dirs[dataset_name] = f'{_ABSA_ROOT}/{family_dir}/{domain}'
    return dirs


_hl5_datasets = _token_cls_names([
    'HL5Domains-ApexAD2600Progressive',
    'HL5Domains-CanonG3',
    'HL5Domains-CreativeLabsNomadJukeboxZenXtra40GB',
    'HL5Domains-NikonCoolpix4300',
    'HL5Domains-Nokia6610',
])
_liu3_datasets = _token_cls_names([
    'Liu3Domains-Computer',
    'Liu3Domains-Router',
    'Liu3Domains-Speaker',
])
_ding9_datasets = _token_cls_names([
    'Ding9Domains-DiaperChamp',
    'Ding9Domains-Norton',
    'Ding9Domains-LinksysRouter',
    'Ding9Domains-MicroMP3',
    'Ding9Domains-Nokia6600',
    'Ding9Domains-CanonPowerShotSD500',
    'Ding9Domains-ipod',
    'Ding9Domains-HitachiRouter',
    'Ding9Domains-CanonS100',
])
_semeval_datasets = _token_cls_names([
    'SemEval-Laptop',
    'SemEval-Rest',
])

# One full pass over the 14 target datasets (Liu3, then Ding9, then SemEval).
_target_pass = _liu3_datasets + _ding9_datasets + _semeval_datasets

scenario = build_scenario(
    source_datasets_name=_hl5_datasets,
    # Two full passes, followed by the first two Liu3 datasets once more
    # (30 entries in total).
    target_datasets_order=_target_pass * 2 + _liu3_datasets[:2],
    da_mode='close_set',
    data_dirs={
        # The HL5 / Liu3 / Ding9 families are stored under the
        # Bing5Domains / Bing3Domains / Bing9Domains directories respectively.
        **_domain_dirs(_hl5_datasets, 'Bing5Domains/asc'),
        **_domain_dirs(_liu3_datasets, 'Bing3Domains/asc'),
        **_domain_dirs(_ding9_datasets, 'Bing9Domains/asc'),
        # SemEval directories use the lower-cased domain name.
        **_domain_dirs(_semeval_datasets, 'XuSemEval/asc/14', lowercase=True),
    },
)
from experiments.elasticdnn.bert_base.online.pos.model import ElasticDNN_POSOnlineModel

# Checkpoint files written by an earlier offline FM-to-MD run (paths are relative,
# so the script must be started from the directory they are relative to).
_fm_checkpoint_path = 'experiments/elasticdnn/bert_base/offline/fm_to_md/pos/results/pos_md_w_fbs_index.py/20230704/999998-085253-trial/models/fm_best.pt'
_md_checkpoint_path = 'experiments/elasticdnn/bert_base/offline/fm_to_md/pos/results/pos_md_w_fbs_index.py/20230704/999998-085253-trial/models/md_best.pt'

# NOTE(review): the exact structure returned by init_online_model is defined in
# experiments.utils.elasticfm_da and is not visible here; it is passed straight
# through to the online model constructor.
_initial_models = init_online_model(
    _fm_checkpoint_path,
    _md_checkpoint_path,
    'pos',
    __file__,
)

# Online ElasticDNN model for the 'pos' task, built on the run-wide device.
elasticfm_model = ElasticDNN_POSOnlineModel(
    'pos',
    _initial_models,
    device,
    {
        'md_to_fm_alpha': 0.1,
        'fm_to_md_alpha': 0.1,
    },
)
from experiments.elasticdnn.bert_base.online.pos.model import POSOnlineFeatAlignModel

# Domain-adaptation algorithm and the online model class used with it.
# Both are bound as classes (not instances) and handed to elasticfm_da as such.
da_alg = FeatAlignAlg
da_model = POSOnlineFeatAlignModel
# Hyper-parameters for the domain-adaptation algorithm; the dict is passed to
# elasticfm_da as a one-element list alongside da_alg.
da_alg_hyp = {
    'train_batch_size': 16,
    'val_batch_size': 64,
    'num_workers': 8,
    'optimizer': 'SGD',
    'optimizer_args': {'lr': 1e-4, 'momentum': 0.9},
    # Empty scheduler name with no arguments.
    # NOTE(review): presumably this means "no LR scheduler" - confirm against the
    # algorithm implementation.
    'scheduler': '',
    'scheduler_args': {},
    'num_iters': 100,
    'val_freq': 20,
    'feat_align_loss_weight': 1.0,
    # NOTE(review): differs from the module-level sd_sparsity constant (0.8),
    # which is not used by this dict. Confirm which value is intended.
    'sd_sparsity': 0.7,
}
# The script requires exactly one extra command-line argument, which is forwarded
# untouched as the last positional argument of elasticfm_da. Exit with a usage
# message instead of a bare IndexError when it is missing.
# NOTE(review): what this argument means is decided by elasticfm_da, which is not
# visible here - confirm and rename the placeholder in the usage text.
if len(sys.argv) < 2:
    raise SystemExit(f'usage: python {sys.argv[0]} <run-argument>')

# Launch the online domain-adaptation run. Each per-application argument is a
# one-element list because this script configures a single application.
elasticfm_da(
    [app_name],
    [scenario],
    [elasticfm_model],
    [da_alg],
    [da_alg_hyp],
    [da_model],
    device,
    settings,
    __file__,
    sys.argv[1],
)