diff --git a/examples/transfer/README.md b/examples/transfer/README.md
new file mode 100644
index 0000000..e69de29
diff --git a/examples/transfer/transfer_bo.py b/examples/transfer/transfer_bo.py
new file mode 100644
index 0000000..ae02cdf
--- /dev/null
+++ b/examples/transfer/transfer_bo.py
@@ -0,0 +1,63 @@
+import numpy as np
+# import matplotlib.pyplot as plt
+from ConfigSpace import ConfigurationSpace
+from xbbo.configspace.space import DenseConfiguration
+from ConfigSpace.hyperparameters import UniformFloatHyperparameter
+from ConfigSpace.conditions import LessThanCondition
+
+# from xbbo.search_algorithm.transfer_tst_optimizer import TransferBO
+# from xbbo.search_algorithm.transfer_taf_optimizer import TransferBO
+# from xbbo.search_algorithm.transfer_rgpe_mean_optimizer import TransferBO
+# from xbbo.search_algorithm.transfer_taf_rgpe_optimizer import TransferBO
+# from xbbo.search_algorithm.transfer_RMoGP_optimizer import TransferBO
+from xbbo.search_algorithm.transfer_bo_optimizer import TransferBO
+
+from xbbo.problem.transfer_problem import BenchName, TransferBenchmark
+from xbbo.core.constants import MAXINT
+
+if __name__ == "__main__":
+    MAX_CALL = 30  # number of suggest / evaluate / observe iterations
+    rng = np.random.RandomState(42)
+
+    transfer_bench = TransferBenchmark(bench_name=BenchName.TST,
+                                       target_task_name="A9A",
+                                       data_path_root='./data',
+                                       data_base_name='svm',
+                                       rng=rng.randint(MAXINT))
+    # transfer_bench = TransferBenchmark(bench_name=BenchName.Table_deepar,
+    #                                    target_task_name="wiki-rolling",
+    #                                    data_path_root='./data/offline_evaluations',
+    #                                    data_base_name='DeepAR.csv.zip',
+    #                                    rng=rng.randint(MAXINT))
+    cs = transfer_bench.get_configuration_space()
+    old_D_X, old_D_y = transfer_bench.get_old_data()  # evaluations of the non-target tasks
+
+    # Transfer variants: keep exactly one `hpopt = ...` assignment active
+    # hpopt = TransferBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='tst', acq_func='ei', weight_srategy='kernel', acq_opt='rs') # TST-R
+    hpopt = TransferBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='taf', weight_srategy='kernel', acq_opt='rs') # TAF
+    # hpopt = TransferBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='tst', acq_func='ei', weight_srategy='rw', acq_opt='rs') # RGPE(mean)
+    # hpopt = TransferBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='taf', weight_srategy='rw', acq_opt='rs') # TAF(rw)
+    # hpopt = TransferBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='mogp', weight_srategy='rw', acq_opt='rs') # RMoGP
+    # Variant without transfer:
+    # hpopt = TransferBO(space=cs,
+    #                    seed=rng.randint(MAXINT),
+    #                    suggest_limit=MAX_CALL,
+    #                    initial_design='sobol',
+    #                    surrogate='gp',
+    #                    acq_func='ei',
+    #                    weight_srategy='kernel',
+    #                    acq_opt='rs')  # vanilla BO
+    hpopt.get_transfer_knowledge(old_D_X, old_D_y)  # trains one base model per old task
+    # ---- Begin BO-loop ----
+    for i in range(MAX_CALL):
+        # suggest
+        trial_list = hpopt.suggest()
+        # evaluate
+        obs = transfer_bench(trial_list[0].config_dict)
+        # observe
+        trial_list[0].add_observe_value(obs)
+        hpopt.observe(trial_list=trial_list)
+
+        print(obs)
+
+    print('find best (value, config):{}'.format(hpopt.trials.get_best()))
diff --git a/examples/transfer_bo.py b/examples/transfer_bo.py
deleted file mode 100644
index d6531ca..0000000
--- a/examples/transfer_bo.py
+++ /dev/null
@@ -1,101 +0,0 @@
-import numpy as np
-# import matplotlib.pyplot as plt
-from ConfigSpace import ConfigurationSpace
-from xbbo.configspace.space import DenseConfiguration
-from ConfigSpace.hyperparameters import UniformFloatHyperparameter
-from ConfigSpace.conditions import LessThanCondition
-
-# from xbbo.search_algorithm.transfer_tst_optimizer import SMBO
-# from xbbo.search_algorithm.transfer_taf_optimizer import SMBO
-# from xbbo.search_algorithm.transfer_rgpe_mean_optimizer import SMBO
-# from xbbo.search_algorithm.transfer_taf_rgpe_optimizer import SMBO
-# from xbbo.search_algorithm.transfer_RMoGP_optimizer import SMBO
-from xbbo.search_algorithm.transfer_bo_optimizer import SMBO
-
-from xbbo.problem.offline_hp import Model
-from xbbo.core.constants import MAXINT
-from xbbo.surrogate.transfer.base_surrogate import BaseModel
-
-def rosenbrock_2d(x):
-    """ The 2 dimensional Rosenbrock function as a toy model
-    The Rosenbrock function is well know in the optimization community and
-    often serves as a toy problem. It can be defined for arbitrary
-    dimensions. The minimium is always at x_i = 1 with a function value of
-    zero. All input parameters are continuous. The search domain for
-    all x's is the interval [-5, 10].
-    """
-
-    x1 = x["x0"]
-    # x2 = x["x1"]
-    x2 = x.get('x1', x1)
-
-    val = 100. * (x2 - x1 ** 2.) ** 2. + (1 - x1) ** 2.
-    return val
-
-def branin(config):
-    x1, x2 = config['x1'], config['x2']
-    y = (x2 - 5.1 / (4 * np.pi ** 2) * x1 ** 2 + 5 / np.pi * x1 - 6) ** 2 \
-        + 10 * (1 - 1 / (8 * np.pi)) * np.cos(x1) + 10
-    return y
-
-def build_space(rng):
-    cs = ConfigurationSpace(seed=rng.randint(MAXINT))
-    x0 = UniformFloatHyperparameter("x0", -5, 10, default_value=-3)
-    x1 = UniformFloatHyperparameter("x1", -5, 10, default_value=-4)
-    cs.add_hyperparameters([x0, x1])
-    con = LessThanCondition(x1, x0, 1.)
-    cs.add_condition(con)
-    return cs
-
-def build_branin_space(rng):
-    cs = ConfigurationSpace(seed=rng.randint(MAXINT))
-    x1 = UniformFloatHyperparameter("x1", -5, 10, default_value=0)
-    x2 = UniformFloatHyperparameter("x2", 0, 15, default_value=0)
-    cs.add_hyperparameters([x1, x2])
-    return cs
-
-if __name__ == "__main__":
-    MAX_CALL = 30
-    rng = np.random.RandomState(42)
-
-    test_model = Model(rng.randint(MAXINT), test_task='a6a', )
-
-    cs = ConfigurationSpace(seed=rng.randint(MAXINT))
-    confs = test_model.get_api_config()
-    for conf in confs:
-        cs.add_hyperparameter(UniformFloatHyperparameter(conf, confs[conf]['range'][0], confs[conf]['range'][1]))
-    blackbox_func = test_model.evaluate
-    base_models = []
-    for i in range(len(test_model.old_D_x)):
-        base_models.append(BaseModel(cs, rng=rng,do_optimize=False))
-        base_models[-1].train(test_model.old_D_x[i], test_model.old_D_y[i])
-
-    # use transfer
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='ei', weight_srategy='kernel', acq_opt='rs', base_models=base_models) # vanila bo
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='tst', acq_func='ei', weight_srategy='kernel', acq_opt='rs', base_models=base_models) # TST-R
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='taf', weight_srategy='kernel', acq_opt='rs', base_models=base_models) # TAF
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='tst', acq_func='ei', weight_srategy='rw', acq_opt='rs', base_models=base_models) # RGPE(mean)
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='taf', weight_srategy='rw', acq_opt='rs', base_models=base_models) # TAF(rw)
-    hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_func='mogp', weight_srategy='rw', acq_opt='rs', base_models=base_models) # RMoGP
-    # not use transfer
-    # hpopt = SMBO(space=cs, seed=rng.randint(MAXINT), suggest_limit=MAX_CALL, initial_design='sobol', surrogate='gp', acq_opt='rs_ls', base_models=[]]) 
-    # Example call of the black-box function
-    def_value = blackbox_func(cs.get_default_configuration())
-    print("Default Value: %.2f" % def_value)
-    # ---- Begin BO-loop ----
-    for i in range(MAX_CALL):
-        # suggest
-        trial_list = hpopt.suggest()
-        # evaluate 
-        value = blackbox_func(trial_list[0].config_dict)
-        # observe
-        trial_list[0].add_observe_value(observe_value=value)
-        hpopt.observe(trial_list=trial_list)
-        
-        print(value)
-    
-    # plt.plot(hpopt.trials.get_history()[0])
-    # plt.savefig('./out/rosenbrock_bo_gp.png')
-    # plt.show()
-    print('find best value:{}'.format(hpopt.trials.get_best()[0]))
-
diff --git a/xbbo/acquisition_function/transfer/taf.py b/xbbo/acquisition_function/transfer/taf.py
index 6d09864..dc4240a 100644
--- a/xbbo/acquisition_function/transfer/taf.py
+++ b/xbbo/acquisition_function/transfer/taf.py
@@ -95,8 +95,11 @@ class TAF_AcqFunc(AbstractAcquisitionFunction):
         # denominator = self.selfWeight
         f *= self.selfWeight
         for d in range(len(self.weight)):
-            f += self.weight[d] * (self.base_incuments[d] - self.pre_weight_model[d].predict(
-                X, None)[0]).clip(0)
+            base_pred_mean = self.pre_weight_model[d].predict(
+                X, None)[0]
+            if len(base_pred_mean.shape) == 1:
+                base_pred_mean = np.expand_dims(base_pred_mean, axis=-1)
+            f += self.weight[d] * (self.base_incuments[d] - base_pred_mean).clip(0)
             # denominator += self.weight[d]
 
         return f
diff --git a/xbbo/problem/base.py b/xbbo/problem/base.py
index 2104eb4..269c517 100644
--- a/xbbo/problem/base.py
+++ b/xbbo/problem/base.py
@@ -1,5 +1,5 @@
 import abc
-
+import numpy as np
 import ConfigSpace
 from xbbo.core.constants import Key
 
@@ -23,7 +23,7 @@ class AbstractBenchmark(object, metaclass=abc.ABCMeta):
         self.counter   = 0
 
         self.rng = create_rng(rng)
-        self.configuration_space = self.get_configuration_space()
+        # self.configuration_space = self.get_configuration_space()
 
     @abc.abstractmethod
     def objective_function(self, configuration, **kwargs):
diff --git a/xbbo/problem/fast_example_problem.py b/xbbo/problem/fast_example_problem.py
index 4c0570f..bb5cea0 100644
--- a/xbbo/problem/fast_example_problem.py
+++ b/xbbo/problem/fast_example_problem.py
@@ -16,7 +16,6 @@ from xbbo.core.constants import MAXINT, Key
 class Ackley(AbstractBenchmark):
     def __init__(self, dim=10, rng=np.random.RandomState(42)):
         self.dims      = dim
-        self.rng = rng
         self.keys = ["x_{}".format(i) for i in range(self.dims)]
         super().__init__(rng)
         self.get_configuration_space()
diff --git a/xbbo/problem/transfer_problem.py b/xbbo/problem/transfer_problem.py
new file mode 100644
index 0000000..c5b2cdf
--- /dev/null
+++ b/xbbo/problem/transfer_problem.py
@@ -0,0 +1,370 @@
+from abc import abstractmethod
+import os
+from enum import Enum
+from typing import Tuple, List, Callable
+import numpy as np
+import pandas as pd
+from pathlib import Path
+from ConfigSpace import ConfigurationSpace
+import ConfigSpace as CS
+from ConfigSpace.conditions import InCondition, LessThanCondition
+from ConfigSpace.hyperparameters import \
+    CategoricalHyperparameter, UniformFloatHyperparameter, UniformIntegerHyperparameter
+from xbbo.core.constants import MAXINT, Key
+from xbbo.problem.base import AbstractBenchmark
+
+class BenchName(Enum):
+    """Identifiers of the offline benchmarks that ``TransferBenchmark`` dispatches on."""
+    TST = 0
+    Table_deepar = 1
+    Table_fcnet = 2
+    Table_xgboost = 3
+    Table_nas102 = 4
+
+class TransferData():
+    """Base class of the offline data loaders; ``load_data`` memoises ``_load_data``."""
+    def __init__(self, bench_name:int, data_path_root:str, data_base_name:str, target_task_name:str) -> None:
+        self.bench_name = bench_name
+        self.data_base_name = data_base_name
+        self.data_path_root = data_path_root
+        self.target_task_name = target_task_name
+
+    def load_data(self,):
+        # Key on class, data location and task: two databases may share a task name.
+        key = (type(self), self.data_path_root, self.data_base_name, self.target_task_name)
+        if key not in CACHE_DATA:
+            CACHE_DATA[key] = self._load_data()
+        return CACHE_DATA[key]
+
+    def _load_data(self):
+        pass  # hook: subclasses return the loaded data
+
+    def get_configuration_space(self,):
+        pass  # hook: subclasses return the search space
+
+    @abstractmethod
+    def download_data(self,):
+        pass  # hook: subclasses fetch the data (or explain how to)
+
+    @property
+    def hp_names(self,):
+        return None  # subclasses return the hyperparameter names in column order
+
+# Module-level cache so that the same dataset is not loaded more than once
+CACHE_DATA = {}
+
+
+class TST_Data(TransferData):
+    """Loader for the TST benchmark: one text file per task under ``data_path_root/data_base_name``."""
+    def __init__(self, bench_name:int,data_path_root:str, data_base_name:str,target_task_name:str, download=True, sparse=False, hp_num=3,min_max_features=False, rng=np.random.RandomState(), **kwargs) -> None:
+        super().__init__(bench_name,data_path_root, data_base_name, target_task_name)
+        self.data_path = os.path.join(self.data_path_root, data_base_name)
+        self.min_max_features = min_max_features
+        self.sparse = sparse
+        self.hp_num = hp_num
+        self.download = download
+        self.url = "https://git.openi.org.cn/isleizhang/BBO-Datasets/datasets"
+        self.rng = rng
+        self.hp_keys = ['C', 'gamma', 'd']
+
+    def _load_data(self):
+        """Read every task file in ``self.data_path`` and split off the target task.
+
+        Each line holds space-separated floats: the label first, then the features.
+        Labels are negated (per the original TODO: to obtain a minimisation problem).
+
+        Returns:
+            ``(datasets_hp, datasets_label, test_task, test_task_label)``: the two
+            lists hold the remaining tasks, the last two items belong to
+            ``self.target_task_name``.
+
+        Raises:
+            ValueError: if no file is named ``self.target_task_name``.
+        """
+        if not os.path.exists(self.data_path):
+            assert self.download, 'ERROR: "{}" not exits.'.format(self.data_path)
+            self.download_data()
+        # sorted(): os.listdir() order is arbitrary; keep the task order reproducible
+        filenames = sorted(os.listdir(self.data_path))
+        datasets_hp = []
+        datasets_label = []
+        for filename in filenames:
+            with open(os.path.join(self.data_path, filename), 'r') as f:
+                # keep the label plus the next hp_num + 3 columns of every line
+                insts = [list(map(float, line.strip().split(' ')))[:self.hp_num + 1 + 3] for line in f]
+            # builtin float: the np.float alias was removed in NumPy 1.24
+            datasets = np.asarray(insts, dtype=float)
+            if self.sparse:
+                mask = datasets[:, 1] == 1
+                datasets_hp.append(datasets[mask, 1+3:])
+                datasets_label.append(-datasets[mask, 0:1])  # TODO convert to minimize problem (regret)
+            else:
+                datasets_hp.append(datasets[:, 1:])
+                datasets_label.append(-datasets[:, 0:1])  # TODO convert to minimize problem (regret)
+            # keep rows whose first remaining column is non-zero, then drop three columns
+            # NOTE(review): presumably indicator columns; with sparse=True the features
+            # were already sliced above, so this second slice looks suspicious -- confirm
+            mask = datasets_hp[-1][:, 0].astype(np.bool_)  # TODO
+            datasets_hp[-1] = datasets_hp[-1][mask, 3:]
+            datasets_label[-1] = datasets_label[-1][mask]
+        if self.min_max_features:
+            # min-max scaling of input features
+            from sklearn.preprocessing import MinMaxScaler
+            scaler = MinMaxScaler().fit(np.vstack(datasets_hp))
+            datasets_hp = [scaler.transform(X) for X in datasets_hp]
+        test_idx = filenames.index(self.target_task_name)
+        test_task = datasets_hp.pop(test_idx)
+        test_task_label = datasets_label.pop(test_idx)
+
+        return (datasets_hp, datasets_label, test_task, test_task_label)
+
+    def get_configuration_space(self):
+        if hasattr(self, "configuration_space"):
+            return self.configuration_space
+        self.configuration_space = ConfigurationSpace(seed=self.rng.randint(MAXINT))
+        x0 = UniformFloatHyperparameter("C", -1, 1)
+        x1 = UniformFloatHyperparameter("gamma", -1, 1)
+        x2 = UniformFloatHyperparameter("d", 0, 1)
+        self.configuration_space.add_hyperparameters([x0, x1, x2])
+        return self.configuration_space
+
+    @property
+    def hp_names(self,):
+        return self.hp_keys
+
+    def download_data(self):
+        raise NotImplementedError("plese download {} in {}".format(self.url, self.data_path))
+
+class Table_Data(TransferData):
+    """Loader for the tabular benchmarks: one CSV with a ``task`` column, ``hp_*`` columns and a metric column."""
+    blackbox_tasks = {
+        BenchName.Table_nas102: [
+            'cifar10',
+            'cifar100',
+            'ImageNet16-120'
+        ],
+        BenchName.Table_fcnet: [
+            'naval',
+            'parkinsons',
+            'protein',
+            'slice',
+        ],
+        BenchName.Table_deepar: [
+            'm4-Hourly',
+            'm4-Daily',
+            'm4-Weekly',
+            'm4-Monthly',
+            'm4-Quarterly',
+            'm4-Yearly',
+            'electricity',
+            'exchange-rate',
+            'solar',
+            'traffic',
+        ],
+        BenchName.Table_xgboost: [
+            'a6a',
+            'australian',
+            'german.numer',
+            'heart',
+            'ijcnn1',
+            'madelon',
+            'skin_nonskin',
+            'spambase',
+            'svmguide1',
+            'w6a'
+        ],
+    }
+
+    error_metric = {
+        BenchName.Table_deepar: 'metric_CRPS',
+        BenchName.Table_fcnet: 'metric_error',
+        BenchName.Table_nas102: 'metric_error',
+        BenchName.Table_xgboost: 'metric_error',
+    }
+
+    def __init__(self, bench_name:int,data_path_root:str, data_base_name:str, target_task_name:str, download=True, sparse=False, hp_num=3,min_max_features=False, rng=np.random.RandomState(), **kwargs) -> None:
+        super().__init__(bench_name,data_path_root, data_base_name, target_task_name)
+        self.data_path = os.path.join(data_path_root, data_base_name)
+        self.min_max_features = min_max_features
+        self.sparse = sparse
+        self.hp_num = hp_num
+        self.download = download
+        self.url = "https://git.openi.org.cn/isleizhang/BBO-Datasets/datasets"
+        self.rng = rng
+        self._metric_col = self.error_metric[bench_name]
+
+    def _load_data(self):
+        """Read the table; return ``[Xs_train, ys_train, X_test, y_test]`` and set ``self.hp_keys``."""
+        if not os.path.exists(self.data_path):
+            assert self.download, 'ERROR: "{}" not exits.'.format(self.data_path)
+            self.download_data()
+        df = pd.read_csv(self.data_path)
+        assert self.target_task_name in df.task.unique()
+        assert self._metric_col in df.columns
+
+        # the hp columns do not depend on the task, so collect them once
+        hp_cols = [c for c in sorted(df.columns) if c.startswith("hp_")]
+        Xy_dict = {}
+        for task in sorted(df.task.unique()):
+            mask = df.loc[:, 'task'] == task
+            X = df.loc[mask, hp_cols].values
+            y = df.loc[mask, self._metric_col].values
+            if len(y.shape) == 1:
+                y = np.expand_dims(y, axis=1)
+            Xy_dict[task] = X, y
+
+        # todo it would be better done as a post-processing step
+        if self.bench_name in [BenchName.Table_fcnet, BenchName.Table_nas102]:
+            # one-hot encode *all* hp columns: every hp of these two blackboxes is categorical
+            from sklearn.preprocessing import OneHotEncoder
+            try:
+                enc = OneHotEncoder(handle_unknown='ignore', sparse_output=False)
+            except TypeError:  # scikit-learn < 1.2 only knows the old ``sparse`` name
+                enc = OneHotEncoder(handle_unknown='ignore', sparse=False)
+            enc.fit(df.loc[:, hp_cols])
+            for task, (X, y) in Xy_dict.items():
+                Xy_dict[task] = enc.transform(X), y
+
+        if self.min_max_features:
+            # min-max scaling of input features
+            from sklearn.preprocessing import MinMaxScaler
+            X = np.vstack([X for (X, y) in Xy_dict.values()])
+            scaler = MinMaxScaler().fit(X)
+            Xy_dict = {t: (scaler.transform(X), y) for (t, (X, y)) in Xy_dict.items()}
+
+        Xys_train = [Xy_dict[t] for t in df.task.unique() if t != self.target_task_name]
+        Xy_test = Xy_dict[self.target_task_name]
+        self.hp_keys = [f'hp_{i}' for i in range(Xy_test[0].shape[1])]
+        L = list(zip(*Xys_train))
+        L.extend(Xy_test)
+        return L
+
+    def get_configuration_space(self):
+        if hasattr(self, "configuration_space"):
+            return self.configuration_space
+        # use hp_names, not self.hp_keys: the latter is only set when _load_data() really runs
+        cs = ConfigurationSpace(seed=self.rng.randint(MAXINT))
+        cs.add_hyperparameters([UniformFloatHyperparameter(name, 0, 1) for name in self.hp_names])
+        self.configuration_space = cs
+        return cs
+
+    @property
+    def hp_names(self,):
+        return [f'hp_{i}' for i in range(self.load_data()[2].shape[1])]  # also valid on a cache hit
+
+    def download_data(self):
+        raise NotImplementedError("plese download {} in {}".format(self.url, self.data_path))
+
+class TransferBenchmark(AbstractBenchmark):
+    """Offline benchmark: a query is answered by nearest-neighbour lookup in the target task's recorded evaluations."""
+    def __init__(self, bench_name:int, data_base_name:str, target_task_name:str, rng=np.random.RandomState(), normalize_y=False, data_path_root='./data',**kwargs):
+        """Build the benchmark for ``target_task_name``; extra kwargs go to the data loader.
+
+        With ``normalize_y`` the targets of the other tasks are min-max scaled per task.
+        """
+        self.bench_name = bench_name
+        self.target_task_name = target_task_name
+        self.normalize_y = normalize_y
+        self.data_path_root = data_path_root
+        super().__init__(rng)
+
+        if bench_name == BenchName.TST:
+            self.data_loader = TST_Data(bench_name=bench_name,data_path_root=data_path_root, data_base_name=data_base_name,target_task_name=target_task_name, rng=self.rng,**kwargs)
+        elif bench_name in [BenchName.Table_deepar, BenchName.Table_fcnet, BenchName.Table_nas102, BenchName.Table_xgboost]:
+            self.data_loader = Table_Data(bench_name=bench_name,data_path_root=data_path_root, data_base_name=data_base_name,target_task_name=target_task_name,min_max_features=True, rng=self.rng,**kwargs)
+        else:
+            # NotImplemented is a constant, not an exception; raising it is a TypeError
+            raise NotImplementedError("unknown bench_name: {}".format(bench_name))
+        self._old_D_x, self._old_D_y, _new_D_x, _new_D_y = self.data_loader.load_data()
+        if normalize_y:
+            # must run after load_data(); a new list keeps the cached arrays untouched
+            self._old_D_y = [(y - y.min())/(y.max()-y.min()) for y in self._old_D_y]
+        self._bbfunc = BlackboxOffline(_new_D_x, _new_D_y)
+        self._best_f = min(_new_D_y).item()
+        self._f_range = max(_new_D_y).item() - self._best_f
+        # axis=0: y is a column, sorting the default last axis would be a no-op
+        self._sorted_new_D_y = np.sort(_new_D_y, axis=0).ravel()
+        self.get_configuration_space()
+        self.idxs = np.argsort([self.configuration_space.get_idx_by_hyperparameter_name(name) for name in self.data_loader.hp_names])
+
+    @AbstractBenchmark._check_configuration
+    def objective_function(self, config, **kwargs):
+        f = self._bbfunc(np.asarray([config[k] for k in self.data_loader.hp_names])).item()
+        y = (f - self._best_f) / self._f_range if self.normalize_y else f
+        # with normalize_y the value is shifted and scaled by the target task's best value and range
+        return {Key.FUNC_VALUE: y}
+
+    @AbstractBenchmark._check_configuration
+    def objective_function_test(self, config, **kwargs):
+        return self.objective_function(config, **kwargs)
+
+    def get_configuration_space(self,):
+        if hasattr(self, "configuration_space"):
+            return self.configuration_space
+        self.configuration_space = self.data_loader.get_configuration_space()
+        return self.configuration_space
+
+    def get_old_data(self):
+        return np.take(self._old_D_x, self.idxs, axis=-1), self._old_D_y
+
+    def get_old_configurations(self,):
+        return CS.Configuration(self.configuration_space, vector=np.take(self._old_D_x,self.idxs, axis=-1)), self._old_D_y
+
+    @staticmethod
+    def get_meta_information():
+        return {'name': 'Test Function: Transfer blackbox benchmark'}
+
+class Blackbox:
+    """Callable wrapper around ``eval_fun`` that asserts the input and output shapes."""
+    def __init__(
+            self,
+            input_dim: int,
+            output_dim: int,
+            eval_fun: Callable[[np.array], np.array],
+    ):
+        self.eval_fun = eval_fun
+        self.input_dim, self.output_dim = input_dim, output_dim
+
+    def __call__(self, x: np.array) -> np.array:
+        """Evaluate the wrapped function at one point.
+        :param x: shape (input_dim,)
+        :return: shape (output_dim,)
+        """
+        assert x.shape == (self.input_dim,)
+        result = self.eval_fun(x)
+        assert result.shape == (self.output_dim,)
+        return result
+
+
+class BlackboxOffline(Blackbox):
+    def __init__(
+            self,
+            X: np.array,
+            y: np.array,
+    ):
+        """
+        Blackbox backed by a table of known evaluations.
+        A query returns the output recorded for the nearest known input
+        (1-nearest-neighbour regression).
+        :param X: evaluated inputs, shape (n, input_dim)
+        :param y: recorded outputs, shape (n, output_dim)
+        """
+        assert len(X) == len(y)
+        _, input_dim = X.shape
+        _, output_dim = y.shape
+
+        from sklearn.neighbors import KNeighborsRegressor
+        nearest = KNeighborsRegressor(n_neighbors=1).fit(X, y)
+
+        def lookup(x):
+            # predict() expects a 2-D batch; take the single row of the result
+            return nearest.predict(x.reshape(1, -1))[0]
+
+        super().__init__(
+            input_dim=input_dim, output_dim=output_dim, eval_fun=lookup)
+        
+        
+if __name__ == "__main__":  # manual smoke test; reads DeepAR.csv.zip from ./data/offline_evaluations
+    bench = TransferBenchmark(BenchName.Table_deepar, 'DeepAR.csv.zip', target_task_name="m4-Hourly", data_path_root='./data/offline_evaluations')
+    cs = bench.get_configuration_space()
+    bench(cs.get_default_configuration())  # evaluate the default configuration once
\ No newline at end of file
diff --git a/xbbo/search_algorithm/transfer_bo_optimizer.py b/xbbo/search_algorithm/transfer_bo_optimizer.py
index d5945a1..dee9e62 100644
--- a/xbbo/search_algorithm/transfer_bo_optimizer.py
+++ b/xbbo/search_algorithm/transfer_bo_optimizer.py
@@ -17,11 +17,12 @@ logger = logging.getLogger(__name__)
 
 
 @alg_register.register('bo-transfer')
-class SMBO(AbstractOptimizer):
+class TransferBO(AbstractOptimizer):
     def __init__(self,
-                 space: DenseConfigurationSpace,
+                 space,
                  seed: int = 42,
                  initial_design: str = 'sobol',
+                 init_budget: int = None,
                  suggest_limit: int = np.inf,
                  surrogate: str = 'gp',
                  acq_func: str = 'ei',
@@ -37,81 +38,27 @@ class SMBO(AbstractOptimizer):
                                    suggest_limit=suggest_limit,
                                    **kwargs)
         self.predict_x_best = predict_x_best
-        self.dimension = self.space.get_dimensions()
+        self.dimension = self.space.get_dimensions(sparse=True)
 
         self.initial_design = ALL_avaliable_design[initial_design](
-            self.space, self.rng, ta_run_limit=suggest_limit, **kwargs)
+            self.space,
+            self.rng,
+            ta_run_limit=suggest_limit,
+            init_budget=init_budget,
+            **kwargs)
         self.init_budget = self.initial_design.init_budget
         self.hp_num = len(self.space)
         self.initial_design_configs = self.initial_design.select_configurations(
         )
-        self.trials = Trials(space,dim=self.dimension)
+        self.trials = Trials(space, dim=self.dimension)
 
         # self.rho = kwargs.get("rho", 1)
         self.bandwidth = kwargs.get("bandwdth", 0.1)
-        self.base_models = kwargs.get("base_models")
-        if self.base_models:
-            assert isinstance(self.base_models[0], BaseModel)
-            if surrogate == 'gp':
-                self.surrogate_model = GPR_sklearn(self.space, rng=self.rng)
-            elif surrogate == 'tst':
-                self.surrogate_model = TST_surrogate(self.space,
-                                                     self.base_models,
-                                                     rng=self.rng)
-        else:
-            raise NotImplementedError()
-        if weight_srategy == 'kernel':
-            self.weight_sratety = KernelRegress(self.space, self.base_models,
-                                                self.surrogate_model, self.rng)
-        elif weight_srategy == 'rw':
-            self.weight_sratety = RankingWeight(self.space,
-                                                self.base_models,
-                                                self.surrogate_model,
-                                                self.rng,
-                                                budget=suggest_limit,
-                                                is_purn=True)
-        elif weight_srategy == 'zero':
-            self.weight_sratety = ZeroWeight(self.space, self.base_models,
-                                             self.surrogate_model, self.rng)
-        else:
-            raise NotImplementedError()
-
-        if acq_func == 'mogp':
-            self.acquisition_func = MoGP_AcqFunc(self.surrogate_model,
-                                                 self.base_models, self.rng)
-        elif acq_func == 'taf':
-            self.acquisition_func = TAF_AcqFunc(self.surrogate_model,
-                                                self.base_models, self.rng)
-        elif acq_func == 'ei':
-            self.acquisition_func = EI_AcqFunc(self.surrogate_model, self.rng)
-        else:
-            raise NotImplementedError()
-
-        if acq_opt == 'ls':
-            self.acq_maximizer = LocalSearch(self.acquisition_func, self.space,
-                                             self.rng)
-        elif acq_opt == 'rs':
-            self.acq_maximizer = RandomSearch(self.acquisition_func,
-                                              self.space, self.rng)
-        elif acq_opt == 'rs_ls':
-            self.acq_maximizer = InterleavedLocalAndRandomSearch(
-                self.acquisition_func, self.space, self.rng)
-        elif acq_opt == 'scipy':
-            self.acq_maximizer = ScipyOptimizer(self.acquisition_func,
-                                                self.space, self.rng)
-        elif acq_opt == 'scipy_global':
-            self.acq_maximizer = ScipyGlobalOptimizer(self.acquisition_func,
-                                                      self.space, self.rng)
-        elif acq_opt == 'r_scipy':
-            self.acq_maximizer = RandomScipyOptimizer(self.acquisition_func,
-                                                      self.space, self.rng)
-        else:
-            raise ValueError('acq_opt {} not in {}'.format(
-                acq_opt,
-                ['ls', 'rs', 'rs_ls', 'scipy', 'scipy_global', 'r_scipy']))
-        logger.info(
-            "Execute Bayesian optimization...\n [Using ({})surrogate, ({})acquisition function, ({})acquisition optmizer]"
-            .format(surrogate, acq_func, acq_opt))
+        self._surrogate = surrogate
+        self._acq_func = acq_func
+        self._weight_srategy = weight_srategy
+        self._acq_opt = acq_opt
+        self._suggest_limit = suggest_limit
 
     def _suggest(self, n_suggestions=1):
         trial_list = []
@@ -126,7 +73,7 @@ class SMBO(AbstractOptimizer):
                 trial_list.append(
                     Trial(configuration=config,
                           config_dict=config.get_dictionary(),
-                          array=config.get_array(sparse=False)))
+                          array=config.get_array(sparse=True)))
         else:
             # update target surrogate model
             self.surrogate_model.train(
@@ -160,7 +107,7 @@ class SMBO(AbstractOptimizer):
                         trial_list.append(
                             Trial(configuration=config,
                                   config_dict=config.get_dictionary(),
-                                  array=config.get_array(sparse=False)))
+                                  array=config.get_array(sparse=True)))
                         _idx += 1
 
                         break
@@ -216,5 +163,97 @@ class SMBO(AbstractOptimizer):
 
         return x_best_array, best_observation
 
+    def get_transfer_knowledge(self, old_D_X, old_D_y):
+        """Fit base models on old-task data and build the BO components.
+
+        One ``BaseModel`` is trained per entry of ``old_D_X``; the target
+        surrogate, weight strategy, acquisition function and acquisition
+        maximizer are then created from the names stored on the instance.
+
+        Args:
+            old_D_X: Indexable collection; ``old_D_X[i]`` is passed to
+                ``BaseModel.train`` together with ``old_D_y[i]``.
+            old_D_y: Indexable collection aligned with ``old_D_X``.
+
+        Raises:
+            NotImplementedError: If ``old_D_X`` is empty, or the surrogate,
+                weight strategy or acquisition function name is unknown.
+            ValueError: If the acquisition optimizer name is unknown.
+        """
+        self.base_models = []
+        for i, task_X in enumerate(old_D_X):
+            self.base_models.append(
+                BaseModel(self.space, rng=self.rng, do_optimize=False))
+            self.base_models[-1].train(task_X, old_D_y[i])
+        if not self.base_models:
+            raise NotImplementedError(
+                'transfer without old-task data is not supported')
+
+        if self._surrogate == 'gp':
+            self.surrogate_model = GPR_sklearn(self.space, rng=self.rng)
+        elif self._surrogate == 'tst':
+            self.surrogate_model = TST_surrogate(self.space,
+                                                 self.base_models,
+                                                 rng=self.rng)
+        else:
+            # Fail here instead of continuing without a surrogate assigned
+            # by this method.
+            raise NotImplementedError('surrogate {} not in {}'.format(
+                self._surrogate, ['gp', 'tst']))
+
+        if self._weight_srategy == 'kernel':
+            self.weight_sratety = KernelRegress(self.space, self.base_models,
+                                                self.surrogate_model, self.rng)
+        elif self._weight_srategy == 'rw':
+            self.weight_sratety = RankingWeight(self.space,
+                                                self.base_models,
+                                                self.surrogate_model,
+                                                self.rng,
+                                                budget=self._suggest_limit,
+                                                is_purn=True)
+        elif self._weight_srategy == 'zero':
+            self.weight_sratety = ZeroWeight(self.space, self.base_models,
+                                             self.surrogate_model, self.rng)
+        else:
+            raise NotImplementedError('weight_srategy {} not in {}'.format(
+                self._weight_srategy, ['kernel', 'rw', 'zero']))
+
+        if self._acq_func == 'mogp':
+            self.acquisition_func = MoGP_AcqFunc(self.surrogate_model,
+                                                 self.base_models, self.rng)
+        elif self._acq_func == 'taf':
+            self.acquisition_func = TAF_AcqFunc(self.surrogate_model,
+                                                self.base_models, self.rng)
+        elif self._acq_func == 'ei':
+            self.acquisition_func = EI_AcqFunc(self.surrogate_model, self.rng)
+        else:
+            raise NotImplementedError('acq_func {} not in {}'.format(
+                self._acq_func, ['mogp', 'taf', 'ei']))
+
+        if self._acq_opt == 'ls':
+            self.acq_maximizer = LocalSearch(self.acquisition_func, self.space,
+                                             self.rng)
+        elif self._acq_opt == 'rs':
+            self.acq_maximizer = RandomSearch(self.acquisition_func,
+                                              self.space, self.rng)
+        elif self._acq_opt == 'rs_ls':
+            self.acq_maximizer = InterleavedLocalAndRandomSearch(
+                self.acquisition_func, self.space, self.rng)
+        elif self._acq_opt == 'scipy':
+            self.acq_maximizer = ScipyOptimizer(self.acquisition_func,
+                                                self.space, self.rng)
+        elif self._acq_opt == 'scipy_global':
+            self.acq_maximizer = ScipyGlobalOptimizer(self.acquisition_func,
+                                                      self.space, self.rng)
+        elif self._acq_opt == 'r_scipy':
+            self.acq_maximizer = RandomScipyOptimizer(self.acquisition_func,
+                                                      self.space, self.rng)
+        else:
+            raise ValueError('acq_opt {} not in {}'.format(
+                self._acq_opt,
+                ['ls', 'rs', 'rs_ls', 'scipy', 'scipy_global', 'r_scipy']))
+        logger.info(
+            "Execute Bayesian optimization...\n [Using ({})surrogate, ({})acquisition function, ({})acquisition optmizer]"
+            .format(self._surrogate, self._acq_func, self._acq_opt))
 
-opt_class = SMBO
+opt_class = TransferBO
diff --git a/xbbo/surrogate/gaussian_process.py b/xbbo/surrogate/gaussian_process.py
index d846218..07c1904 100644
--- a/xbbo/surrogate/gaussian_process.py
+++ b/xbbo/surrogate/gaussian_process.py
@@ -404,22 +404,3 @@ class GPR_sklearn(BaseGP):
                 f_opt_star = f_opt
                 theta_star = theta
         return theta_star
-
-    # def _set_has_conditions(self) -> None:
-    #     has_conditions = len(self.configspace.get_conditions()) > 0
-    #     to_visit = []
-    #     to_visit.append(self.kernel)
-    #     while len(to_visit) > 0:
-    #         current_param = to_visit.pop(0)
-    #         if isinstance(current_param,
-    #                       sklearn.gaussian_process.kernels.KernelOperator):
-    #             to_visit.insert(0, current_param.k1)
-    #             to_visit.insert(1, current_param.k2)
-    #             current_param.has_conditions = has_conditions
-    #         elif isinstance(current_param,
-    #                         sklearn.gaussian_process.kernels.Kernel):
-    #             current_param.has_conditions = has_conditions
-    #         else:
-    #             raise ValueError(current_param)
-
-
diff --git a/xbbo/surrogate/transfer/weight_stategy.py b/xbbo/surrogate/transfer/weight_stategy.py
index bc31042..ba912f0 100644
--- a/xbbo/surrogate/transfer/weight_stategy.py
+++ b/xbbo/surrogate/transfer/weight_stategy.py
@@ -173,7 +173,7 @@ class KernelRegress(ABCWeightStategy):
         base_model_means = []
         for model in self.base_models:
             base_model_means.append(
-                model._predict_normalize(trials.get_sparse_array(), None)[0])
+                model._predict_normalize(trials.get_array(), None)[0])
         if not base_model_means:
             return []
         base_model_means = np.stack(base_model_means)  # [model, obs_num, 1]
diff --git a/xbbo/utils/util.py b/xbbo/utils/util.py
index 426475c..e367389 100644
--- a/xbbo/utils/util.py
+++ b/xbbo/utils/util.py
@@ -1,10 +1,13 @@
+from typing import Optional
 import numpy as np
 import pickle, os, json
 from ConfigSpace.hyperparameters import (CategoricalHyperparameter,
                                          OrdinalHyperparameter, Constant,
                                          UniformFloatHyperparameter,
                                          UniformIntegerHyperparameter)
+import urllib
 
+import tqdm
 
 def dumpOBJ(path, filename, obj):
     with open(os.path.join(path, filename), 'wb') as f:
@@ -105,4 +108,59 @@ def create_rng(rng):
         return np.random.RandomState(rng)
     else:
         raise ValueError("%s is neither a number nor a RandomState. "
-                         "Initializing RandomState failed")
\ No newline at end of file
+                         "Initializing RandomState failed")
+
+
+def download_and_extract_archive(
+    url: str,
+    download_root: str,
+    extract_root: Optional[str] = None,
+    filename: Optional[str] = None,
+    remove_finished: bool = False,
+) -> None:
+    """Download a zip archive and unpack it.
+
+    The archive is fetched and extracted with the standard library, so no
+    shell command is built from the arguments.
+
+    Args:
+        url: Location of the zip archive to download.
+        download_root: Directory the archive is saved in; ``~`` is expanded.
+        extract_root: Directory the archive is unpacked into. Defaults to
+            ``download_root``.
+        filename: Name of the saved archive. Defaults to the last path
+            component of ``url``.
+        remove_finished: If true, delete the archive after extraction.
+
+    Raises:
+        urllib.error.URLError: If the download fails.
+        zipfile.BadZipFile: If the downloaded file is not a zip archive.
+    """
+    # Local imports: this helper does not rely on module-level imports for
+    # the download and extraction machinery.
+    import shutil
+    import urllib.request
+    import zipfile
+
+    download_root = os.path.expanduser(download_root)
+    if extract_root is None:
+        extract_root = download_root
+    # An empty root means the current directory.
+    extract_root = os.path.expanduser(extract_root) or os.curdir
+    if not filename:
+        filename = os.path.basename(url)
+
+    archive_path = os.path.join(download_root, filename)
+    # ``filename`` may itself contain directories, so create its real parent.
+    os.makedirs(os.path.dirname(archive_path) or os.curdir, exist_ok=True)
+    os.makedirs(extract_root, exist_ok=True)
+
+    with urllib.request.urlopen(url) as response, \
+            open(archive_path, 'wb') as archive_file:
+        shutil.copyfileobj(response, archive_file)
+
+    with zipfile.ZipFile(archive_path) as archive:
+        archive.extractall(extract_root)
+
+    if remove_finished:
+        os.remove(archive_path)