|
- [
- {
- "Name": "llama finetune npu",
- "Description": "",
- "JobType": "TRAIN",
- "Cluster": "C2Net",
- "ComputeSource": "NPU",
- "HasInternet": 2,
- "AccCardsNum": 1,
- "AccCardType": "ASCEND910",
- "CpuCores": 24,
- "MemGiB": 96,
- "GPUMemGiB": 32,
- "ShareMemGiB": 0,
- "Image": {
- "ImageID": "0b79fed7504c4etrain0llamafactory",
- "ImageName": "torch-npu-cann8-train",
- "ImageUrl": ""
- },
- "PretrainModelList": [
- {
- "ID": "94f3dd64-2a66-4612-bb7d-6ca5cac7b2f2",
- "ModelName": "Qwen2-0.5B"
- }
- ],
- "DatasetList": [
- {
- "ID": "a924818a-b82c-4c48-bf78-dd517077244f",
- "DatasetName": "huanhuan.zip"
- },
- {
- "ID": "937a8ab2-3c01-4be7-a4a0-c59be18809d1",
- "DatasetName": "glaive_toolcall_zh_demo.zip"
- }
- ],
- "BranchName": "master",
- "BootFile": "finetune.py",
- "Parameters": [
- {
- "Label": "stage",
- "Value": "sft"
- },
- {
- "Label": "preprocessing_numworkers",
- "Value": "16"
- },
- {
- "Label": "finetuning_type",
- "Value": "lora"
- },
- {
- "Label": "template",
- "Value": "qwen"
- },
- {
- "Label": "dataset",
- "Value": "huanhuan,glaive_toolcall_zh_demo"
- },
- {
- "Label": "model_name",
- "Value": "Qwen2-0.5B"
- },
- {
- "Label": "cutoff_len",
- "Value": "1024"
- },
- {
- "Label": "learning_rate",
- "Value": "1.0e-4"
- },
- {
- "Label": "num_train_epochs",
- "Value": "3"
- },
- {
- "Label": "max_samples",
- "Value": "1000"
- },
- {
- "Label": "per_device_train_batch_size",
- "Value": "1"
- },
- {
- "Label": "gradient_accumulation_steps",
- "Value": "2"
- },
- {
- "Label": "lr_scheduler_type",
- "Value": "cosine"
- },
- {
- "Label": "logging_steps",
- "Value": "10"
- },
- {
- "Label": "save_steps",
- "Value": "500"
- },
- {
- "Label": "warmup_ratio",
- "Value": "0.1"
- },
- {
- "Label": "val_size",
- "Value": "0.1"
- },
- {
- "Label": "per_device_eval_batch_size",
- "Value": "1"
- },
- {
- "Label": "eval_strategy",
- "Value": "steps"
- },
- {
- "Label": "eval_steps",
- "Value": "500"
- },
- {
- "Label": "plot_loss",
- "Value": "true"
- },
- {
- "Label": "overwrite_output_dir",
- "Value": "true"
- },
- {
- "Label": "fp16",
- "Value": "true"
- },
- {
- "Label": "overwrite_cache",
- "Value": "true"
- }
- ]
- },
- {
- "Name": "llama finetune gpu",
- "Description": "",
- "JobType": "TRAIN",
- "Cluster": "C2Net",
- "ComputeSource": "GPU",
- "HasInternet": 2,
- "AccCardsNum": 1,
- "AccCardType": "V100",
- "CpuCores": 8,
- "MemGiB": 50,
- "GPUMemGiB": 32,
- "ShareMemGiB": 0,
- "Image": {
- "ImageID": "",
- "ImageName": "",
- "ImageUrl": "192.168.242.22:443/default-workspace/2a72307689ae49758c80c896fffda0a1/image:llama-factory-gpu-v2"
- },
- "PretrainModelList": [
- {
- "ID": "94f3dd64-2a66-4612-bb7d-6ca5cac7b2f2",
- "ModelName": "Qwen2-0.5B"
- }
- ],
- "DatasetList": [
- {
- "ID": "a924818a-b82c-4c48-bf78-dd517077244f",
- "DatasetName": "huanhuan.zip"
- },
- {
- "ID": "30e51e73-28b5-4040-a3ea-e63ca8332dba",
- "DatasetName": "alpaca_zh_demo.zip"
- }
- ],
- "BranchName": "master",
- "BootFile": "finetune.py",
- "Parameters": [
- {
- "Label": "stage",
- "Value": "sft"
- },
- {
- "Label": "preprocessing_numworkers",
- "Value": "16"
- },
- {
- "Label": "finetuning_type",
- "Value": "lora"
- },
- {
- "Label": "template",
- "Value": "qwen"
- },
- {
- "Label": "dataset",
- "Value": "huanhuan,alpaca_zh_demo"
- },
- {
- "Label": "cutoff_len",
- "Value": "1024"
- },
- {
- "Label": "learning_rate",
- "Value": "1.0e-4"
- },
- {
- "Label": "num_train_epochs",
- "Value": "3"
- },
- {
- "Label": "max_samples",
- "Value": "1000"
- },
- {
- "Label": "per_device_train_batch_size",
- "Value": "1"
- },
- {
- "Label": "gradient_accumulation_steps",
- "Value": "2"
- },
- {
- "Label": "lr_scheduler_type",
- "Value": "cosine"
- },
- {
- "Label": "logging_steps",
- "Value": "10"
- },
- {
- "Label": "save_steps",
- "Value": "500"
- },
- {
- "Label": "warmup_ratio",
- "Value": "0.1"
- },
- {
- "Label": "val_size",
- "Value": "0.1"
- },
- {
- "Label": "per_device_eval_batch_size",
- "Value": "1"
- },
- {
- "Label": "eval_strategy",
- "Value": "steps"
- },
- {
- "Label": "eval_steps",
- "Value": "500"
- },
- {
- "Label": "model_name",
- "Value": "Qwen2-0.5B"
- },
- {
- "Label": "plot_loss",
- "Value": "true"
- },
- {
- "Label": "overwrite_output_dir",
- "Value": "true"
- },
- {
- "Label": "fp16",
- "Value": "true"
- },
- {
- "Label": "overwrite_cache",
- "Value": "true"
- }
- ]
- },
- {
- "Name": "llama finetune gpgpu",
- "Description": "",
- "JobType": "TRAIN",
- "Cluster": "C2Net",
- "ComputeSource": "ILUVATAR-GPGPU",
- "HasInternet": 2,
- "AccCardsNum": 1,
- "AccCardType": "BI-V100",
- "CpuCores": 30,
- "MemGiB": 64,
- "GPUMemGiB": 32,
- "ShareMemGiB": 0,
- "Image": {
- "ImageID": "",
- "ImageName": "",
- "ImageUrl": "10.208.20.54:1443/default-workspace/1e53e45fca0f4b44b15ca8d00025f2ba/image:llama-factory-gpgpu-train-v2"
- },
- "PretrainModelList": [
- {
- "ID": "94f3dd64-2a66-4612-bb7d-6ca5cac7b2f2",
- "ModelName": "Qwen2-0.5B"
- }
- ],
- "DatasetList": [
- {
- "ID": "30e51e73-28b5-4040-a3ea-e63ca8332dba",
- "DatasetName": "alpaca_zh_demo.zip"
- },
- {
- "ID": "a924818a-b82c-4c48-bf78-dd517077244f",
- "DatasetName": "huanhuan.zip"
- }
- ],
- "BranchName": "master",
- "BootFile": "finetune_gpgpu.py",
- "Parameters": [
- {
- "Label": "stage",
- "Value": "sft"
- },
- {
- "Label": "preprocessing_numworkers",
- "Value": "16"
- },
- {
- "Label": "finetuning_type",
- "Value": "lora"
- },
- {
- "Label": "template",
- "Value": "qwen"
- },
- {
- "Label": "dataset",
- "Value": "alpaca_zh_demo,huanhuan"
- },
- {
- "Label": "cutoff_len",
- "Value": "1024"
- },
- {
- "Label": "learning_rate",
- "Value": "1.0e-4"
- },
- {
- "Label": "num_train_epochs",
- "Value": "3"
- },
- {
- "Label": "max_samples",
- "Value": "1000"
- },
- {
- "Label": "per_device_train_batch_size",
- "Value": "1"
- },
- {
- "Label": "gradient_accumulation_steps",
- "Value": "2"
- },
- {
- "Label": "lr_scheduler_type",
- "Value": "cosine"
- },
- {
- "Label": "logging_steps",
- "Value": "10"
- },
- {
- "Label": "save_steps",
- "Value": "500"
- },
- {
- "Label": "warmup_ratio",
- "Value": "0.1"
- },
- {
- "Label": "val_size",
- "Value": "0.1"
- },
- {
- "Label": "per_device_eval_batch_size",
- "Value": "1"
- },
- {
- "Label": "eval_strategy",
- "Value": "steps"
- },
- {
- "Label": "eval_steps",
- "Value": "500"
- },
- {
- "Label": "model_name",
- "Value": "Qwen2-0.5B"
- },
- {
- "Label": "plot_loss",
- "Value": "true"
- },
- {
- "Label": "overwrite_output_dir",
- "Value": "true"
- },
- {
- "Label": "fp16",
- "Value": "true"
- },
- {
- "Label": "overwrite_cache",
- "Value": "true"
- }
- ]
- },
- {
- "Name": "Baichuan2-7b-base G",
- "Description": "",
- "JobType": "TRAIN",
- "Cluster": "C2Net",
- "ComputeSource": "GPU",
- "HasInternet": 2,
- "AccCardsNum": 1,
- "AccCardType": "V100",
- "CpuCores": 8,
- "MemGiB": 50,
- "GPUMemGiB": 32,
- "ShareMemGiB": 0,
- "Image": {
- "ImageID": "",
- "ImageName": "",
- "ImageUrl": "192.168.242.22:443/default-workspace/fccb038c23234b9e80105d4ccd152117/image:ChatGLM3-6B"
- },
- "PretrainModelList": [
- {
- "ID": "b5ec0a05-624c-44ea-aeda-0ab8a3bef65a",
- "ModelName": "Baichuan2-7b-base"
- }
- ],
- "DatasetList": [
- {
- "ID": "a924818a-b82c-4c48-bf78-dd517077244f",
- "DatasetName": "huanhuan.zip"
- },
- {
- "ID": "30e51e73-28b5-4040-a3ea-e63ca8332dba",
- "DatasetName": "alpaca_zh_demo.zip"
- }
- ],
- "BranchName": "master",
- "BootFile": "finetune.py",
- "Parameters": [
- {
- "Label": "stage",
- "Value": "sft"
- },
- {
- "Label": "preprocessing_numworkers",
- "Value": "16"
- },
- {
- "Label": "finetuning_type",
- "Value": "lora"
- },
- {
- "Label": "template",
- "Value": "baichuan2"
- },
- {
- "Label": "dataset",
- "Value": "huanhuan,alpaca_zh_demo"
- },
- {
- "Label": "cutoff_len",
- "Value": "1024"
- },
- {
- "Label": "learning_rate",
- "Value": "1.0e-4"
- },
- {
- "Label": "num_train_epochs",
- "Value": "1"
- },
- {
- "Label": "max_samples",
- "Value": "1000"
- },
- {
- "Label": "per_device_train_batch_size",
- "Value": "1"
- },
- {
- "Label": "gradient_accumulation_steps",
- "Value": "2"
- },
- {
- "Label": "lr_scheduler_type",
- "Value": "cosine"
- },
- {
- "Label": "logging_steps",
- "Value": "10"
- },
- {
- "Label": "save_steps",
- "Value": "500"
- },
- {
- "Label": "warmup_ratio",
- "Value": "0.1"
- },
- {
- "Label": "val_size",
- "Value": "0.1"
- },
- {
- "Label": "per_device_eval_batch_size",
- "Value": "1"
- },
- {
- "Label": "eval_strategy",
- "Value": "steps"
- },
- {
- "Label": "eval_steps",
- "Value": "500"
- },
- {
- "Label": "model_name",
- "Value": "Baichuan2-7b-base"
- },
- {
- "Label": "plot_loss",
- "Value": "true"
- },
- {
- "Label": "overwrite_output_dir",
- "Value": "true"
- },
- {
- "Label": "fp16",
- "Value": "true"
- },
- {
- "Label": "overwrite_cache",
- "Value": "true"
- }
- ]
- }
- ]
|