Crystalcareai
/

Qwen1.5-8x7b

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

Crystalcareai committed on Feb 20

Commit

f3a237e

•

1 Parent(s): 65a5134

Delete AxolotlConfig.txt

Files changed (1) hide show

AxolotlConfig.txt +0 -74

AxolotlConfig.txt DELETED Viewed

@@ -1,74 +0,0 @@
-base_model: Crystalcareai/Qwen-1.5-8x7B
-model_type: Qwen2ForCausalLM
-tokenizer_type: Qwen2Tokenizer
-trust_remote_code: true
-load_in_8bit: false
-load_in_4bit: true
-strict: false
-datasets:
-  - path: Crystalcareai/MoD
-    type: sharegpt
-dataset_prepared_path: last_run_prepared
-val_set_size: 0.0
-output_dir: ./qlora-out
-model_config:
-  output_router_logits: true
-adapter: qlora
-lora_model_dir:
-sequence_len: 32768
-sample_packing: true
-pad_to_sequence_len: true
-lora_r: 32
-lora_alpha: 16
-lora_dropout: 0.05
-lora_target_linear: true
-lora_fan_in_fan_out:
-gradient_accumulation_steps: 2
-micro_batch_size: 2
-num_epochs: 4
-optimizer: adamw_bnb_8bit
-lr_scheduler: cosine
-learning_rate: 0.0002
-train_on_inputs: false
-group_by_length: false
-bf16: true
-fp16:
-tf32: false
-gradient_checkpointing: true
-early_stopping_patience:
-resume_from_checkpoint:
-local_rank:
-logging_steps: 1
-xformers_attention:
-flash_attention: true
-warmup_steps: 10
-evals_per_epoch: 4
-eval_table_size:
-eval_max_new_tokens: 128
-saves_per_epoch: 4
-debug:
-deepspeed: deepspeed_configs/zero2.json
-weight_decay: 0.0
-fsdp:
-fsdp_config:
-special_tokens: