---
# Configuration for the `sentiment_classifier` model of the `ts-train` project:
# model/tokenizer settings, training hyper-parameters, data sources and
# project-level paths/logging.
#
# NOTE(review): the nesting in this file is inferred from key names. All keys
# and values are unchanged, but the placements flagged with NOTE(review) below
# should be confirmed against the schema of the code that loads this file.

model:
  name: sentiment_classifier
  type: classification

  model:
    pretrained_model: xlm-roberta-base
    num_labels: 3  # equals the number of entries in `labels`
    dropout: 0.1
    hidden_size: 768
    # NOTE(review): `labels` and `class_weights` may instead be siblings of
    # this inner `model` mapping -- confirm.
    labels:
      - negative
      - neutral
      - positive
    class_weights: null

  tokenizer:
    max_length: 256
    padding: max_length
    truncation: true
    add_special_tokens: true

  huggingface_hub:
    enabled: true
    repo_id: anpmts/sentiment-classifier
    private: false
    create_model_card: true
    commit_message: Upload sentiment classifier model
    model_card:
      language: multilingual
      license: apache-2.0
      tags:
        - sentiment-analysis
        - text-classification
        - xlm-roberta
        - sequence-classification
      datasets: null

training:
  epochs: 10
  batch_size: 128
  gradient_accumulation_steps: 1
  max_grad_norm: 1.0

  distributed:
    enabled: true
    backend: nccl
    find_unused_parameters: true

  precision:
    mode: bf16

  performance:
    torch_compile: false
    compile_mode: reduce-overhead
    cudnn_benchmark: true
    gradient_checkpointing: false
    tf32: true
    flash_attention_2: false
    matmul_precision: high
    channels_last: false

  optimizer:
    type: adamw
    lr: 2.0e-05
    weight_decay: 0.01
    eps: 1.0e-08
    betas:
      - 0.9
      - 0.999
    fused: false

  scheduler:
    type: cosine
    warmup_ratio: 0.1
    warmup_steps: null
    num_cycles: 0.5

  early_stopping:
    enabled: true
    patience: 3
    min_delta: 0.001
    monitor: val_loss
    mode: min

  # Uses the same monitor/mode pair as `early_stopping` above.
  checkpoint:
    save_top_k: 2
    monitor: val_loss
    mode: min
    save_last: true
    every_n_epochs: 1
    resume_from_checkpoint: true
    pretrained_checkpoint: null
    load_only_model: true

  eval:
    eval_every_n_steps: null
    eval_accumulation_steps: 1

  dataloader:
    num_workers: 0
    pin_memory: true
    persistent_workers: false
    prefetch_factor: null

  # NOTE(review): placed at `training` level because these do not read as
  # data-loader options; they may belong under `dataloader` -- confirm.
  deterministic: false
  benchmark: true

data:
  data_source: local

  chunked:
    enabled: false
    train_path: data/amazon_reviews/train
    val_path: data/amazon_reviews/validation
    test_path: data/amazon_reviews/test
    chunk_size: 100000
    total_train_samples: 3600000
    # NOTE(review): the two field names may instead live directly under
    # `data` -- confirm.
    text_field: text
    label_field: sentiment_label

  huggingface:
    repo: anpmts/trustshop
    split_mapping:
      train: train
      val: validation
      test: test
    field_mapping:
      text: text
      sentiment_label: sentiment_label
      sentiment_score: sentiment_score
      quality_label: quality
    config_name: null
    revision: null
    max_samples: null

  local:
    data_dir: data/amazon_reviews
    processed_dir: data/processed/amazon_reviews
    # The three fractions sum to 1.0.
    split:
      train: 0.7
      val: 0.15
      test: 0.15
      # NOTE(review): `stratify` may be a sibling of `split` -- confirm.
      stratify: true

  filter_quality:
    enabled: false
    keep_labels:
      - valid

  class_balancing:
    enabled: false
    strategy: oversample
    oversample:
      sampling_strategy: auto
    smote:
      k_neighbors: 5
      sampling_strategy: auto

  augmentation:
    enabled: false
    techniques:
      - synonym_replacement
      - random_deletion
      - random_swap
    augment_ratio: 0.1

  preprocessing:
    lowercase: false
    remove_urls: true
    remove_email: true
    remove_special_chars: false
    min_text_length: 10

  cache:
    enabled: true
    cache_dir: data/.cache/amazon_reviews

  # NOTE(review): placed at `data` level; it may belong under `cache`.
  # Same value as `project.seed`.
  seed: 42

  validation:
    check_missing_fields: false
    check_empty_text: true
    log_invalid_samples: true

project:
  name: ts-train
  seed: 42
  device: cuda
  mixed_precision: true

paths:
  data_dir: data
  data_file: data/output.jsonl
  output_dir: outputs
  model_dir: models
  log_dir: logs

logging:
  use_wandb: true
  wandb_project: ts-absa-classification
  wandb_entity: null
  use_tensorboard: true
  log_interval: 10

experiment:
  name: null
  tags: []
  notes: ''