janbakker committed on
Commit
a51a00e
·
verified ·
1 Parent(s): ef492d4

Upload RobertaForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +127 -0
  2. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "roberta-base",
3
+ "accelerator": null,
4
+ "accumulate_grad_batches": null,
5
+ "add_context": false,
6
+ "amp_backend": null,
7
+ "amp_level": null,
8
+ "architectures": [
9
+ "RobertaForSequenceClassification"
10
+ ],
11
+ "attention_probs_dropout_prob": 0.1,
12
+ "auto_lr_find": false,
13
+ "auto_scale_batch_size": false,
14
+ "auto_select_gpus": null,
15
+ "batch_size": 32,
16
+ "benchmark": null,
17
+ "binary_clf": false,
18
+ "bos_token_id": 0,
19
+ "check_val_every_n_epoch": 1,
20
+ "checkpoint": null,
21
+ "ckpt_metric": "val_macro_f1",
22
+ "classifier_dropout": null,
23
+ "context_dir": null,
24
+ "context_doc_id": null,
25
+ "context_window": 5,
26
+ "default_root_dir": null,
27
+ "detect_anomaly": false,
28
+ "devices": "2",
29
+ "doc_pos_embeds": false,
30
+ "enable_checkpointing": true,
31
+ "enable_model_summary": true,
32
+ "enable_progress_bar": true,
33
+ "eos_token_id": 2,
34
+ "fast_dev_run": false,
35
+ "gpus": null,
36
+ "gradient_clip_algorithm": null,
37
+ "gradient_clip_val": null,
38
+ "hidden_act": "gelu",
39
+ "hidden_dropout_prob": 0.1,
40
+ "hidden_size": 768,
41
+ "id2label": {
42
+ "0": "LABEL_0",
43
+ "1": "LABEL_1",
44
+ "2": "LABEL_2",
45
+ "3": "LABEL_3",
46
+ "4": "LABEL_4"
47
+ },
48
+ "inference_mode": true,
49
+ "initializer_range": 0.02,
50
+ "intermediate_size": 3072,
51
+ "ipus": null,
52
+ "label2id": {
53
+ "LABEL_0": 0,
54
+ "LABEL_1": 1,
55
+ "LABEL_2": 2,
56
+ "LABEL_3": 3,
57
+ "LABEL_4": 4
58
+ },
59
+ "layer_norm_eps": 1e-05,
60
+ "learning_rate": 1e-05,
61
+ "left_z_only": false,
62
+ "limit_predict_batches": null,
63
+ "limit_test_batches": null,
64
+ "limit_train_batches": null,
65
+ "limit_val_batches": null,
66
+ "log_class_acc": false,
67
+ "log_every_n_steps": 50,
68
+ "logger": true,
69
+ "lr_scheduler": false,
70
+ "max_epochs": 10,
71
+ "max_length": 128,
72
+ "max_position_embeddings": 514,
73
+ "max_samples": -1,
74
+ "max_steps": -1,
75
+ "max_time": null,
76
+ "min_epochs": null,
77
+ "min_steps": null,
78
+ "model_type": "roberta",
79
+ "move_metrics_to_cpu": false,
80
+ "multiple_trainloader_mode": "max_size_cycle",
81
+ "name": "classifier-merge",
82
+ "no_context_pos": false,
83
+ "num_attention_heads": 12,
84
+ "num_hidden_layers": 12,
85
+ "num_nodes": 1,
86
+ "num_processes": null,
87
+ "num_sanity_val_steps": 2,
88
+ "overfit_batches": 0.0,
89
+ "pad_token_id": 1,
90
+ "plugins": null,
91
+ "position_embedding_type": "absolute",
92
+ "precision": 32,
93
+ "profiler": null,
94
+ "project": "planning_experiments",
95
+ "reading_lvl": null,
96
+ "regression": false,
97
+ "reload_dataloaders_every_n_epochs": 0,
98
+ "replace_sampler_ddp": true,
99
+ "resume_from_checkpoint": null,
100
+ "save_dir": null,
101
+ "second_stage": false,
102
+ "simple_context_dir": null,
103
+ "simple_context_doc_id": null,
104
+ "src_lvl": null,
105
+ "strategy": null,
106
+ "sync_batchnorm": false,
107
+ "torch_dtype": "float32",
108
+ "tpu_cores": null,
109
+ "track_grad_norm": -1,
110
+ "train_check_interval": 0.2,
111
+ "train_file": "data/cochrane_sents_train.csv",
112
+ "train_split": 0.9,
113
+ "train_workers": 8,
114
+ "transformers_version": "4.29.1",
115
+ "type_vocab_size": 1,
116
+ "upsample_classes": false,
117
+ "use_cache": true,
118
+ "use_merge_labels": true,
119
+ "val_check_interval": null,
120
+ "val_file": "data/cochrane_sents_val.csv",
121
+ "val_split": 0.05,
122
+ "val_workers": 8,
123
+ "vocab_size": 50275,
124
+ "wandb_id": null,
125
+ "x_col": "complex",
126
+ "y_col": "label"
127
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5de050f40c32a8a1ed99db466db632893dd3b2543b14782e5cd4bf1b00d3fa3
3
+ size 498702005