ArneBinder committed on
Commit
b267f1b
·
verified ·
1 Parent(s): bcbef4e

upload models/dataset-sciarg/task-adur/cluster/2025-03-12_02-12-01

Browse files

model is from: https://github.com/ArneBinder/pie-document-level/pull/410#issuecomment-2711611125
- evaluated on SciArg validation set (from sciarg_prepared_with_fixed_validation_and_more_train)
- selection based on relaxed_span=true and criterion=span: idx 4

Files changed (3) hide show
  1. config.json +43 -43
  2. pytorch_model.bin +2 -2
  3. taskmodule_config.json +18 -18
config.json CHANGED
@@ -1,47 +1,47 @@
1
  {
2
- "model_type": "TokenClassificationModelWithSeq2SeqEncoderAndCrf",
3
- "model_name_or_path": "allenai/scibert_scivocab_uncased",
4
- "num_classes": 7,
5
- "learning_rate": 5e-05,
6
- "task_learning_rate": 0.005,
7
- "use_crf": true,
8
- "label_pad_id": -100,
9
- "special_token_label_id": 0,
10
- "classifier_dropout": null,
11
- "freeze_base_model": false,
12
- "warmup_proportion": 0.1,
13
- "seq2seq_encoder": {
14
- "type": "sequential",
15
- "drop0": {
16
- "type": "dropout",
17
- "p": 0.5
18
- },
19
- "lstm0": {
20
- "type": "lstm",
21
- "num_layers": 2,
22
- "bidirectional": true,
23
- "hidden_size": 300,
24
- "dropout": 0.4394
25
- }
26
- },
27
- "taskmodule_config": {
28
- "taskmodule_type": "LabeledSpanExtractionByTokenClassificationTaskModule",
29
- "tokenizer_name_or_path": "allenai/scibert_scivocab_uncased",
30
- "span_annotation": "labeled_spans",
31
- "partition_annotation": "labeled_partitions",
32
  "label_pad_id": -100,
33
- "labels": [
34
- "background_claim",
35
- "data",
36
- "own_claim"
37
- ],
38
- "include_ill_formed_predictions": true,
39
- "tokenize_kwargs": {
40
- "max_length": 512,
41
- "stride": 64,
42
- "return_overflowing_tokens": true
 
 
 
 
 
 
 
43
  },
44
- "pad_kwargs": null,
45
- "log_precision_recall_metrics": true
46
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
 
1
  {
2
+ "model_type": "TokenClassificationModelWithSeq2SeqEncoderAndCrf",
3
+ "model_name_or_path": "allenai/scibert_scivocab_uncased",
4
+ "num_classes": 7,
5
+ "learning_rate": 5e-05,
6
+ "task_learning_rate": 0.01,
7
+ "use_crf": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
  "label_pad_id": -100,
9
+ "special_token_label_id": 0,
10
+ "classifier_dropout": null,
11
+ "freeze_base_model": true,
12
+ "warmup_proportion": 0.1,
13
+ "seq2seq_encoder": {
14
+ "type": "sequential",
15
+ "drop0": {
16
+ "type": "dropout",
17
+ "p": 0.5
18
+ },
19
+ "lstm0": {
20
+ "type": "lstm",
21
+ "num_layers": 2,
22
+ "bidirectional": true,
23
+ "hidden_size": 300,
24
+ "dropout": 0.4394
25
+ }
26
  },
27
+ "taskmodule_config": {
28
+ "taskmodule_type": "LabeledSpanExtractionByTokenClassificationTaskModule",
29
+ "tokenizer_name_or_path": "allenai/scibert_scivocab_uncased",
30
+ "span_annotation": "labeled_spans",
31
+ "partition_annotation": "labeled_partitions",
32
+ "label_pad_id": -100,
33
+ "labels": [
34
+ "background_claim",
35
+ "data",
36
+ "own_claim"
37
+ ],
38
+ "include_ill_formed_predictions": true,
39
+ "tokenize_kwargs": {
40
+ "max_length": 512,
41
+ "stride": 64,
42
+ "return_overflowing_tokens": true
43
+ },
44
+ "pad_kwargs": null,
45
+ "log_precision_recall_metrics": true
46
+ }
47
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a183e009828e2fd988f97e52b5fd5a4f1eca39b65abc97b35b99498f7b0d9930
3
- size 458710913
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89133bb2f468981542946e3f5b19d3b80c3dd326e35a97a2a865ceba2c930297
3
+ size 458711358
taskmodule_config.json CHANGED
@@ -1,20 +1,20 @@
1
  {
2
- "taskmodule_type": "LabeledSpanExtractionByTokenClassificationTaskModule",
3
- "tokenizer_name_or_path": "allenai/scibert_scivocab_uncased",
4
- "span_annotation": "labeled_spans",
5
- "partition_annotation": "labeled_partitions",
6
- "label_pad_id": -100,
7
- "labels": [
8
- "background_claim",
9
- "data",
10
- "own_claim"
11
- ],
12
- "include_ill_formed_predictions": true,
13
- "tokenize_kwargs": {
14
- "max_length": 512,
15
- "stride": 64,
16
- "return_overflowing_tokens": true
17
- },
18
- "pad_kwargs": null,
19
- "log_precision_recall_metrics": true
20
  }
 
1
  {
2
+ "taskmodule_type": "LabeledSpanExtractionByTokenClassificationTaskModule",
3
+ "tokenizer_name_or_path": "allenai/scibert_scivocab_uncased",
4
+ "span_annotation": "labeled_spans",
5
+ "partition_annotation": "labeled_partitions",
6
+ "label_pad_id": -100,
7
+ "labels": [
8
+ "background_claim",
9
+ "data",
10
+ "own_claim"
11
+ ],
12
+ "include_ill_formed_predictions": true,
13
+ "tokenize_kwargs": {
14
+ "max_length": 512,
15
+ "stride": 64,
16
+ "return_overflowing_tokens": true
17
+ },
18
+ "pad_kwargs": null,
19
+ "log_precision_recall_metrics": true
20
  }