Commit
·
41e487b
1
Parent(s):
c5e2c6f
Upload 6 files
Browse files- .gitattributes +1 -0
- gliner_config.json +15 -14
- tokenizer.json +2 -2
.gitattributes
CHANGED
|
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
processed_output.jsonl filter=lfs diff=lfs merge=lfs -text
|
gliner_config.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"class_token_index": 256000,
|
| 3 |
"decoder_mode": null,
|
| 4 |
-
"dropout": 0.
|
| 5 |
"embed_ent_token": true,
|
| 6 |
"encoder_config": {
|
| 7 |
-
"_attn_implementation_autoset": false,
|
| 8 |
"_name_or_path": "jhu-clsp/mmBERT-base",
|
| 9 |
"add_cross_attention": false,
|
| 10 |
"architectures": [
|
|
@@ -27,6 +27,7 @@
|
|
| 27 |
"deterministic_flash_attn": false,
|
| 28 |
"diversity_penalty": 0.0,
|
| 29 |
"do_sample": false,
|
|
|
|
| 30 |
"early_stopping": false,
|
| 31 |
"embedding_dropout": 0.0,
|
| 32 |
"encoder_no_repeat_ngram_size": 0,
|
|
@@ -80,7 +81,6 @@
|
|
| 80 |
"prefix": null,
|
| 81 |
"problem_type": null,
|
| 82 |
"pruned_heads": {},
|
| 83 |
-
"reference_compile": null,
|
| 84 |
"remove_invalid_values": false,
|
| 85 |
"repad_logits_with_grad": false,
|
| 86 |
"repetition_penalty": 1.0,
|
|
@@ -98,13 +98,13 @@
|
|
| 98 |
"tokenizer_class": null,
|
| 99 |
"top_k": 50,
|
| 100 |
"top_p": 1.0,
|
| 101 |
-
"torch_dtype": "float32",
|
| 102 |
"torchscript": false,
|
| 103 |
"typical_p": 1.0,
|
| 104 |
"use_bfloat16": false,
|
| 105 |
"vocab_size": 256002
|
| 106 |
},
|
| 107 |
"ent_token": "<<ENT>>",
|
|
|
|
| 108 |
"eval_every": 500,
|
| 109 |
"fine_tune": true,
|
| 110 |
"freeze_token_rep": false,
|
|
@@ -117,25 +117,26 @@
|
|
| 117 |
"labels_decoder_config": null,
|
| 118 |
"labels_encoder": null,
|
| 119 |
"labels_encoder_config": null,
|
| 120 |
-
"log_dir": "models/
|
| 121 |
"loss_alpha": 0.75,
|
| 122 |
"loss_gamma": 0,
|
| 123 |
"loss_prob_margin": 0,
|
| 124 |
"loss_reduction": "sum",
|
| 125 |
-
"lr_encoder": "
|
| 126 |
"lr_others": "3e-5",
|
| 127 |
"masking": "none",
|
| 128 |
"max_grad_norm": 10.0,
|
| 129 |
-
"max_len":
|
| 130 |
"max_neg_type_ratio": 1,
|
| 131 |
-
"max_types":
|
| 132 |
"max_width": 12,
|
| 133 |
"model_name": "jhu-clsp/mmBERT-base",
|
| 134 |
"model_type": "gliner",
|
| 135 |
-
"name": "
|
| 136 |
"negatives": 1.0,
|
| 137 |
"num_post_fusion_layers": 1,
|
| 138 |
-
"num_steps":
|
|
|
|
| 139 |
"post_fusion_schema": null,
|
| 140 |
"prev_path": null,
|
| 141 |
"random_drop": true,
|
|
@@ -147,10 +148,10 @@
|
|
| 147 |
"size_sup": -1,
|
| 148 |
"span_mode": "markerV0",
|
| 149 |
"subtoken_pooling": "first",
|
| 150 |
-
"train_batch_size":
|
| 151 |
-
"train_data": "
|
| 152 |
-
"transformers_version": "4.
|
| 153 |
-
"
|
| 154 |
"vocab_size": 256002,
|
| 155 |
"warmup_ratio": 0.05,
|
| 156 |
"weight_decay_encoder": 0.1,
|
|
|
|
| 1 |
{
|
| 2 |
+
"bos_token_id": 2,
|
| 3 |
"class_token_index": 256000,
|
| 4 |
"decoder_mode": null,
|
| 5 |
+
"dropout": 0.3,
|
| 6 |
"embed_ent_token": true,
|
| 7 |
"encoder_config": {
|
|
|
|
| 8 |
"_name_or_path": "jhu-clsp/mmBERT-base",
|
| 9 |
"add_cross_attention": false,
|
| 10 |
"architectures": [
|
|
|
|
| 27 |
"deterministic_flash_attn": false,
|
| 28 |
"diversity_penalty": 0.0,
|
| 29 |
"do_sample": false,
|
| 30 |
+
"dtype": "float32",
|
| 31 |
"early_stopping": false,
|
| 32 |
"embedding_dropout": 0.0,
|
| 33 |
"encoder_no_repeat_ngram_size": 0,
|
|
|
|
| 81 |
"prefix": null,
|
| 82 |
"problem_type": null,
|
| 83 |
"pruned_heads": {},
|
|
|
|
| 84 |
"remove_invalid_values": false,
|
| 85 |
"repad_logits_with_grad": false,
|
| 86 |
"repetition_penalty": 1.0,
|
|
|
|
| 98 |
"tokenizer_class": null,
|
| 99 |
"top_k": 50,
|
| 100 |
"top_p": 1.0,
|
|
|
|
| 101 |
"torchscript": false,
|
| 102 |
"typical_p": 1.0,
|
| 103 |
"use_bfloat16": false,
|
| 104 |
"vocab_size": 256002
|
| 105 |
},
|
| 106 |
"ent_token": "<<ENT>>",
|
| 107 |
+
"eos_token_id": 1,
|
| 108 |
"eval_every": 500,
|
| 109 |
"fine_tune": true,
|
| 110 |
"freeze_token_rep": false,
|
|
|
|
| 117 |
"labels_decoder_config": null,
|
| 118 |
"labels_encoder": null,
|
| 119 |
"labels_encoder_config": null,
|
| 120 |
+
"log_dir": "models/",
|
| 121 |
"loss_alpha": 0.75,
|
| 122 |
"loss_gamma": 0,
|
| 123 |
"loss_prob_margin": 0,
|
| 124 |
"loss_reduction": "sum",
|
| 125 |
+
"lr_encoder": "2e-5",
|
| 126 |
"lr_others": "3e-5",
|
| 127 |
"masking": "none",
|
| 128 |
"max_grad_norm": 10.0,
|
| 129 |
+
"max_len": 2048,
|
| 130 |
"max_neg_type_ratio": 1,
|
| 131 |
+
"max_types": 200,
|
| 132 |
"max_width": 12,
|
| 133 |
"model_name": "jhu-clsp/mmBERT-base",
|
| 134 |
"model_type": "gliner",
|
| 135 |
+
"name": "span level gliner",
|
| 136 |
"negatives": 1.0,
|
| 137 |
"num_post_fusion_layers": 1,
|
| 138 |
+
"num_steps": 100000,
|
| 139 |
+
"pad_token_id": 0,
|
| 140 |
"post_fusion_schema": null,
|
| 141 |
"prev_path": null,
|
| 142 |
"random_drop": true,
|
|
|
|
| 148 |
"size_sup": -1,
|
| 149 |
"span_mode": "markerV0",
|
| 150 |
"subtoken_pooling": "first",
|
| 151 |
+
"train_batch_size": 16,
|
| 152 |
+
"train_data": "../dataset_gen/dataset_generated/processed_output.jsonl",
|
| 153 |
+
"transformers_version": "4.57.1",
|
| 154 |
+
"val_data": "../dataset_gen/dataset_generated/test_it.jsonl",
|
| 155 |
"vocab_size": 256002,
|
| 156 |
"warmup_ratio": 0.05,
|
| 157 |
"weight_decay_encoder": 0.1,
|
tokenizer.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f65190517e4633347d84e0225b8c5c66a1a62321107ebc73c09d5cefa2b5cd5
|
| 3 |
+
size 34363810
|