DeepMount00 committed on
Commit
41e487b
·
1 Parent(s): c5e2c6f

Upload 6 files

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. gliner_config.json +15 -14
  3. tokenizer.json +2 -2
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ processed_output.jsonl filter=lfs diff=lfs merge=lfs -text
gliner_config.json CHANGED
@@ -1,10 +1,10 @@
1
  {
 
2
  "class_token_index": 256000,
3
  "decoder_mode": null,
4
- "dropout": 0.4,
5
  "embed_ent_token": true,
6
  "encoder_config": {
7
- "_attn_implementation_autoset": false,
8
  "_name_or_path": "jhu-clsp/mmBERT-base",
9
  "add_cross_attention": false,
10
  "architectures": [
@@ -27,6 +27,7 @@
27
  "deterministic_flash_attn": false,
28
  "diversity_penalty": 0.0,
29
  "do_sample": false,
 
30
  "early_stopping": false,
31
  "embedding_dropout": 0.0,
32
  "encoder_no_repeat_ngram_size": 0,
@@ -80,7 +81,6 @@
80
  "prefix": null,
81
  "problem_type": null,
82
  "pruned_heads": {},
83
- "reference_compile": null,
84
  "remove_invalid_values": false,
85
  "repad_logits_with_grad": false,
86
  "repetition_penalty": 1.0,
@@ -98,13 +98,13 @@
98
  "tokenizer_class": null,
99
  "top_k": 50,
100
  "top_p": 1.0,
101
- "torch_dtype": "float32",
102
  "torchscript": false,
103
  "typical_p": 1.0,
104
  "use_bfloat16": false,
105
  "vocab_size": 256002
106
  },
107
  "ent_token": "<<ENT>>",
 
108
  "eval_every": 500,
109
  "fine_tune": true,
110
  "freeze_token_rep": false,
@@ -117,25 +117,26 @@
117
  "labels_decoder_config": null,
118
  "labels_encoder": null,
119
  "labels_encoder_config": null,
120
- "log_dir": "models/mmbert_gliner",
121
  "loss_alpha": 0.75,
122
  "loss_gamma": 0,
123
  "loss_prob_margin": 0,
124
  "loss_reduction": "sum",
125
- "lr_encoder": "5e-6",
126
  "lr_others": "3e-5",
127
  "masking": "none",
128
  "max_grad_norm": 10.0,
129
- "max_len": 8192,
130
  "max_neg_type_ratio": 1,
131
- "max_types": 100,
132
  "max_width": 12,
133
  "model_name": "jhu-clsp/mmBERT-base",
134
  "model_type": "gliner",
135
- "name": "mmBERT GLiNER NER",
136
  "negatives": 1.0,
137
  "num_post_fusion_layers": 1,
138
- "num_steps": 150,
 
139
  "post_fusion_schema": null,
140
  "prev_path": null,
141
  "random_drop": true,
@@ -147,10 +148,10 @@
147
  "size_sup": -1,
148
  "span_mode": "markerV0",
149
  "subtoken_pooling": "first",
150
- "train_batch_size": 4,
151
- "train_data": "data/sample_data.json",
152
- "transformers_version": "4.48.1",
153
- "val_data_dir": "none",
154
  "vocab_size": 256002,
155
  "warmup_ratio": 0.05,
156
  "weight_decay_encoder": 0.1,
 
1
  {
2
+ "bos_token_id": 2,
3
  "class_token_index": 256000,
4
  "decoder_mode": null,
5
+ "dropout": 0.3,
6
  "embed_ent_token": true,
7
  "encoder_config": {
 
8
  "_name_or_path": "jhu-clsp/mmBERT-base",
9
  "add_cross_attention": false,
10
  "architectures": [
 
27
  "deterministic_flash_attn": false,
28
  "diversity_penalty": 0.0,
29
  "do_sample": false,
30
+ "dtype": "float32",
31
  "early_stopping": false,
32
  "embedding_dropout": 0.0,
33
  "encoder_no_repeat_ngram_size": 0,
 
81
  "prefix": null,
82
  "problem_type": null,
83
  "pruned_heads": {},
 
84
  "remove_invalid_values": false,
85
  "repad_logits_with_grad": false,
86
  "repetition_penalty": 1.0,
 
98
  "tokenizer_class": null,
99
  "top_k": 50,
100
  "top_p": 1.0,
 
101
  "torchscript": false,
102
  "typical_p": 1.0,
103
  "use_bfloat16": false,
104
  "vocab_size": 256002
105
  },
106
  "ent_token": "<<ENT>>",
107
+ "eos_token_id": 1,
108
  "eval_every": 500,
109
  "fine_tune": true,
110
  "freeze_token_rep": false,
 
117
  "labels_decoder_config": null,
118
  "labels_encoder": null,
119
  "labels_encoder_config": null,
120
+ "log_dir": "models/",
121
  "loss_alpha": 0.75,
122
  "loss_gamma": 0,
123
  "loss_prob_margin": 0,
124
  "loss_reduction": "sum",
125
+ "lr_encoder": "2e-5",
126
  "lr_others": "3e-5",
127
  "masking": "none",
128
  "max_grad_norm": 10.0,
129
+ "max_len": 2048,
130
  "max_neg_type_ratio": 1,
131
+ "max_types": 200,
132
  "max_width": 12,
133
  "model_name": "jhu-clsp/mmBERT-base",
134
  "model_type": "gliner",
135
+ "name": "span level gliner",
136
  "negatives": 1.0,
137
  "num_post_fusion_layers": 1,
138
+ "num_steps": 100000,
139
+ "pad_token_id": 0,
140
  "post_fusion_schema": null,
141
  "prev_path": null,
142
  "random_drop": true,
 
148
  "size_sup": -1,
149
  "span_mode": "markerV0",
150
  "subtoken_pooling": "first",
151
+ "train_batch_size": 16,
152
+ "train_data": "../dataset_gen/dataset_generated/processed_output.jsonl",
153
+ "transformers_version": "4.57.1",
154
+ "val_data": "../dataset_gen/dataset_generated/test_it.jsonl",
155
  "vocab_size": 256002,
156
  "warmup_ratio": 0.05,
157
  "weight_decay_encoder": 0.1,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f2b1a08c8ba688f939cadfd317ae894cbca471c1e54cf9b14157244c318732d
3
- size 34363556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f65190517e4633347d84e0225b8c5c66a1a62321107ebc73c09d5cefa2b5cd5
3
+ size 34363810