jamarticus committed on
Commit
4ababee
·
verified ·
1 Parent(s): 1f4e098

YurtsAI/ner-document-context

Browse files
Files changed (44) hide show
  1. README.md +425 -0
  2. added_tokens.json +4 -0
  3. config.json +601 -0
  4. merges.txt +0 -0
  5. model.safetensors +3 -0
  6. runs/Jul25_15-22-52_psicrz06tcrx/events.out.tfevents.1721921035.psicrz06tcrx.2730.0 +3 -0
  7. runs/Jul25_15-47-19_psicrz06tcrx/events.out.tfevents.1721925575.psicrz06tcrx.4445.0 +3 -0
  8. runs/Jul25_17-27-37_psicrz06tcrx/events.out.tfevents.1721931493.psicrz06tcrx.6934.0 +3 -0
  9. runs/Jul25_18-24-31_psicrz06tcrx/events.out.tfevents.1721935050.psicrz06tcrx.8437.0 +3 -0
  10. runs/Jul25_19-23-13_psicrz06tcrx/events.out.tfevents.1721938483.psicrz06tcrx.9919.0 +3 -0
  11. runs/Jul25_20-17-44_psicrz06tcrx/events.out.tfevents.1721941867.psicrz06tcrx.11356.0 +3 -0
  12. runs/Jul25_21-29-39_psicrz06tcrx/events.out.tfevents.1721946066.psicrz06tcrx.13121.0 +3 -0
  13. runs/Jul25_22-38-11_psicrz06tcrx/events.out.tfevents.1721950227.psicrz06tcrx.15014.0 +3 -0
  14. runs/Jul26_03-57-10_psicrz06tcrx/events.out.tfevents.1721967402.psicrz06tcrx.2840.0 +3 -0
  15. runs/Jul26_04-17-46_psicrz06tcrx/events.out.tfevents.1721968623.psicrz06tcrx.3465.0 +3 -0
  16. runs/Jul26_04-47-13_psicrz06tcrx/events.out.tfevents.1721970386.psicrz06tcrx.4239.0 +3 -0
  17. runs/Jul26_05-42-47_psicrz06tcrx/events.out.tfevents.1721972862.psicrz06tcrx.5582.0 +3 -0
  18. runs/Jul26_05-56-13_psicrz06tcrx/events.out.tfevents.1721973665.psicrz06tcrx.6069.0 +3 -0
  19. runs/Jul26_06-05-17_psicrz06tcrx/events.out.tfevents.1721974080.psicrz06tcrx.6704.0 +3 -0
  20. runs/Jul26_06-21-12_psicrz06tcrx/events.out.tfevents.1721975516.psicrz06tcrx.7185.0 +3 -0
  21. runs/Jul29_16-55-18_psicrz06tcrx/events.out.tfevents.1722274983.psicrz06tcrx.2807.0 +3 -0
  22. runs/Jul29_16-55-18_psicrz06tcrx/events.out.tfevents.1722433858.psicrz06tcrx.2807.1 +3 -0
  23. runs/Jun27_22-46-59_psicrz06tcrx/events.out.tfevents.1719528469.psicrz06tcrx.2869.0 +3 -0
  24. runs/Jun27_22-52-09_psicrz06tcrx/events.out.tfevents.1719528804.psicrz06tcrx.5472.0 +3 -0
  25. runs/Jun27_22-55-25_psicrz06tcrx/events.out.tfevents.1719529012.psicrz06tcrx.5678.0 +3 -0
  26. runs/Jun27_23-14-12_psicrz06tcrx/events.out.tfevents.1719530094.psicrz06tcrx.6287.0 +3 -0
  27. runs/Jun27_23-16-03_psicrz06tcrx/events.out.tfevents.1719530250.psicrz06tcrx.6427.0 +3 -0
  28. runs/Jun27_23-18-20_psicrz06tcrx/events.out.tfevents.1719530343.psicrz06tcrx.6582.0 +3 -0
  29. runs/Jun27_23-18-20_psicrz06tcrx/events.out.tfevents.1719536408.psicrz06tcrx.6582.1 +3 -0
  30. runs/Jun28_03-22-13_psicrz06tcrx/events.out.tfevents.1719544934.psicrz06tcrx.14486.0 +3 -0
  31. runs/Jun28_03-25-02_psicrz06tcrx/events.out.tfevents.1719545103.psicrz06tcrx.14639.0 +3 -0
  32. runs/Jun28_03-27-32_psicrz06tcrx/events.out.tfevents.1719545253.psicrz06tcrx.14816.0 +3 -0
  33. runs/Jun28_03-36-59_psicrz06tcrx/events.out.tfevents.1719545820.psicrz06tcrx.15209.0 +3 -0
  34. runs/Jun28_03-39-17_psicrz06tcrx/events.out.tfevents.1719545958.psicrz06tcrx.15442.0 +3 -0
  35. runs/Jun28_03-48-22_psicrz06tcrx/events.out.tfevents.1719546576.psicrz06tcrx.16041.0 +3 -0
  36. runs/Jun28_05-39-40_psicrz06tcrx/events.out.tfevents.1719553244.psicrz06tcrx.19916.0 +3 -0
  37. runs/Jun28_05-39-40_psicrz06tcrx/events.out.tfevents.1719559233.psicrz06tcrx.19916.1 +3 -0
  38. runs/Jun28_07-27-04_psicrz06tcrx/events.out.tfevents.1719559687.psicrz06tcrx.22490.0 +3 -0
  39. runs/Jun28_07-27-04_psicrz06tcrx/events.out.tfevents.1719565742.psicrz06tcrx.22490.1 +3 -0
  40. special_tokens_map.json +15 -0
  41. tokenizer.json +0 -0
  42. tokenizer_config.json +76 -0
  43. training_args.bin +3 -0
  44. vocab.json +0 -0
README.md ADDED
@@ -0,0 +1,425 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: roberta-large
3
+ datasets:
4
+ - YurtsAI/named_entity_recognition_document_context
5
+ language:
6
+ - en
7
+ library_name: span-marker
8
+ metrics:
9
+ - precision
10
+ - recall
11
+ - f1
12
+ pipeline_tag: token-classification
13
+ tags:
14
+ - span-marker
15
+ - token-classification
16
+ - ner
17
+ - named-entity-recognition
18
+ - generated_from_span_marker_trainer
19
+ widget:
20
+ - text: '* * phone call transcript: university research paper discussion * * * * date:
21
+ * * 09041942 * * time: * * 3:45 pm * * participants: * * dr. emily carter (ec)
22
+ - principal investigator dr. john smith (js) - co-investigator--- * * ec: * *
23
+ hey john, got a minute to discuss the latest draft of our paper on crispr-cas9?'
24
+ - text: monday is a chill day – beach time at barceloneta and maybe some shopping
25
+ at la rambla.
26
+ - text: don't forget to fast for at least 8 hours before the procedure – that means
27
+ no food or drink after midnight!
28
+ - text: whether it's buying a house in 5 years, saving for a killer vacation next
29
+ summer, or just building an emergency fund, write it down.
30
+ - text: '- * * full integration: * * all recipes from the rbso must be incorporated
31
+ into event menus by november 1, 2023.'
32
+ model-index:
33
+ - name: SpanMarker with roberta-large on YurtsAI/named_entity_recognition_document_context
34
+ results:
35
+ - task:
36
+ type: token-classification
37
+ name: Named Entity Recognition
38
+ dataset:
39
+ name: Unknown
40
+ type: YurtsAI/named_entity_recognition_document_context
41
+ split: eval
42
+ metrics:
43
+ - type: f1
44
+ value: 0.8349078585045542
45
+ name: F1
46
+ - type: precision
47
+ value: 0.8308950630296387
48
+ name: Precision
49
+ - type: recall
50
+ value: 0.8389596015495296
51
+ name: Recall
52
+ ---
53
+
54
+ # SpanMarker with roberta-large on YurtsAI/named_entity_recognition_document_context
55
+
56
+ This is a [SpanMarker](https://github.com/tomaarsen/SpanMarkerNER) model trained on the [YurtsAI/named_entity_recognition_document_context](https://huggingface.co/datasets/YurtsAI/named_entity_recognition_document_context) dataset that can be used for Named Entity Recognition. This SpanMarker model uses [roberta-large](https://huggingface.co/roberta-large) as the underlying encoder.
57
+
58
+ ## Model Details
59
+
60
+ ### Model Description
61
+ - **Model Type:** SpanMarker
62
+ - **Encoder:** [roberta-large](https://huggingface.co/roberta-large)
63
+ - **Maximum Sequence Length:** 256 tokens
64
+ - **Maximum Entity Length:** 11 words
65
+ - **Training Dataset:** [YurtsAI/named_entity_recognition_document_context](https://huggingface.co/datasets/YurtsAI/named_entity_recognition_document_context)
66
+ - **Language:** en
67
+ <!-- - **License:** Unknown -->
68
+
69
+ ### Model Sources
70
+
71
+ - **Repository:** [SpanMarker on GitHub](https://github.com/tomaarsen/SpanMarkerNER)
72
+ - **Thesis:** [SpanMarker For Named Entity Recognition](https://raw.githubusercontent.com/tomaarsen/SpanMarkerNER/main/thesis.pdf)
73
+
74
+ ### Model Labels
75
+ | Label | Examples |
76
+ |:--------------------------------------------------|:------------------------------------------------------------------------------------------------------------------------------|
77
+ | DATETIME__absolute | "14:00 hrs", "15th november 2023 at 10:00 am", "october 15th , 2023" |
78
+ | DATETIME__authored | "25 february 26", "sunday , 21 august , 1938", "1961-05-08" |
79
+ | DATETIME__range | "29th of oct. , 2023", "september 2021 to august 2023", "jan 2022 - dec 2022" |
80
+ | DATETIME__relative | "eod friday", "dec 15 , 11:59 pm", "10/15" |
81
+ | GENERAL__art-broadcastprogram | "stranger things", "live q & a", "product design concept sketchbook for kids" |
82
+ | GENERAL__art-film | "the crown", "kill bill", "stranger things" |
83
+ | GENERAL__art-music | |
84
+ | GENERAL__art-other | "statue of liberty", "broadway show", "wicked" |
85
+ | GENERAL__art-painting | "draw your dream house", "design a superhero costume" |
86
+ | GENERAL__art-writtenart | "optimization of quantum algorithms for cryptographic applications", "introduction to algorithms", "intro to cs '' by j. doe" |
87
+ | GENERAL__building-airport | "ory", "charles de gaulle", "cdg" |
88
+ | GENERAL__building-hospital | "green valley clinic", "department of oncology", "st. mary 's hospital" |
89
+ | GENERAL__building-hotel | "le jules verne", "hôtel ritz", "the beverly hills hotel" |
90
+ | GENERAL__building-library | "ancient library", "the grand library", "jefferson library" |
91
+ | GENERAL__building-other | "louvre museum", "engineering building", "eiffel tower" |
92
+ | GENERAL__building-restaurant | "l'ambroisie", "bella 's bistro", "in-n-out burger" |
93
+ | GENERAL__building-sportsfacility | "fenway" |
94
+ | GENERAL__building-theater | "gershwin theatre", "opera house", "broadway" |
95
+ | GENERAL__event-attack/battle/war/militaryconflict | "1863 battle of ridgefield", "battle of gettysburg", "war of 1812" |
96
+ | GENERAL__event-other | "annual science fair", "summer splash '23", "research methodology workshop" |
97
+ | GENERAL__event-sportsevent | "international olympiad in informatics", "ftx", "ioi" |
98
+ | GENERAL__location-GPE | "fr", "paris ,", "italy" |
99
+ | GENERAL__location-bodiesofwater | "river x", "river blue", "seine river" |
100
+ | GENERAL__location-island | "maldives", "similan islands", "ellis island" |
101
+ | GENERAL__location-mountain | "andes mountains", "swiss alps", "pine ridge" |
102
+ | GENERAL__location-other | "times square", "old market", "venice beach" |
103
+ | GENERAL__location-park | "central park", "ueno park", "universal studios" |
104
+ | GENERAL__location-road/railway/highway/transit | "i-95", "underground railroad", "hollywood walk of fame" |
105
+ | GENERAL__organization-company | "green earth organics", "xyz corporation", "north atlantic fisheries" |
106
+ | GENERAL__organization-education | "graduate school", "xyz", "xyz university" |
107
+ | GENERAL__organization-government/governmentagency | "department of economic development", "moe", "ministry of environment" |
108
+ | GENERAL__organization-media/newspaper | "pinterest", "yelp", "insta" |
109
+ | GENERAL__organization-other | "historical society", "grants office", "admissions committee" |
110
+ | GENERAL__organization-religion | "buddhist", "zen buddhist", "shinto" |
111
+ | GENERAL__organization-showorganization | "phare", "the soundbytes" |
112
+ | GENERAL__organization-sportsteam | "varsity soccer team", "red sox" |
113
+ | GENERAL__other-astronomything | |
114
+ | GENERAL__other-award | "team excellence award", "innovation award", "employee of the month" |
115
+ | GENERAL__other-biologything | "fodmap", "troponin i", "cmp" |
116
+ | GENERAL__other-chemicalthing | "co2", "pm2.5", "nitrate" |
117
+ | GENERAL__other-currency | "usd", "inr", "$ $ $" |
118
+ | GENERAL__other-disease | "mi", "irritable bowel syndrome", "myocardial infarction" |
119
+ | GENERAL__other-educationaldegree | "executive mba", "phd in quantum computing ,", "phd" |
120
+ | GENERAL__other-god | "inari", "athena", "inari taisha" |
121
+ | GENERAL__other-language | "french", "english", "spanish" |
122
+ | GENERAL__other-law | "cas", "clean air standards", "environmental protection act ( epa ) 2023" |
123
+ | GENERAL__other-livingthing | "eastern box turtle", "monarch butterfly", "western burrowing owl" |
124
+ | GENERAL__other-medical | "asa", "dapt", "clopidogrel" |
125
+ | GENERAL__person-artist/author | "carol", "picasso", "warhol" |
126
+ | GENERAL__person-other | "jamie", "sarah", "mark" |
127
+ | GENERAL__person-politician | "jane doe", "vespasian", "constantine i" |
128
+ | GENERAL__person-scholar | "dr. smith", "dr. lee", "dr. johnson" |
129
+ | GENERAL__person-soldier | "davis", "lt. sarah johnson", "col. r. johnson" |
130
+ | GENERAL__product-airplane | "hmmwvs", "uh-60s", "m1a2s" |
131
+ | GENERAL__product-car | "hmmwvs", "high mobility multipurpose wheeled vehicles", "mine-resistant ambush protected" |
132
+ | GENERAL__product-food | "pumpkin spice", "quinoa salad", "golden jubilee feast" |
133
+ | GENERAL__product-game | "stardew valley", "valorant", "call of duty : warzone" |
134
+ | GENERAL__product-other | "engagement metrics", "xj-200", "smart goal templates" |
135
+ | GENERAL__product-ship | "liberty island ferry", "hms victory", "thames river cruise" |
136
+ | GENERAL__product-software | "instagram", "svm", "r" |
137
+ | GENERAL__product-train | "n'ex", "shinkansen", "tgv" |
138
+ | GENERAL__product-weapon | "m1 abrams", "m4 carbine", "m4 carbines" |
139
+
140
+ ## Evaluation
141
+
142
+ ### Metrics
143
+ | Label | Precision | Recall | F1 |
144
+ |:--------------------------------------------------|:----------|:-------|:-------|
145
+ | **all** | 0.8309 | 0.8390 | 0.8349 |
146
+ | DATETIME__absolute | 0.8744 | 0.8577 | 0.8660 |
147
+ | DATETIME__authored | 0.9956 | 0.9935 | 0.9946 |
148
+ | DATETIME__range | 0.8451 | 0.9262 | 0.8838 |
149
+ | DATETIME__relative | 0.8266 | 0.7498 | 0.7863 |
150
+ | GENERAL__art-broadcastprogram | 0.6538 | 0.6296 | 0.6415 |
151
+ | GENERAL__art-film | 0.8 | 1.0 | 0.8889 |
152
+ | GENERAL__art-music | 0.0 | 0.0 | 0.0 |
153
+ | GENERAL__art-other | 0.625 | 0.7143 | 0.6667 |
154
+ | GENERAL__art-painting | 0.0 | 0.0 | 0.0 |
155
+ | GENERAL__art-writtenart | 0.7373 | 0.8047 | 0.7695 |
156
+ | GENERAL__building-airport | 0.8668 | 0.9689 | 0.9150 |
157
+ | GENERAL__building-hospital | 0.8378 | 0.9323 | 0.8826 |
158
+ | GENERAL__building-hotel | 0.7577 | 0.8603 | 0.8057 |
159
+ | GENERAL__building-library | 0.0 | 0.0 | 0.0 |
160
+ | GENERAL__building-other | 0.7597 | 0.8409 | 0.7982 |
161
+ | GENERAL__building-restaurant | 0.7953 | 0.8695 | 0.8307 |
162
+ | GENERAL__building-sportsfacility | 0.0 | 0.0 | 0.0 |
163
+ | GENERAL__building-theater | 0.6 | 0.6667 | 0.6316 |
164
+ | GENERAL__event-attack/battle/war/militaryconflict | 0.8438 | 0.9310 | 0.8852 |
165
+ | GENERAL__event-other | 0.6019 | 0.6382 | 0.6195 |
166
+ | GENERAL__event-sportsevent | 0.0 | 0.0 | 0.0 |
167
+ | GENERAL__location-GPE | 0.7232 | 0.7888 | 0.7546 |
168
+ | GENERAL__location-bodiesofwater | 0.6724 | 0.975 | 0.7959 |
169
+ | GENERAL__location-island | 0.7455 | 0.9111 | 0.8200 |
170
+ | GENERAL__location-mountain | 0.7436 | 0.8529 | 0.7945 |
171
+ | GENERAL__location-other | 0.7186 | 0.7793 | 0.7477 |
172
+ | GENERAL__location-park | 0.7899 | 0.8704 | 0.8282 |
173
+ | GENERAL__location-road/railway/highway/transit | 0.6325 | 0.7095 | 0.6688 |
174
+ | GENERAL__organization-company | 0.8665 | 0.8605 | 0.8635 |
175
+ | GENERAL__organization-education | 0.8256 | 0.8608 | 0.8428 |
176
+ | GENERAL__organization-government/governmentagency | 0.8344 | 0.8318 | 0.8331 |
177
+ | GENERAL__organization-media/newspaper | 0.6667 | 0.4 | 0.5 |
178
+ | GENERAL__organization-other | 0.7790 | 0.8105 | 0.7944 |
179
+ | GENERAL__organization-religion | 0.6667 | 0.8 | 0.7273 |
180
+ | GENERAL__organization-showorganization | 0.0 | 0.0 | 0.0 |
181
+ | GENERAL__organization-sportsteam | 0.0 | 0.0 | 0.0 |
182
+ | GENERAL__other-astronomything | 0.0 | 0.0 | 0.0 |
183
+ | GENERAL__other-award | 0.8216 | 0.8859 | 0.8525 |
184
+ | GENERAL__other-biologything | 0.7246 | 0.8961 | 0.8013 |
185
+ | GENERAL__other-chemicalthing | 0.7687 | 0.8047 | 0.7863 |
186
+ | GENERAL__other-currency | 0.6304 | 0.6744 | 0.6517 |
187
+ | GENERAL__other-disease | 0.8594 | 0.9048 | 0.8815 |
188
+ | GENERAL__other-educationaldegree | 0.7119 | 0.75 | 0.7304 |
189
+ | GENERAL__other-god | 0.8 | 0.5714 | 0.6667 |
190
+ | GENERAL__other-language | 0.6818 | 1.0 | 0.8108 |
191
+ | GENERAL__other-law | 0.7978 | 0.8462 | 0.8212 |
192
+ | GENERAL__other-livingthing | 0.7385 | 0.9320 | 0.8240 |
193
+ | GENERAL__other-medical | 0.7778 | 0.8343 | 0.8050 |
194
+ | GENERAL__person-artist/author | 0.625 | 0.3846 | 0.4762 |
195
+ | GENERAL__person-other | 0.8839 | 0.8979 | 0.8908 |
196
+ | GENERAL__person-politician | 0.7534 | 0.7432 | 0.7483 |
197
+ | GENERAL__person-scholar | 0.8640 | 0.8769 | 0.8704 |
198
+ | GENERAL__person-soldier | 0.7674 | 0.7586 | 0.7630 |
199
+ | GENERAL__product-airplane | 0.6774 | 0.6364 | 0.6562 |
200
+ | GENERAL__product-car | 0.9286 | 0.7879 | 0.8525 |
201
+ | GENERAL__product-food | 0.7798 | 0.7859 | 0.7828 |
202
+ | GENERAL__product-game | 0.75 | 0.75 | 0.75 |
203
+ | GENERAL__product-other | 0.7175 | 0.7537 | 0.7351 |
204
+ | GENERAL__product-ship | 0.0 | 0.0 | 0.0 |
205
+ | GENERAL__product-software | 0.8093 | 0.8403 | 0.8245 |
206
+ | GENERAL__product-train | 0.75 | 0.375 | 0.5 |
207
+ | GENERAL__product-weapon | 0.7794 | 0.8833 | 0.8281 |
208
+
209
+ ## Uses
210
+
211
+ ### Direct Use for Inference
212
+
213
+ ```python
214
+ from span_marker import SpanMarkerModel
215
+
216
+ # Download from the 🤗 Hub
217
+ model = SpanMarkerModel.from_pretrained("YurtsAI/ner-document-context")
218
+ # Run inference
219
+ entities = model.predict("monday is a chill day – beach time at barceloneta and maybe some shopping at la rambla.")
220
+ ```
221
+
222
+ ### Downstream Use
223
+ You can finetune this model on your own dataset.
224
+
225
+ <details><summary>Click to expand</summary>
226
+
227
+ ```python
228
+ from datasets import load_dataset
+ from span_marker import SpanMarkerModel, Trainer
229
+
230
+ # Download from the 🤗 Hub
231
+ model = SpanMarkerModel.from_pretrained("YurtsAI/ner-document-context")
232
+
233
+ # Specify a Dataset with "tokens" and "ner_tags" columns
234
+ dataset = load_dataset("conll2003") # For example CoNLL2003
235
+
236
+ # Initialize a Trainer using the pretrained model & dataset
237
+ trainer = Trainer(
238
+ model=model,
239
+ train_dataset=dataset["train"],
240
+ eval_dataset=dataset["validation"],
241
+ )
242
+ trainer.train()
243
+ trainer.save_model("YurtsAI/ner-document-context-finetuned")
244
+ ```
245
+ </details>
246
+
247
+ <!--
248
+ ### Out-of-Scope Use
249
+
250
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
251
+ -->
252
+
253
+ <!--
254
+ ## Bias, Risks and Limitations
255
+
256
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
257
+ -->
258
+
259
+ <!--
260
+ ### Recommendations
261
+
262
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
263
+ -->
264
+
265
+ ## Training Details
266
+
267
+ ### Training Set Metrics
268
+ | Training set | Min | Mean | Max |
269
+ |:----------------------|:----|:--------|:----|
270
+ | Sentence length | 1 | 14.6796 | 691 |
271
+ | Entities per sentence | 0 | 0.4235 | 35 |
272
+
273
+ ### Training Hyperparameters
274
+ - learning_rate: 1e-05
275
+ - train_batch_size: 32
276
+ - eval_batch_size: 32
277
+ - seed: 42
278
+ - gradient_accumulation_steps: 2
279
+ - total_train_batch_size: 64
280
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
281
+ - lr_scheduler_type: linear
282
+ - lr_scheduler_warmup_ratio: 0.1
283
+ - num_epochs: 3
284
+
285
+ ### Training Results
286
+ | Epoch | Step | Validation Loss | Validation Precision | Validation Recall | Validation F1 | Validation Accuracy |
287
+ |:------:|:-----:|:---------------:|:--------------------:|:-----------------:|:-------------:|:-------------------:|
288
+ | 0.0299 | 500 | 0.0254 | 0.5244 | 0.0116 | 0.0228 | 0.9292 |
289
+ | 0.0597 | 1000 | 0.0144 | 0.5380 | 0.3492 | 0.4235 | 0.9444 |
290
+ | 0.0896 | 1500 | 0.0099 | 0.7134 | 0.4410 | 0.5450 | 0.9534 |
291
+ | 0.1194 | 2000 | 0.0088 | 0.6461 | 0.6571 | 0.6516 | 0.9596 |
292
+ | 0.1493 | 2500 | 0.0074 | 0.7177 | 0.6363 | 0.6745 | 0.9628 |
293
+ | 0.1791 | 3000 | 0.0075 | 0.6612 | 0.7342 | 0.6958 | 0.9637 |
294
+ | 0.2090 | 3500 | 0.0073 | 0.6686 | 0.7286 | 0.6973 | 0.9634 |
295
+ | 0.2388 | 4000 | 0.0061 | 0.7552 | 0.7044 | 0.7289 | 0.9693 |
296
+ | 0.2687 | 4500 | 0.0062 | 0.7385 | 0.7150 | 0.7266 | 0.9682 |
297
+ | 0.2986 | 5000 | 0.0070 | 0.6667 | 0.7792 | 0.7186 | 0.9654 |
298
+ | 0.3284 | 5500 | 0.0063 | 0.6984 | 0.7774 | 0.7358 | 0.9689 |
299
+ | 0.3583 | 6000 | 0.0055 | 0.7941 | 0.7023 | 0.7454 | 0.9706 |
300
+ | 0.3881 | 6500 | 0.0055 | 0.7540 | 0.7640 | 0.7589 | 0.9722 |
301
+ | 0.4180 | 7000 | 0.0053 | 0.7700 | 0.7614 | 0.7657 | 0.9732 |
302
+ | 0.4478 | 7500 | 0.0053 | 0.7791 | 0.7698 | 0.7744 | 0.9742 |
303
+ | 0.4777 | 8000 | 0.0054 | 0.7396 | 0.8062 | 0.7715 | 0.9729 |
304
+ | 0.5075 | 8500 | 0.0051 | 0.7653 | 0.7944 | 0.7796 | 0.9741 |
305
+ | 0.5374 | 9000 | 0.0050 | 0.7773 | 0.7844 | 0.7808 | 0.9747 |
306
+ | 0.5672 | 9500 | 0.0049 | 0.7954 | 0.7711 | 0.7830 | 0.9757 |
307
+ | 0.5971 | 10000 | 0.0049 | 0.7844 | 0.7876 | 0.7860 | 0.9754 |
308
+ | 0.6270 | 10500 | 0.0047 | 0.7898 | 0.7940 | 0.7919 | 0.9761 |
309
+ | 0.6568 | 11000 | 0.0047 | 0.7852 | 0.7929 | 0.7890 | 0.9761 |
310
+ | 0.6867 | 11500 | 0.0047 | 0.8001 | 0.7908 | 0.7954 | 0.9770 |
311
+ | 0.7165 | 12000 | 0.0050 | 0.7643 | 0.8145 | 0.7886 | 0.9755 |
312
+ | 0.7464 | 12500 | 0.0047 | 0.7991 | 0.7892 | 0.7941 | 0.9764 |
313
+ | 0.7762 | 13000 | 0.0046 | 0.7948 | 0.8084 | 0.8015 | 0.9774 |
314
+ | 0.8061 | 13500 | 0.0046 | 0.7841 | 0.8154 | 0.7994 | 0.9771 |
315
+ | 0.8359 | 14000 | 0.0043 | 0.8283 | 0.7776 | 0.8021 | 0.9783 |
316
+ | 0.8658 | 14500 | 0.0044 | 0.8054 | 0.7993 | 0.8023 | 0.9773 |
317
+ | 0.8957 | 15000 | 0.0047 | 0.7704 | 0.8152 | 0.7922 | 0.9758 |
318
+ | 0.9255 | 15500 | 0.0043 | 0.8018 | 0.8149 | 0.8083 | 0.9782 |
319
+ | 0.9554 | 16000 | 0.0043 | 0.8255 | 0.7938 | 0.8093 | 0.9789 |
320
+ | 0.9852 | 16500 | 0.0042 | 0.8201 | 0.8008 | 0.8104 | 0.9787 |
321
+ | 1.0151 | 17000 | 0.0044 | 0.7947 | 0.8175 | 0.8059 | 0.9784 |
322
+ | 1.0449 | 17500 | 0.0044 | 0.7942 | 0.8195 | 0.8066 | 0.9777 |
323
+ | 1.0748 | 18000 | 0.0043 | 0.8124 | 0.8110 | 0.8117 | 0.9789 |
324
+ | 1.1046 | 18500 | 0.0043 | 0.7987 | 0.8157 | 0.8071 | 0.9788 |
325
+ | 1.1345 | 19000 | 0.0043 | 0.8037 | 0.8171 | 0.8103 | 0.9789 |
326
+ | 1.1644 | 19500 | 0.0042 | 0.8178 | 0.8076 | 0.8127 | 0.9796 |
327
+ | 1.1942 | 20000 | 0.0044 | 0.7803 | 0.8389 | 0.8085 | 0.9780 |
328
+ | 1.2241 | 20500 | 0.0043 | 0.8040 | 0.8210 | 0.8124 | 0.9790 |
329
+ | 1.2539 | 21000 | 0.0043 | 0.8038 | 0.8245 | 0.8141 | 0.9788 |
330
+ | 1.2838 | 21500 | 0.0041 | 0.8318 | 0.7973 | 0.8142 | 0.9794 |
331
+ | 1.3136 | 22000 | 0.0041 | 0.8106 | 0.8211 | 0.8158 | 0.9796 |
332
+ | 1.3435 | 22500 | 0.0041 | 0.8288 | 0.8046 | 0.8165 | 0.9796 |
333
+ | 1.3733 | 23000 | 0.0041 | 0.8218 | 0.8170 | 0.8194 | 0.9799 |
334
+ | 1.4032 | 23500 | 0.0042 | 0.8164 | 0.8171 | 0.8168 | 0.9799 |
335
+ | 1.4330 | 24000 | 0.0041 | 0.8105 | 0.8248 | 0.8176 | 0.9793 |
336
+ | 1.4629 | 24500 | 0.0042 | 0.8073 | 0.8196 | 0.8134 | 0.9791 |
337
+ | 1.4928 | 25000 | 0.0040 | 0.8211 | 0.8162 | 0.8187 | 0.9797 |
338
+ | 1.5226 | 25500 | 0.0040 | 0.8195 | 0.8225 | 0.8210 | 0.9800 |
339
+ | 1.5525 | 26000 | 0.0040 | 0.8372 | 0.8018 | 0.8191 | 0.9799 |
340
+ | 1.5823 | 26500 | 0.0040 | 0.8263 | 0.8161 | 0.8212 | 0.9802 |
341
+ | 1.6122 | 27000 | 0.0039 | 0.8275 | 0.8141 | 0.8208 | 0.9802 |
342
+ | 1.6420 | 27500 | 0.0040 | 0.8264 | 0.8198 | 0.8231 | 0.9804 |
343
+ | 1.6719 | 28000 | 0.0040 | 0.8218 | 0.8195 | 0.8206 | 0.9799 |
344
+ | 1.7017 | 28500 | 0.0039 | 0.8286 | 0.8195 | 0.8240 | 0.9803 |
345
+ | 1.7316 | 29000 | 0.0041 | 0.8004 | 0.8357 | 0.8177 | 0.9788 |
346
+ | 1.7615 | 29500 | 0.0040 | 0.8138 | 0.8304 | 0.8220 | 0.9801 |
347
+ | 1.7913 | 30000 | 0.0040 | 0.8160 | 0.8309 | 0.8234 | 0.9804 |
348
+ | 1.8212 | 30500 | 0.0039 | 0.8204 | 0.8262 | 0.8233 | 0.9802 |
349
+ | 1.8510 | 31000 | 0.0038 | 0.8292 | 0.8228 | 0.8260 | 0.9810 |
350
+ | 1.8809 | 31500 | 0.0039 | 0.8247 | 0.8246 | 0.8246 | 0.9806 |
351
+ | 1.9107 | 32000 | 0.0038 | 0.8267 | 0.8258 | 0.8262 | 0.9810 |
352
+ | 1.9406 | 32500 | 0.0039 | 0.8102 | 0.8398 | 0.8248 | 0.9805 |
353
+ | 1.9704 | 33000 | 0.0039 | 0.8321 | 0.8185 | 0.8253 | 0.9809 |
354
+ | 2.0003 | 33500 | 0.0038 | 0.8325 | 0.8261 | 0.8293 | 0.9814 |
355
+ | 2.0302 | 34000 | 0.0038 | 0.8352 | 0.8228 | 0.8289 | 0.9813 |
356
+ | 2.0600 | 34500 | 0.0041 | 0.8144 | 0.8369 | 0.8255 | 0.9809 |
357
+ | 2.0899 | 35000 | 0.0039 | 0.8274 | 0.8281 | 0.8277 | 0.9813 |
358
+ | 2.1197 | 35500 | 0.0039 | 0.8198 | 0.8353 | 0.8275 | 0.9812 |
359
+ | 2.1496 | 36000 | 0.0039 | 0.8211 | 0.8358 | 0.8284 | 0.9811 |
360
+ | 2.1794 | 36500 | 0.0039 | 0.8242 | 0.8300 | 0.8271 | 0.9809 |
361
+ | 2.2093 | 37000 | 0.0039 | 0.8194 | 0.8317 | 0.8255 | 0.9808 |
362
+ | 2.2391 | 37500 | 0.0039 | 0.8258 | 0.8344 | 0.8301 | 0.9814 |
363
+ | 2.2690 | 38000 | 0.0039 | 0.8292 | 0.8302 | 0.8297 | 0.9816 |
364
+ | 2.2989 | 38500 | 0.0039 | 0.8281 | 0.8315 | 0.8298 | 0.9813 |
365
+ | 2.3287 | 39000 | 0.0039 | 0.8174 | 0.8386 | 0.8279 | 0.9808 |
366
+ | 2.3586 | 39500 | 0.0039 | 0.8208 | 0.8364 | 0.8285 | 0.9810 |
367
+ | 2.3884 | 40000 | 0.0039 | 0.8230 | 0.8379 | 0.8304 | 0.9815 |
368
+ | 2.4183 | 40500 | 0.0038 | 0.8355 | 0.8273 | 0.8314 | 0.9816 |
369
+ | 2.4481 | 41000 | 0.0038 | 0.8290 | 0.8347 | 0.8319 | 0.9816 |
370
+ | 2.4780 | 41500 | 0.0038 | 0.8233 | 0.8403 | 0.8317 | 0.9815 |
371
+ | 2.5078 | 42000 | 0.0039 | 0.8186 | 0.8417 | 0.8300 | 0.9814 |
372
+ | 2.5377 | 42500 | 0.0038 | 0.8321 | 0.8343 | 0.8332 | 0.9818 |
373
+ | 2.5675 | 43000 | 0.0038 | 0.8239 | 0.8396 | 0.8317 | 0.9816 |
374
+ | 2.5974 | 43500 | 0.0038 | 0.8267 | 0.8378 | 0.8322 | 0.9816 |
375
+ | 2.6273 | 44000 | 0.0038 | 0.8325 | 0.8343 | 0.8334 | 0.9818 |
376
+ | 2.6571 | 44500 | 0.0038 | 0.8254 | 0.8399 | 0.8326 | 0.9817 |
377
+ | 2.6870 | 45000 | 0.0038 | 0.8339 | 0.8338 | 0.8339 | 0.9820 |
378
+ | 2.7168 | 45500 | 0.0038 | 0.8301 | 0.8381 | 0.8341 | 0.9819 |
379
+ | 2.7467 | 46000 | 0.0038 | 0.8309 | 0.8371 | 0.8340 | 0.9818 |
380
+ | 2.7765 | 46500 | 0.0038 | 0.8296 | 0.8377 | 0.8337 | 0.9817 |
381
+ | 2.8064 | 47000 | 0.0037 | 0.8337 | 0.8349 | 0.8343 | 0.9820 |
382
+ | 2.8362 | 47500 | 0.0037 | 0.8303 | 0.8387 | 0.8345 | 0.9820 |
383
+ | 2.8661 | 48000 | 0.0037 | 0.8289 | 0.8401 | 0.8344 | 0.9819 |
384
+ | 2.8960 | 48500 | 0.0037 | 0.8299 | 0.8400 | 0.8349 | 0.9820 |
385
+ | 2.9258 | 49000 | 0.0037 | 0.8289 | 0.8401 | 0.8344 | 0.9819 |
386
+ | 2.9557 | 49500 | 0.0037 | 0.8322 | 0.8380 | 0.8351 | 0.9821 |
387
+ | 2.9855 | 50000 | 0.0037 | 0.8312 | 0.8384 | 0.8348 | 0.9820 |
388
+
389
+ ### Framework Versions
390
+ - Python: 3.11.7
391
+ - SpanMarker: 1.5.0
392
+ - Transformers: 4.42.1
393
+ - PyTorch: 2.1.1+cu121
394
+ - Datasets: 2.14.5
395
+ - Tokenizers: 0.19.1
396
+
397
+ ## Citation
398
+
399
+ ### BibTeX
400
+ ```
401
+ @software{Aarsen_SpanMarker,
402
+ author = {Aarsen, Tom},
403
+ license = {Apache-2.0},
404
+ title = {{SpanMarker for Named Entity Recognition}},
405
+ url = {https://github.com/tomaarsen/SpanMarkerNER}
406
+ }
407
+ ```
408
+
409
+ <!--
410
+ ## Glossary
411
+
412
+ *Clearly define terms in order to be accessible across audiences.*
413
+ -->
414
+
415
+ <!--
416
+ ## Model Card Authors
417
+
418
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
419
+ -->
420
+
421
+ <!--
422
+ ## Model Card Contact
423
+
424
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
425
+ -->
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<end>": 50266,
3
+ "<start>": 50265
4
+ }
config.json ADDED
@@ -0,0 +1,601 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "SpanMarkerModel"
4
+ ],
5
+ "encoder": {
6
+ "_name_or_path": "roberta-large",
7
+ "add_cross_attention": false,
8
+ "architectures": [
9
+ "RobertaForMaskedLM"
10
+ ],
11
+ "attention_probs_dropout_prob": 0.1,
12
+ "bad_words_ids": null,
13
+ "begin_suppress_tokens": null,
14
+ "bos_token_id": 0,
15
+ "chunk_size_feed_forward": 0,
16
+ "classifier_dropout": null,
17
+ "cross_attention_hidden_size": null,
18
+ "decoder_start_token_id": null,
19
+ "diversity_penalty": 0.0,
20
+ "do_sample": false,
21
+ "early_stopping": false,
22
+ "encoder_no_repeat_ngram_size": 0,
23
+ "eos_token_id": 2,
24
+ "exponential_decay_length_penalty": null,
25
+ "finetuning_task": null,
26
+ "forced_bos_token_id": null,
27
+ "forced_eos_token_id": null,
28
+ "hidden_act": "gelu",
29
+ "hidden_dropout_prob": 0.1,
30
+ "hidden_size": 1024,
31
+ "id2label": {
32
+ "0": "O",
33
+ "1": "B-GENERAL__organization-showorganization",
34
+ "2": "I-GENERAL__organization-showorganization",
35
+ "3": "B-GENERAL__product-airplane",
36
+ "4": "I-GENERAL__product-airplane",
37
+ "5": "B-GENERAL__art-film",
38
+ "6": "I-GENERAL__art-film",
39
+ "7": "B-GENERAL__building-theater",
40
+ "8": "I-GENERAL__building-theater",
41
+ "9": "B-GENERAL__art-other",
42
+ "10": "I-GENERAL__art-other",
43
+ "11": "B-GENERAL__other-disease",
44
+ "12": "I-GENERAL__other-disease",
45
+ "13": "B-GENERAL__person-artist/author",
46
+ "14": "I-GENERAL__person-artist/author",
47
+ "15": "B-GENERAL__other-biologything",
48
+ "16": "I-GENERAL__other-biologything",
49
+ "17": "B-GENERAL__organization-media/newspaper",
50
+ "18": "I-GENERAL__organization-media/newspaper",
51
+ "19": "B-GENERAL__product-food",
52
+ "20": "I-GENERAL__product-food",
53
+ "21": "B-GENERAL__building-hotel",
54
+ "22": "I-GENERAL__building-hotel",
55
+ "23": "B-GENERAL__other-chemicalthing",
56
+ "24": "I-GENERAL__other-chemicalthing",
57
+ "25": "B-GENERAL__organization-other",
58
+ "26": "I-GENERAL__organization-other",
59
+ "27": "B-GENERAL__organization-religion",
60
+ "28": "I-GENERAL__organization-religion",
61
+ "29": "B-GENERAL__building-sportsfacility",
62
+ "30": "I-GENERAL__building-sportsfacility",
63
+ "31": "B-GENERAL__person-other",
64
+ "32": "I-GENERAL__person-other",
65
+ "33": "B-GENERAL__building-hospital",
66
+ "34": "I-GENERAL__building-hospital",
67
+ "35": "B-GENERAL__product-weapon",
68
+ "36": "I-GENERAL__product-weapon",
69
+ "37": "B-GENERAL__person-politician",
70
+ "38": "I-GENERAL__person-politician",
71
+ "39": "B-GENERAL__product-software",
72
+ "40": "I-GENERAL__product-software",
73
+ "41": "B-GENERAL__person-scholar",
74
+ "42": "I-GENERAL__person-scholar",
75
+ "43": "B-DATETIME__relative",
76
+ "44": "I-DATETIME__relative",
77
+ "45": "B-GENERAL__other-law",
78
+ "46": "I-GENERAL__other-law",
79
+ "47": "B-GENERAL__event-other",
80
+ "48": "I-GENERAL__event-other",
81
+ "49": "B-GENERAL__location-bodiesofwater",
82
+ "50": "I-GENERAL__location-bodiesofwater",
83
+ "51": "B-GENERAL__organization-government/governmentagency",
84
+ "52": "I-GENERAL__organization-government/governmentagency",
85
+ "53": "B-DATETIME__range",
86
+ "54": "I-DATETIME__range",
87
+ "55": "B-GENERAL__product-ship",
88
+ "56": "I-GENERAL__product-ship",
89
+ "57": "B-GENERAL__other-livingthing",
90
+ "58": "I-GENERAL__other-livingthing",
91
+ "59": "B-GENERAL__product-car",
92
+ "60": "I-GENERAL__product-car",
93
+ "61": "B-GENERAL__product-game",
94
+ "62": "I-GENERAL__product-game",
95
+ "63": "B-DATETIME__authored",
96
+ "64": "I-DATETIME__authored",
97
+ "65": "B-GENERAL__building-other",
98
+ "66": "I-GENERAL__building-other",
99
+ "67": "B-GENERAL__other-language",
100
+ "68": "I-GENERAL__other-language",
101
+ "69": "B-GENERAL__other-astronomything",
102
+ "70": "I-GENERAL__other-astronomything",
103
+ "71": "B-GENERAL__building-library",
104
+ "72": "I-GENERAL__building-library",
105
+ "73": "B-GENERAL__product-train",
106
+ "74": "I-GENERAL__product-train",
107
+ "75": "B-GENERAL__location-other",
108
+ "76": "I-GENERAL__location-other",
109
+ "77": "B-GENERAL__building-airport",
110
+ "78": "I-GENERAL__building-airport",
111
+ "79": "B-GENERAL__other-god",
112
+ "80": "I-GENERAL__other-god",
113
+ "81": "B-GENERAL__art-painting",
114
+ "82": "I-GENERAL__art-painting",
115
+ "83": "B-GENERAL__other-educationaldegree",
116
+ "84": "I-GENERAL__other-educationaldegree",
117
+ "85": "B-GENERAL__art-music",
118
+ "86": "I-GENERAL__art-music",
119
+ "87": "B-GENERAL__art-writtenart",
120
+ "88": "I-GENERAL__art-writtenart",
121
+ "89": "B-GENERAL__building-restaurant",
122
+ "90": "I-GENERAL__building-restaurant",
123
+ "91": "B-GENERAL__art-broadcastprogram",
124
+ "92": "I-GENERAL__art-broadcastprogram",
125
+ "93": "B-GENERAL__location-island",
126
+ "94": "I-GENERAL__location-island",
127
+ "95": "B-DATETIME__absolute",
128
+ "96": "I-DATETIME__absolute",
129
+ "97": "B-GENERAL__organization-sportsteam",
130
+ "98": "I-GENERAL__organization-sportsteam",
131
+ "99": "B-GENERAL__event-attack/battle/war/militaryconflict",
132
+ "100": "I-GENERAL__event-attack/battle/war/militaryconflict",
133
+ "101": "B-GENERAL__product-other",
134
+ "102": "I-GENERAL__product-other",
135
+ "103": "B-GENERAL__other-award",
136
+ "104": "I-GENERAL__other-award",
137
+ "105": "B-GENERAL__location-GPE",
138
+ "106": "I-GENERAL__location-GPE",
139
+ "107": "B-GENERAL__person-soldier",
140
+ "108": "I-GENERAL__person-soldier",
141
+ "109": "B-GENERAL__location-mountain",
142
+ "110": "I-GENERAL__location-mountain",
143
+ "111": "B-GENERAL__event-sportsevent",
144
+ "112": "I-GENERAL__event-sportsevent",
145
+ "113": "B-GENERAL__location-road/railway/highway/transit",
146
+ "114": "I-GENERAL__location-road/railway/highway/transit",
147
+ "115": "B-GENERAL__other-medical",
148
+ "116": "I-GENERAL__other-medical",
149
+ "117": "B-GENERAL__organization-education",
150
+ "118": "I-GENERAL__organization-education",
151
+ "119": "B-GENERAL__organization-company",
152
+ "120": "I-GENERAL__organization-company",
153
+ "121": "B-GENERAL__other-currency",
154
+ "122": "I-GENERAL__other-currency",
155
+ "123": "B-GENERAL__location-park",
156
+ "124": "I-GENERAL__location-park"
157
+ },
158
+ "initializer_range": 0.02,
159
+ "intermediate_size": 4096,
160
+ "is_decoder": false,
161
+ "is_encoder_decoder": false,
162
+ "label2id": {
163
+ "B-DATETIME__absolute": 95,
164
+ "B-DATETIME__authored": 63,
165
+ "B-DATETIME__range": 53,
166
+ "B-DATETIME__relative": 43,
167
+ "B-GENERAL__art-broadcastprogram": 91,
168
+ "B-GENERAL__art-film": 5,
169
+ "B-GENERAL__art-music": 85,
170
+ "B-GENERAL__art-other": 9,
171
+ "B-GENERAL__art-painting": 81,
172
+ "B-GENERAL__art-writtenart": 87,
173
+ "B-GENERAL__building-airport": 77,
174
+ "B-GENERAL__building-hospital": 33,
175
+ "B-GENERAL__building-hotel": 21,
176
+ "B-GENERAL__building-library": 71,
177
+ "B-GENERAL__building-other": 65,
178
+ "B-GENERAL__building-restaurant": 89,
179
+ "B-GENERAL__building-sportsfacility": 29,
180
+ "B-GENERAL__building-theater": 7,
181
+ "B-GENERAL__event-attack/battle/war/militaryconflict": 99,
182
+ "B-GENERAL__event-other": 47,
183
+ "B-GENERAL__event-sportsevent": 111,
184
+ "B-GENERAL__location-GPE": 105,
185
+ "B-GENERAL__location-bodiesofwater": 49,
186
+ "B-GENERAL__location-island": 93,
187
+ "B-GENERAL__location-mountain": 109,
188
+ "B-GENERAL__location-other": 75,
189
+ "B-GENERAL__location-park": 123,
190
+ "B-GENERAL__location-road/railway/highway/transit": 113,
191
+ "B-GENERAL__organization-company": 119,
192
+ "B-GENERAL__organization-education": 117,
193
+ "B-GENERAL__organization-government/governmentagency": 51,
194
+ "B-GENERAL__organization-media/newspaper": 17,
195
+ "B-GENERAL__organization-other": 25,
196
+ "B-GENERAL__organization-religion": 27,
197
+ "B-GENERAL__organization-showorganization": 1,
198
+ "B-GENERAL__organization-sportsteam": 97,
199
+ "B-GENERAL__other-astronomything": 69,
200
+ "B-GENERAL__other-award": 103,
201
+ "B-GENERAL__other-biologything": 15,
202
+ "B-GENERAL__other-chemicalthing": 23,
203
+ "B-GENERAL__other-currency": 121,
204
+ "B-GENERAL__other-disease": 11,
205
+ "B-GENERAL__other-educationaldegree": 83,
206
+ "B-GENERAL__other-god": 79,
207
+ "B-GENERAL__other-language": 67,
208
+ "B-GENERAL__other-law": 45,
209
+ "B-GENERAL__other-livingthing": 57,
210
+ "B-GENERAL__other-medical": 115,
211
+ "B-GENERAL__person-artist/author": 13,
212
+ "B-GENERAL__person-other": 31,
213
+ "B-GENERAL__person-politician": 37,
214
+ "B-GENERAL__person-scholar": 41,
215
+ "B-GENERAL__person-soldier": 107,
216
+ "B-GENERAL__product-airplane": 3,
217
+ "B-GENERAL__product-car": 59,
218
+ "B-GENERAL__product-food": 19,
219
+ "B-GENERAL__product-game": 61,
220
+ "B-GENERAL__product-other": 101,
221
+ "B-GENERAL__product-ship": 55,
222
+ "B-GENERAL__product-software": 39,
223
+ "B-GENERAL__product-train": 73,
224
+ "B-GENERAL__product-weapon": 35,
225
+ "I-DATETIME__absolute": 96,
226
+ "I-DATETIME__authored": 64,
227
+ "I-DATETIME__range": 54,
228
+ "I-DATETIME__relative": 44,
229
+ "I-GENERAL__art-broadcastprogram": 92,
230
+ "I-GENERAL__art-film": 6,
231
+ "I-GENERAL__art-music": 86,
232
+ "I-GENERAL__art-other": 10,
233
+ "I-GENERAL__art-painting": 82,
234
+ "I-GENERAL__art-writtenart": 88,
235
+ "I-GENERAL__building-airport": 78,
236
+ "I-GENERAL__building-hospital": 34,
237
+ "I-GENERAL__building-hotel": 22,
238
+ "I-GENERAL__building-library": 72,
239
+ "I-GENERAL__building-other": 66,
240
+ "I-GENERAL__building-restaurant": 90,
241
+ "I-GENERAL__building-sportsfacility": 30,
242
+ "I-GENERAL__building-theater": 8,
243
+ "I-GENERAL__event-attack/battle/war/militaryconflict": 100,
244
+ "I-GENERAL__event-other": 48,
245
+ "I-GENERAL__event-sportsevent": 112,
246
+ "I-GENERAL__location-GPE": 106,
247
+ "I-GENERAL__location-bodiesofwater": 50,
248
+ "I-GENERAL__location-island": 94,
249
+ "I-GENERAL__location-mountain": 110,
250
+ "I-GENERAL__location-other": 76,
251
+ "I-GENERAL__location-park": 124,
252
+ "I-GENERAL__location-road/railway/highway/transit": 114,
253
+ "I-GENERAL__organization-company": 120,
254
+ "I-GENERAL__organization-education": 118,
255
+ "I-GENERAL__organization-government/governmentagency": 52,
256
+ "I-GENERAL__organization-media/newspaper": 18,
257
+ "I-GENERAL__organization-other": 26,
258
+ "I-GENERAL__organization-religion": 28,
259
+ "I-GENERAL__organization-showorganization": 2,
260
+ "I-GENERAL__organization-sportsteam": 98,
261
+ "I-GENERAL__other-astronomything": 70,
262
+ "I-GENERAL__other-award": 104,
263
+ "I-GENERAL__other-biologything": 16,
264
+ "I-GENERAL__other-chemicalthing": 24,
265
+ "I-GENERAL__other-currency": 122,
266
+ "I-GENERAL__other-disease": 12,
267
+ "I-GENERAL__other-educationaldegree": 84,
268
+ "I-GENERAL__other-god": 80,
269
+ "I-GENERAL__other-language": 68,
270
+ "I-GENERAL__other-law": 46,
271
+ "I-GENERAL__other-livingthing": 58,
272
+ "I-GENERAL__other-medical": 116,
273
+ "I-GENERAL__person-artist/author": 14,
274
+ "I-GENERAL__person-other": 32,
275
+ "I-GENERAL__person-politician": 38,
276
+ "I-GENERAL__person-scholar": 42,
277
+ "I-GENERAL__person-soldier": 108,
278
+ "I-GENERAL__product-airplane": 4,
279
+ "I-GENERAL__product-car": 60,
280
+ "I-GENERAL__product-food": 20,
281
+ "I-GENERAL__product-game": 62,
282
+ "I-GENERAL__product-other": 102,
283
+ "I-GENERAL__product-ship": 56,
284
+ "I-GENERAL__product-software": 40,
285
+ "I-GENERAL__product-train": 74,
286
+ "I-GENERAL__product-weapon": 36,
287
+ "O": 0
288
+ },
289
+ "layer_norm_eps": 1e-05,
290
+ "length_penalty": 1.0,
291
+ "max_length": 20,
292
+ "max_position_embeddings": 514,
293
+ "min_length": 0,
294
+ "model_type": "roberta",
295
+ "no_repeat_ngram_size": 0,
296
+ "num_attention_heads": 16,
297
+ "num_beam_groups": 1,
298
+ "num_beams": 1,
299
+ "num_hidden_layers": 24,
300
+ "num_return_sequences": 1,
301
+ "output_attentions": false,
302
+ "output_hidden_states": false,
303
+ "output_scores": false,
304
+ "pad_token_id": 1,
305
+ "position_embedding_type": "absolute",
306
+ "prefix": null,
307
+ "problem_type": null,
308
+ "pruned_heads": {},
309
+ "remove_invalid_values": false,
310
+ "repetition_penalty": 1.0,
311
+ "return_dict": true,
312
+ "return_dict_in_generate": false,
313
+ "sep_token_id": null,
314
+ "suppress_tokens": null,
315
+ "task_specific_params": null,
316
+ "temperature": 1.0,
317
+ "tf_legacy_loss": false,
318
+ "tie_encoder_decoder": false,
319
+ "tie_word_embeddings": true,
320
+ "tokenizer_class": null,
321
+ "top_k": 50,
322
+ "top_p": 1.0,
323
+ "torch_dtype": null,
324
+ "torchscript": false,
325
+ "transformers_version": "4.42.1",
326
+ "type_vocab_size": 1,
327
+ "typical_p": 1.0,
328
+ "use_bfloat16": false,
329
+ "use_cache": true,
330
+ "vocab_size": 50272
331
+ },
332
+ "entity_max_length": 11,
333
+ "id2label": {
334
+ "0": "O",
335
+ "1": "DATETIME__absolute",
336
+ "2": "DATETIME__authored",
337
+ "3": "DATETIME__range",
338
+ "4": "DATETIME__relative",
339
+ "5": "GENERAL__art-broadcastprogram",
340
+ "6": "GENERAL__art-film",
341
+ "7": "GENERAL__art-music",
342
+ "8": "GENERAL__art-other",
343
+ "9": "GENERAL__art-painting",
344
+ "10": "GENERAL__art-writtenart",
345
+ "11": "GENERAL__building-airport",
346
+ "12": "GENERAL__building-hospital",
347
+ "13": "GENERAL__building-hotel",
348
+ "14": "GENERAL__building-library",
349
+ "15": "GENERAL__building-other",
350
+ "16": "GENERAL__building-restaurant",
351
+ "17": "GENERAL__building-sportsfacility",
352
+ "18": "GENERAL__building-theater",
353
+ "19": "GENERAL__event-attack/battle/war/militaryconflict",
354
+ "20": "GENERAL__event-other",
355
+ "21": "GENERAL__event-sportsevent",
356
+ "22": "GENERAL__location-GPE",
357
+ "23": "GENERAL__location-bodiesofwater",
358
+ "24": "GENERAL__location-island",
359
+ "25": "GENERAL__location-mountain",
360
+ "26": "GENERAL__location-other",
361
+ "27": "GENERAL__location-park",
362
+ "28": "GENERAL__location-road/railway/highway/transit",
363
+ "29": "GENERAL__organization-company",
364
+ "30": "GENERAL__organization-education",
365
+ "31": "GENERAL__organization-government/governmentagency",
366
+ "32": "GENERAL__organization-media/newspaper",
367
+ "33": "GENERAL__organization-other",
368
+ "34": "GENERAL__organization-religion",
369
+ "35": "GENERAL__organization-showorganization",
370
+ "36": "GENERAL__organization-sportsteam",
371
+ "37": "GENERAL__other-astronomything",
372
+ "38": "GENERAL__other-award",
373
+ "39": "GENERAL__other-biologything",
374
+ "40": "GENERAL__other-chemicalthing",
375
+ "41": "GENERAL__other-currency",
376
+ "42": "GENERAL__other-disease",
377
+ "43": "GENERAL__other-educationaldegree",
378
+ "44": "GENERAL__other-god",
379
+ "45": "GENERAL__other-language",
380
+ "46": "GENERAL__other-law",
381
+ "47": "GENERAL__other-livingthing",
382
+ "48": "GENERAL__other-medical",
383
+ "49": "GENERAL__person-artist/author",
384
+ "50": "GENERAL__person-other",
385
+ "51": "GENERAL__person-politician",
386
+ "52": "GENERAL__person-scholar",
387
+ "53": "GENERAL__person-soldier",
388
+ "54": "GENERAL__product-airplane",
389
+ "55": "GENERAL__product-car",
390
+ "56": "GENERAL__product-food",
391
+ "57": "GENERAL__product-game",
392
+ "58": "GENERAL__product-other",
393
+ "59": "GENERAL__product-ship",
394
+ "60": "GENERAL__product-software",
395
+ "61": "GENERAL__product-train",
396
+ "62": "GENERAL__product-weapon"
397
+ },
398
+ "id2reduced_id": {
399
+ "0": 0,
400
+ "1": 35,
401
+ "2": 35,
402
+ "3": 54,
403
+ "4": 54,
404
+ "5": 6,
405
+ "6": 6,
406
+ "7": 18,
407
+ "8": 18,
408
+ "9": 8,
409
+ "10": 8,
410
+ "11": 42,
411
+ "12": 42,
412
+ "13": 49,
413
+ "14": 49,
414
+ "15": 39,
415
+ "16": 39,
416
+ "17": 32,
417
+ "18": 32,
418
+ "19": 56,
419
+ "20": 56,
420
+ "21": 13,
421
+ "22": 13,
422
+ "23": 40,
423
+ "24": 40,
424
+ "25": 33,
425
+ "26": 33,
426
+ "27": 34,
427
+ "28": 34,
428
+ "29": 17,
429
+ "30": 17,
430
+ "31": 50,
431
+ "32": 50,
432
+ "33": 12,
433
+ "34": 12,
434
+ "35": 62,
435
+ "36": 62,
436
+ "37": 51,
437
+ "38": 51,
438
+ "39": 60,
439
+ "40": 60,
440
+ "41": 52,
441
+ "42": 52,
442
+ "43": 4,
443
+ "44": 4,
444
+ "45": 46,
445
+ "46": 46,
446
+ "47": 20,
447
+ "48": 20,
448
+ "49": 23,
449
+ "50": 23,
450
+ "51": 31,
451
+ "52": 31,
452
+ "53": 3,
453
+ "54": 3,
454
+ "55": 59,
455
+ "56": 59,
456
+ "57": 47,
457
+ "58": 47,
458
+ "59": 55,
459
+ "60": 55,
460
+ "61": 57,
461
+ "62": 57,
462
+ "63": 2,
463
+ "64": 2,
464
+ "65": 15,
465
+ "66": 15,
466
+ "67": 45,
467
+ "68": 45,
468
+ "69": 37,
469
+ "70": 37,
470
+ "71": 14,
471
+ "72": 14,
472
+ "73": 61,
473
+ "74": 61,
474
+ "75": 26,
475
+ "76": 26,
476
+ "77": 11,
477
+ "78": 11,
478
+ "79": 44,
479
+ "80": 44,
480
+ "81": 9,
481
+ "82": 9,
482
+ "83": 43,
483
+ "84": 43,
484
+ "85": 7,
485
+ "86": 7,
486
+ "87": 10,
487
+ "88": 10,
488
+ "89": 16,
489
+ "90": 16,
490
+ "91": 5,
491
+ "92": 5,
492
+ "93": 24,
493
+ "94": 24,
494
+ "95": 1,
495
+ "96": 1,
496
+ "97": 36,
497
+ "98": 36,
498
+ "99": 19,
499
+ "100": 19,
500
+ "101": 58,
501
+ "102": 58,
502
+ "103": 38,
503
+ "104": 38,
504
+ "105": 22,
505
+ "106": 22,
506
+ "107": 53,
507
+ "108": 53,
508
+ "109": 25,
509
+ "110": 25,
510
+ "111": 21,
511
+ "112": 21,
512
+ "113": 28,
513
+ "114": 28,
514
+ "115": 48,
515
+ "116": 48,
516
+ "117": 30,
517
+ "118": 30,
518
+ "119": 29,
519
+ "120": 29,
520
+ "121": 41,
521
+ "122": 41,
522
+ "123": 27,
523
+ "124": 27
524
+ },
525
+ "label2id": {
526
+ "DATETIME__absolute": 1,
527
+ "DATETIME__authored": 2,
528
+ "DATETIME__range": 3,
529
+ "DATETIME__relative": 4,
530
+ "GENERAL__art-broadcastprogram": 5,
531
+ "GENERAL__art-film": 6,
532
+ "GENERAL__art-music": 7,
533
+ "GENERAL__art-other": 8,
534
+ "GENERAL__art-painting": 9,
535
+ "GENERAL__art-writtenart": 10,
536
+ "GENERAL__building-airport": 11,
537
+ "GENERAL__building-hospital": 12,
538
+ "GENERAL__building-hotel": 13,
539
+ "GENERAL__building-library": 14,
540
+ "GENERAL__building-other": 15,
541
+ "GENERAL__building-restaurant": 16,
542
+ "GENERAL__building-sportsfacility": 17,
543
+ "GENERAL__building-theater": 18,
544
+ "GENERAL__event-attack/battle/war/militaryconflict": 19,
545
+ "GENERAL__event-other": 20,
546
+ "GENERAL__event-sportsevent": 21,
547
+ "GENERAL__location-GPE": 22,
548
+ "GENERAL__location-bodiesofwater": 23,
549
+ "GENERAL__location-island": 24,
550
+ "GENERAL__location-mountain": 25,
551
+ "GENERAL__location-other": 26,
552
+ "GENERAL__location-park": 27,
553
+ "GENERAL__location-road/railway/highway/transit": 28,
554
+ "GENERAL__organization-company": 29,
555
+ "GENERAL__organization-education": 30,
556
+ "GENERAL__organization-government/governmentagency": 31,
557
+ "GENERAL__organization-media/newspaper": 32,
558
+ "GENERAL__organization-other": 33,
559
+ "GENERAL__organization-religion": 34,
560
+ "GENERAL__organization-showorganization": 35,
561
+ "GENERAL__organization-sportsteam": 36,
562
+ "GENERAL__other-astronomything": 37,
563
+ "GENERAL__other-award": 38,
564
+ "GENERAL__other-biologything": 39,
565
+ "GENERAL__other-chemicalthing": 40,
566
+ "GENERAL__other-currency": 41,
567
+ "GENERAL__other-disease": 42,
568
+ "GENERAL__other-educationaldegree": 43,
569
+ "GENERAL__other-god": 44,
570
+ "GENERAL__other-language": 45,
571
+ "GENERAL__other-law": 46,
572
+ "GENERAL__other-livingthing": 47,
573
+ "GENERAL__other-medical": 48,
574
+ "GENERAL__person-artist/author": 49,
575
+ "GENERAL__person-other": 50,
576
+ "GENERAL__person-politician": 51,
577
+ "GENERAL__person-scholar": 52,
578
+ "GENERAL__person-soldier": 53,
579
+ "GENERAL__product-airplane": 54,
580
+ "GENERAL__product-car": 55,
581
+ "GENERAL__product-food": 56,
582
+ "GENERAL__product-game": 57,
583
+ "GENERAL__product-other": 58,
584
+ "GENERAL__product-ship": 59,
585
+ "GENERAL__product-software": 60,
586
+ "GENERAL__product-train": 61,
587
+ "GENERAL__product-weapon": 62,
588
+ "O": 0
589
+ },
590
+ "marker_max_length": 128,
591
+ "max_next_context": 3,
592
+ "max_prev_context": 3,
593
+ "model_max_length": 256,
594
+ "model_max_length_default": 512,
595
+ "model_type": "span-marker",
596
+ "span_marker_version": "1.5.0",
597
+ "torch_dtype": "float32",
598
+ "trained_with_document_context": true,
599
+ "transformers_version": "4.42.1",
600
+ "vocab_size": 50272
601
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f90acf25156c1fe2bac2dbae39e12f875b7f1e69e5ae4de5515426ee18cc712e
3
+ size 1422032220
runs/Jul25_15-22-52_psicrz06tcrx/events.out.tfevents.1721921035.psicrz06tcrx.2730.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52e59ca3a7dd89dac6340a4697f2c8d166c2eb6c53ec37d3d6362bbc3eccaee5
3
+ size 20568
runs/Jul25_15-47-19_psicrz06tcrx/events.out.tfevents.1721925575.psicrz06tcrx.4445.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b040aae965e7f8c2c8ef2b02b3c582a7a7185464bf99c95e91da7376952dcb94
3
+ size 25981
runs/Jul25_17-27-37_psicrz06tcrx/events.out.tfevents.1721931493.psicrz06tcrx.6934.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:452ce54c564eaf1a5268c91fb4a81ef3d307446593bc2e5cc4e63c45993267a9
3
+ size 24085
runs/Jul25_18-24-31_psicrz06tcrx/events.out.tfevents.1721935050.psicrz06tcrx.8437.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91e1641d6f06e6339367a50e9cf68a02229e57ec8c123201272df6e07374fe04
3
+ size 23876
runs/Jul25_19-23-13_psicrz06tcrx/events.out.tfevents.1721938483.psicrz06tcrx.9919.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ac37ba55955c95f0da7a60b3fda48006dfc33a2c4fda5d3bf07fde0f732c6b4
3
+ size 23876
runs/Jul25_20-17-44_psicrz06tcrx/events.out.tfevents.1721941867.psicrz06tcrx.11356.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ce108be42a94a7fd45609980120d8225ecc2e89ce5ce05ea0256084527e1b8e
3
+ size 23876
runs/Jul25_21-29-39_psicrz06tcrx/events.out.tfevents.1721946066.psicrz06tcrx.13121.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:737a1f21f87c2df38db3e61e5c6c363106bd92031f68bc5969f6b7967e9f3b8a
3
+ size 23876
runs/Jul25_22-38-11_psicrz06tcrx/events.out.tfevents.1721950227.psicrz06tcrx.15014.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44316e2d8a16ed42da18a009d1115cb93a2909751a291e66ba0d400b9b917900
3
+ size 23876
runs/Jul26_03-57-10_psicrz06tcrx/events.out.tfevents.1721967402.psicrz06tcrx.2840.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a2a879eb25e7a6b21066d99f574f1aa97a4bff156a993f88cb59d9d70b74a81
3
+ size 23876
runs/Jul26_04-17-46_psicrz06tcrx/events.out.tfevents.1721968623.psicrz06tcrx.3465.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea3d24ed8b9d827a4b7020da1c1a4c1c0d585cceb0919990196a51f612d7717
3
+ size 23876
runs/Jul26_04-47-13_psicrz06tcrx/events.out.tfevents.1721970386.psicrz06tcrx.4239.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d95c32fac3827298d97958653b2748619fb368e9c4e6e616264d0eb33aa4721
3
+ size 23876
runs/Jul26_05-42-47_psicrz06tcrx/events.out.tfevents.1721972862.psicrz06tcrx.5582.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b634f0f6a2ce435e43c5fd9073e56417cf0ea2c41d206688da259128dfbc518
3
+ size 24501
runs/Jul26_05-56-13_psicrz06tcrx/events.out.tfevents.1721973665.psicrz06tcrx.6069.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28a2413c9b5c52eb5c4210f63f2053efd0e3b6cc23858bf96bf5fa8cbbec03dd
3
+ size 23876
runs/Jul26_06-05-17_psicrz06tcrx/events.out.tfevents.1721974080.psicrz06tcrx.6704.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c7471b4711a7c357010b108afe667cd878a7633244627e2c5f5f765b774d6a6
3
+ size 26693
runs/Jul26_06-21-12_psicrz06tcrx/events.out.tfevents.1721975516.psicrz06tcrx.7185.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8783de5bc0a30f12b8b6780a6a75a959f6a74fb7a707ff3682ffb4bcb252abb7
3
+ size 55236
runs/Jul29_16-55-18_psicrz06tcrx/events.out.tfevents.1722274983.psicrz06tcrx.2807.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92485a1c688ea52ee7250251137f911ee6721c49f955657fca6433b2c01aeab3
3
+ size 289794
runs/Jul29_16-55-18_psicrz06tcrx/events.out.tfevents.1722433858.psicrz06tcrx.2807.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dfef784cc8055821a9e9209c4722e3a4a6007fe61c1afffe268ed5fd58d5df9
3
+ size 601
runs/Jun27_22-46-59_psicrz06tcrx/events.out.tfevents.1719528469.psicrz06tcrx.2869.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b55e7ff2a5a99b9e5e111fdc19c22583af74e6859a4ba75574b29436709675b4
3
+ size 20568
runs/Jun27_22-52-09_psicrz06tcrx/events.out.tfevents.1719528804.psicrz06tcrx.5472.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3050396dd8e2fb3076078a5a2407f07821d45be4b639f80d29721a39f4b0e80
3
+ size 20568
runs/Jun27_22-55-25_psicrz06tcrx/events.out.tfevents.1719529012.psicrz06tcrx.5678.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bc9c4d8de06647ed987b28f6f94119e27badd1b2c22c39e60e4fb6195470de5
3
+ size 22266
runs/Jun27_23-14-12_psicrz06tcrx/events.out.tfevents.1719530094.psicrz06tcrx.6287.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db0611b0d4895da32124018f4a3b2c67c25b2a7485bf8d35faf9ad5c6002e015
3
+ size 22112
runs/Jun27_23-16-03_psicrz06tcrx/events.out.tfevents.1719530250.psicrz06tcrx.6427.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc266ee740aa5da851cea3604a73a3209097ccf1784c0088db7e4850e4699271
3
+ size 22112
runs/Jun27_23-18-20_psicrz06tcrx/events.out.tfevents.1719530343.psicrz06tcrx.6582.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9083a891cd67a05109207fc7c294f16e8c570bd3c2856997653d376ecc14aee
3
+ size 25319
runs/Jun27_23-18-20_psicrz06tcrx/events.out.tfevents.1719536408.psicrz06tcrx.6582.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92e0936b3ddf68c67afbd9431eb5f2faa83ece51053915b5320971b0a0905bc9
3
+ size 592
runs/Jun28_03-22-13_psicrz06tcrx/events.out.tfevents.1719544934.psicrz06tcrx.14486.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cbe80ece93d089bcf9ecf1686ef9ad4659610be293b4cfaee816dd8238ff2a2
3
+ size 22460
runs/Jun28_03-25-02_psicrz06tcrx/events.out.tfevents.1719545103.psicrz06tcrx.14639.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49719404464201a780d814d1927ad30e9b23293120eab588950eff605db8f7ea
3
+ size 22460
runs/Jun28_03-27-32_psicrz06tcrx/events.out.tfevents.1719545253.psicrz06tcrx.14816.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e57c8c6a30f5cb06420f5bd6c3a066bdd123407ca77063f475fc589fa66c4fb4
3
+ size 22460
runs/Jun28_03-36-59_psicrz06tcrx/events.out.tfevents.1719545820.psicrz06tcrx.15209.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9225461bfd6b4f2940f881b27b85c1eb8a3895bee784f02c5280ff86e2d1e95
3
+ size 23084
runs/Jun28_03-39-17_psicrz06tcrx/events.out.tfevents.1719545958.psicrz06tcrx.15442.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b69b5ce12a07c3293c23b422585d745093dc44c6d50a7e4a2162a0b8b90c693
3
+ size 23084
runs/Jun28_03-48-22_psicrz06tcrx/events.out.tfevents.1719546576.psicrz06tcrx.16041.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1334144f69087ad109f2a802800b3e88704a39cd9ded41235c145a5feb21016
3
+ size 26751
runs/Jun28_05-39-40_psicrz06tcrx/events.out.tfevents.1719553244.psicrz06tcrx.19916.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5f43603554103aeb808582be034fc3b0360b3965216ebf8681371415db102bb
3
+ size 26775
runs/Jun28_05-39-40_psicrz06tcrx/events.out.tfevents.1719559233.psicrz06tcrx.19916.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f2e77f2c7eaad45da8e136fec59c452f82cc044a16eaf52d360fac3f515271a
3
+ size 592
runs/Jun28_07-27-04_psicrz06tcrx/events.out.tfevents.1719559687.psicrz06tcrx.22490.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d66f6f570c7af92d8cf9bd861c2c62cefcc5537d080d959e41af4b2b70740b9
3
+ size 26775
runs/Jun28_07-27-04_psicrz06tcrx/events.out.tfevents.1719565742.psicrz06tcrx.22490.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e869a26aefd97eada56159682985f1c7861f6f9411e5106e4ea5134cfcd68cf1
3
+ size 592
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "50264": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "50265": {
45
+ "content": "<start>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "50266": {
53
+ "content": "<end>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ }
60
+ },
61
+ "bos_token": "<s>",
62
+ "clean_up_tokenization_spaces": true,
63
+ "cls_token": "<s>",
64
+ "entity_max_length": 11,
65
+ "eos_token": "</s>",
66
+ "errors": "replace",
67
+ "mask_token": "<mask>",
68
+ "max_next_context": 3,
69
+ "max_prev_context": 3,
70
+ "model_max_length": 256,
71
+ "pad_token": "<pad>",
72
+ "sep_token": "</s>",
73
+ "tokenizer_class": "RobertaTokenizer",
74
+ "trim_offsets": true,
75
+ "unk_token": "<unk>"
76
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73d701fd2e73a55f082849661dae0d32bfc005a3037029705c7a995027d1474
3
+ size 5176
vocab.json ADDED
The diff for this file is too large to render. See raw diff