Add new SentenceTransformer model
Browse files- 1_Pooling/config.json +10 -0
- README.md +1022 -0
- config.json +47 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +37 -0
- tokenizer.json +0 -0
- tokenizer_config.json +945 -0
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
ADDED
|
@@ -0,0 +1,1022 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:3619
|
| 8 |
+
- loss:CachedMultipleNegativesRankingLoss
|
| 9 |
+
base_model: nomic-ai/modernbert-embed-base
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: What is the meaning of the pattern code 128 in the table?
|
| 12 |
+
sentences:
|
| 13 |
+
- "epevents\nThe following table may serve as a quick reference to select certain\n\
|
| 14 |
+
pattern types of recognized events (i.e. away from CCD edges, bad pixels\netc.):\n\
|
| 15 |
+
\n ‘PATTERN‘ Meaning\n ----------- ---------------------------------------------------\n\
|
| 16 |
+
\ 0 singles\n 1 doubles in Y with Y(main)<Y(secondary)\n\
|
| 17 |
+
\ 2 doubles in X with X(main)<X(secondary)\n 3 doubles in\
|
| 18 |
+
\ Y with Y(main)>Y(secondary)\n 4 doubles in X with X(main)>X(secondary)\n\
|
| 19 |
+
\ 5–8 triples\n 9–12 quadruples\n 128 singles at CCD\
|
| 20 |
+
\ window (RAWX=1, RAWX=64, RAWY=200)\n or close to bad pixels\n \
|
| 21 |
+
\ 205 doubles at CCD window or bad pixels\n 206 triples at CCD\
|
| 22 |
+
\ window or bad pixels\n 207 quadruples at CCD window or bad pixels\n\
|
| 23 |
+
\nNote: as of version 6.30.4 PATTERN values of 128 have been changed to 0\n(i.e. $8^{\\\
|
| 24 |
+
rm th}$ bit is not set anymore for singles), and PATTERN\nvalues of 205 have been\
|
| 25 |
+
\ changed to 1–4 (i.e. $7^{\\rm th}$ and\n$8^{\\rm th}$ bit are not set anymore\
|
| 26 |
+
\ for doubles)!\n\nSecondary events of those valid doubles, triples, and quadruples\n\
|
| 27 |
+
($`PATTERN`=1..12$) have ${\\rm PATTERN(main)} + 64$ (as listed above),\ni.e. $7^{\\\
|
| 28 |
+
rm th}$ bit set.\n\n1. For the pattern codes in ‘PAT_ID‘ and ‘PATTERN‘ the following\n\
|
| 29 |
+
\ bit-wise storing is used:\n\n ‘PAT_ID‘ \n ----------\
|
| 30 |
+
\ ------- -------------------------------------------\n bit value\
|
| 31 |
+
\ Meaning\n 16 32768 free for additional pattern related flag\n\
|
| 32 |
+
\ 15 16384 – \" –\n 14 8192 – \" –\n \
|
| 33 |
+
\ 13 4096 PAT_ORI first digit (x-coordinate)\n 12 2048 –\
|
| 34 |
+
\ \" –\n 11 1024 PAT_ORI second digit (y-coordinate)\n \
|
| 35 |
+
\ 10 512 – \" –\n 9 256 PAT_IND: 1, ..., < 512 (telemetry\
|
| 36 |
+
\ limit)\n ... ... – \" –\n 1 1 – \" –\n\n\
|
| 37 |
+
\ ‘PATTERN‘ \n ----------- -------\
|
| 38 |
+
\ ------------------------- ----------------------------------\n \
|
| 39 |
+
\ bit value Meaning \n 8 128 sign of PAT_TYP\
|
| 40 |
+
\ \n 7 64 sign of PAT_IND \n \
|
| 41 |
+
\ 6 32 used to flag PAT_TYP > 4\n \
|
| 42 |
+
\ 5 16 if bit 6, then use next 5 bits\n\
|
| 43 |
+
\ 4 8 MOS code numbers 0 - 12 to store PAT_TYP - 5\n \
|
| 44 |
+
\ 3 4 a combination of hence, max storage: PAT_TYP\
|
| 45 |
+
\ = 36\n 2 2 PAT_TYP ≤ 4 and – \" –\n \
|
| 46 |
+
\ 1 1 PAT_ORI – \" –\n\n Note: as of version\
|
| 47 |
+
\ 6.30.4 PATTERN values of 128 have been changed\n to 0 (i.e. $8^{\\rm th}$\
|
| 48 |
+
\ bit is not set anymore for singles), and\n PATTERN values of 205 have been\
|
| 49 |
+
\ changed to 1–4 (i.e. $7^{\\rm th}$\n and $8^{\\rm th}$ bit are not set anymore\
|
| 50 |
+
\ for doubles)!\n\n2. Creation of event quality flags in column ‘FLAG‘. Task:\
|
| 51 |
+
\ epevents\n makes use of the common MOS/pn event related flag code (see )\
|
| 52 |
+
\ and\n uses the following bits (other flags are set by the Task: epframes\n\
|
| 53 |
+
\ task):\n\n ‘FLAG‘ \n -------- --------- -------------------------------------\n\
|
| 54 |
+
\ bit value Meaning (information)\n 1 0x2 ‘INVALID_PATTERN‘\n\
|
| 55 |
+
\ 2 0x4 ‘CLOSE_TO_CCD_WINDOW‘\n 5 0x20 ‘CLOSE_TO_ONBOARD_BADPIX‘\n\
|
| 56 |
+
\ 6 0x40 ‘CLOSE_TO_BRIGHTPIX‘ (not on-board)\n 8\
|
| 57 |
+
\ 0x100 ‘CLOSE_TO_DEADPIX‘ (not on-board)\n 16 0x10000 ‘OUT_OF_FOV‘\
|
| 58 |
+
\ \n\n bit value Meaning (rejection)\n ------- ----------\
|
| 59 |
+
\ ---------------------\n 19 0x80000 ‘COSMIC_RAY‘\n 21\
|
| 60 |
+
\ 0x200000 ‘ON_BADPIX‘\n 22 0x400000 ‘SECONDARY‘\n 23\
|
| 61 |
+
\ 0x800000 ‘TRAILING‘\n total 0xfa0000 EPN rejection mask\n"
|
| 62 |
+
- "rgssources\nThe source data can come from several sources:\n\n- A source list\
|
| 63 |
+
\ from a previous run of Task: rgssources (note that\n from version 5.1, Task:\
|
| 64 |
+
\ rgssources is now compatible with all\n earlier source list formats).\n\n\
|
| 65 |
+
- The proposed target source.\n\n- The attitude of the spacecraft.\n\n- \
|
| 66 |
+
\ A source list output by either Task: emldetect or Task: eboxdetect.\n\n- A\
|
| 67 |
+
\ source position supplied on the command line by the user.\n\nThese are described\
|
| 68 |
+
\ individually below.\n"
|
| 69 |
+
- "rgssources\n## Parameters\n\n \\label{rgssources:description:parameters}\n \
|
| 70 |
+
\ \n **filemode}\t{modify** (Optional): no\n(Type: \n Controls whether the\
|
| 71 |
+
\ task opens a previous source list for editing or creates a new one.\n }\n\
|
| 72 |
+
\ \\optparm{changeprime}\t{no}\t{boolean}\t{yes|no, Default: string}\t{modify|create,\
|
| 73 |
+
\ Range: \n Only active in `filemode`=`modify'. Unless this parameter is set,\
|
| 74 |
+
\ the previous prime source index number is retained.\n }\n \\optparm{changeattitude)\t\
|
| 75 |
+
{boolean}\t{yes|no}{\n Only active in `filemode`=`modify'. Unless this parameter\
|
| 76 |
+
\ is set, the previous attitude (stored in the header) is retained.\n }\n \
|
| 77 |
+
\ **srclist}\t{rgsset.ds** (Mandatory): yes\n(Type: \n The name of the rgs\
|
| 78 |
+
\ source list. If `filemode`=`create', the output is written to this file. If\
|
| 79 |
+
\ there is an existing file of this name, it will be overwritten unless SAS\\\
|
| 80 |
+
_CLOBBER is unset. If `filemode`=`modify', the task looks for an existing source\
|
| 81 |
+
\ list of this name and modifies it.\n }\n **instexpid}\t{}\t{string}\t{, Default:\
|
| 82 |
+
\ dataset}\t{, Range: \n This parameter contains information about both the\
|
| 83 |
+
\ instrument (that is, RGS1 or 2) and the exposure identifier (a letter S or U,\
|
| 84 |
+
\ indicating scheduled or unscheduled, followed by a three-digit numeric identifier.\
|
| 85 |
+
\ The `instexpid` string can be supplied in a number of different forms, but the\
|
| 86 |
+
\ two most useful are (i) as a six-character string comprising either R1 or R2\
|
| 87 |
+
\ followed by the exposure identifier (an example: `R2S003'); (ii) the name of\
|
| 88 |
+
\ any of RGS-specific files in the ODF can also be used. This parameter is mandatory\
|
| 89 |
+
\ if `filemode`=`create', or in cases where the instrument and/or exposure can\
|
| 90 |
+
\ neither be read from the file header or deduced from its name.\n }\n \\\
|
| 91 |
+
optparm{writeobskwds)\t{boolean}\t{yes|no** (Optional): no\n(Type: yes}\t{boolean}\t\
|
| 92 |
+
{yes|no, Default: \n If this is set, the task attempts to write observation-specific\
|
| 93 |
+
\ keywords to the file header. The user must point the environment variable SAS\\\
|
| 94 |
+
_ODF to the ODF directory for this to succeed.\n }\n \\optparm{writeexpkwds,\
|
| 95 |
+
\ Range: \n If this is set, the task attempts to write exposure-specific keywords\
|
| 96 |
+
\ to the file header. For this to succeed, the user must point the environment\
|
| 97 |
+
\ variable SAS\\_ODF to the ODF directory, and the task must also be able to determine\
|
| 98 |
+
\ the exposure number, either via the `instexpid` parameter, or from the `EXPIDSTR`\
|
| 99 |
+
\ keyword in the file header, or (if neither are present) from the file name.\n\
|
| 100 |
+
\ }\n \\optparm{clobberonlabel)\t{boolean}\t{yes|no}{\n Labels in RGS source\
|
| 101 |
+
\ lists are required to be unique. Where a clash is detected between a source\
|
| 102 |
+
\ already in the list and a new candidate source, the task takes one of two actions,\
|
| 103 |
+
\ depending on the value of this parameter: if `yes', the candidate is discarded;\
|
| 104 |
+
\ if `no', the task halts with an error.\n }\n\n **primestyle}\t{label}\t\
|
| 105 |
+
{string** (Optional): \n If `primestyle\n(Type: \n Only active if \\param{changeprime`=yes\
|
| 106 |
+
\ and either `addusersource` or `userasprime`=no. It controls the way in which\
|
| 107 |
+
\ the prime source is specified. See the parameters `primelabel` and `primeindex`.\
|
| 108 |
+
\ (An additional possible value of `expression' is planned.)\n }\n \\optparm{primelabel}\t\
|
| 109 |
+
{PROPOSAL, Default: label|index|expr|brightest|auto, Range: string}\t{) is active\
|
| 110 |
+
\ and set to `label', this parameter gives the value of the `LABEL` column of\
|
| 111 |
+
\ the source that it is desired the `PRIMESRC` keyword should point to.\n }\n\
|
| 112 |
+
\ **primeindex}\t{1}\t{integer}\t{$0<$primeindex** (Optional): expmedian\n(Type:\
|
| 113 |
+
\ }\t{string}\t{, Default: \n If `primestyle` is active and set to `index',\
|
| 114 |
+
\ the `PRIMESRC` keyword is set to this value.\n }\n \\optparm{primeexpression,\
|
| 115 |
+
\ Range: \n This mode is not yet supported.\n }\n\n \\optparm{attstyle)\t\
|
| 116 |
+
{string}{mean|median|start|user|expmedian}{\n Controls the way the attitude\
|
| 117 |
+
\ is calculated. If `mean', the attitude is calculated from the mean of the values\
|
| 118 |
+
\ in the attitude history file. If `median', the median of these values is used.\
|
| 119 |
+
\ If the value is `start', the task uses the attitude at the start of the exposure\
|
| 120 |
+
\ as the reference attitude. A value of `expmedian' tells the task to use the\
|
| 121 |
+
\ median of the attitude during the exposure only, as calculated by Task: attfilter.\
|
| 122 |
+
\ The final value, `user', allows the user to input the numbers him/herself via\
|
| 123 |
+
\ the next three parameters.\n }\n **meanset}\t{atthk.dat** (Optional): \n\
|
| 124 |
+
\ The name of the attitude history file. This file is a necessary input in\
|
| 125 |
+
\ the case that `attstyle\n(Type: \n The name of the attitude history file.\
|
| 126 |
+
\ This file is a necessary input in the case that \\param{attstyle` is `mean'.\n\
|
| 127 |
+
\ }\n \\optparm{medianset}\t{atthk.dat, Default: dataset}\t{, Range: dataset}\t\
|
| 128 |
+
{) is `median'.\n }\n **attra}\t{0}\t{angle}\t\t{$0\\le$`attra`$\\le 360$**\
|
| 129 |
+
\ (Mandatory): attgti.ds:STDGTI\n(Type: \n Only active if `attstyle`=`user'.\
|
| 130 |
+
\ The declination of the attitude, in decimal degrees.\n }\n \\mandparm{attapos}\t\
|
| 131 |
+
{0}\t{angle}\t{$0\\le$`attapos`$\\le 360$, Default: \n Only active if `attstyle`=`user'.\
|
| 132 |
+
\ The right ascension of the attitude, in decimal degrees.\n }\n \\mandparm{attdec}\t\
|
| 133 |
+
{0}\t{angle}\t{$-90\\le$`attdec`$\\le 90$, Range: \n Only active if `attstyle`=`user'.\
|
| 134 |
+
\ The position angle of the attitude, in decimal degrees.\n }\n **expmediantable){table**\
|
| 135 |
+
\ (Optional): \n This should be set if the user wishes to add a source to the\
|
| 136 |
+
\ list with a position specified on the command line.\n \n(Type: \n The\
|
| 137 |
+
\ name of the table in the filtered attitude history file in which the exposure-median\
|
| 138 |
+
\ keywords can be found. This file is a necessary input in the case that `attstyle`\
|
| 139 |
+
\ is `expmedian'.\n }\n\n \\optparm{addusersource, Default: , Range: no}\t\
|
| 140 |
+
{boolean}\t{yes|no)\n **label}\t{USER}\t{string}\t{** (Optional): \n Only\
|
| 141 |
+
\ active if `addusersource\n(Type: \n Only active if \\param{addusersource`=yes.\
|
| 142 |
+
\ The brightness of the source in counts per second. It is anticipated that this\
|
| 143 |
+
\ parameter won't be used much, since this is not a quantity that is likely to\
|
| 144 |
+
\ be known in most circumstances. The default value of 0.0 is harmless.\n }\n\
|
| 145 |
+
\ \\optparm{userasprime}\t{no}\t{boolean}\t{yes|no, Default: \n Only active\
|
| 146 |
+
\ if `addusersource`=yes. This is written directly to the `LABEL` column of the\
|
| 147 |
+
\ output source list. The empty string is not permitted.\n }\n \\optparm{rate}\t\
|
| 148 |
+
{0.0}\t{real}\t\t{$0.0<$rate, Range: \n Only active if `addusersource`=yes.\
|
| 149 |
+
\ If `changeprime`=yes and `userasprime`=yes, then the attribute `PRIMESRC` is\
|
| 150 |
+
\ set to the index number of the user source.\n }\n \\optparm{process}\t{no}\t\
|
| 151 |
+
{boolean}\t{yes|no)=yes. This causes the value in the `PROCESS` column to be set\
|
| 152 |
+
\ to true for the user-added source.\n }\n **bkgexclude}\t{yes}\t{boolean}\t\
|
| 153 |
+
{yes|no** (Optional): \n Only active if `addusersource\n(Type: radec, Default:\
|
| 154 |
+
\ \n Only active if \\param{addusersource`=yes. This causes the value in the\
|
| 155 |
+
\ `BKG\\_EXCLUDE` column to be set to true for the user-added source.\n }\n\
|
| 156 |
+
\ \\optparm{positionstyle, Range: string}\t{radec|wrtatt)=yes. If `positionstyle`=`radec',\
|
| 157 |
+
\ then the position of the user-added source is expected via the parameters `ra`\
|
| 158 |
+
\ and `dec`. If on the other hand `positionstyle`=`wrtatt' (With Respect To ATTitude),\
|
| 159 |
+
\ then the position of the user-added source is expected via the parameters `deltadisp`\
|
| 160 |
+
\ and `deltaxdsp`.\n }\n **ra}\t\t{0}\t{angle}\t{$0\\le$`ra`$\\le 360$** (Mandatory):\
|
| 161 |
+
\ \n Only active if `addusersource\n(Type: \n Only active if \\param{addusersource`=yes\
|
| 162 |
+
\ and `positionstyle`=`radec'. The declination of the user-added source, in decimal\
|
| 163 |
+
\ degrees.\n }\n \\mandparm{deltaxdsp}\t{0.0}\t{real}\t\t{, Default: \n \
|
| 164 |
+
\ Only active if `addusersource`=yes and `positionstyle`=`radec'. The right ascension\
|
| 165 |
+
\ of the user-added source, in decimal degrees.\n }\n \\mandparm{dec}\t{0}\t\
|
| 166 |
+
{angle}\t{$-90\\le$`dec`$\\le 90$, Range: \n Only active if `addusersource`=yes\
|
| 167 |
+
\ and `positionstyle`=`wrtatt'. The displacement in arcminutes of the user-added\
|
| 168 |
+
\ source from the pointing direction, in the dispersion direction.\n }\n \\\
|
| 169 |
+
mandparm{deltadisp}\t{0.0}\t{real}\t\t{)=yes and `positionstyle`=`wrtatt'. The\
|
| 170 |
+
\ displacement in arcminutes of the user-added source from the pointing direction,\
|
| 171 |
+
\ in the cross-dispersion direction.\n }\n\n **withepicset}\t{no}\t{boolean}\t\
|
| 172 |
+
{yes|no** (Optional): string\n(Type: \n The name of a set containing a list\
|
| 173 |
+
\ of sources. Formats output by the tasks Task: emldetect and Task: eboxdetect\
|
| 174 |
+
\ are accepted.\n }\n \\optparm{epiclabelprefix, Default: \n If this is\
|
| 175 |
+
\ set, the task looks for the parameter `epicset`, giving the name of an EPIC\
|
| 176 |
+
\ source list.\n }\n \\optparm{epicset}\t{}\t{dataset}\t{, Range: EPIC)\t\
|
| 177 |
+
{}{\n This parameter gives the string which is used by the task as a prefix\
|
| 178 |
+
\ when constructing `LABEL` values for EPIC-derived sources. The other part of\
|
| 179 |
+
\ the `LABEL` is the number `ML\\_ID\\_SRC` or `BOX\\_ID\\_SRC`. The main purpose\
|
| 180 |
+
\ of this parameter is to allow several EPIC-derived source lists to be included\
|
| 181 |
+
\ in the one RGS list if desired, while retaining unique labels.\n }\n **doconfusion}\t\
|
| 182 |
+
{no}\t{boolean}\t{yes|no** (Optional): \n Active only if `withepicset\n(Type:\
|
| 183 |
+
\ 3.5,1.0,1.0, Default: \n Active only if \\param{withepicset`=true. This parameter\
|
| 184 |
+
\ causes the task to check the epic sources + proposal position for confusion\
|
| 185 |
+
\ in the EPIC field of view. It is mainly designed for use in the PCMS, to prevent\
|
| 186 |
+
\ automatic extraction of too many spectra for what is essentially the same object.\
|
| 187 |
+
\ The degree of confusion depends on the size of the PSF, which is a function\
|
| 188 |
+
\ of energy. Therefore, strictly speaking, it depends on the selection of the\
|
| 189 |
+
\ energy band of interest (`bandids`). At the moment, however, the a-priori energy\
|
| 190 |
+
\ of $(0.5+2)/2 = 1.25$~keV is unconditionally used for it, whatever `bandids`\
|
| 191 |
+
\ is.\n }\n \\optparm{instweights, Range: real list}\t{)=true. This parameter\
|
| 192 |
+
\ gives the list of weighting factors for EPIC instruments for the use of calculation\
|
| 193 |
+
\ of RATE, where the order is the normal ID\\_INST number (i.e., pn, MOS1 and\
|
| 194 |
+
\ 2). The resultant RATE in the output RGS source list is normalised to 1.0 in\
|
| 195 |
+
\ the list, namely in default, it is normalised to the RATE of MOS1 (or 2).\n\
|
| 196 |
+
\ }\n **flagepicsrcoutoffov** (Optional): \n If this is set, the task carries\
|
| 197 |
+
\ out filtering, where only those sources, the position of which corresponds to\
|
| 198 |
+
\ cross-dispersion angles on the RGS camera between $-$2.9 and +2.9 arcminutes\
|
| 199 |
+
\ from camera centre, are regarded as a good source. If `withepicset\n(Type:\
|
| 200 |
+
\ \n Active only if \\param{withepicset`. If this is set, the input EPIC sources\
|
| 201 |
+
\ falling outside the FOV (see the description of `enablefilter` for definition)\
|
| 202 |
+
\ are flagged and are not dropped from the output source list due to that reason.\
|
| 203 |
+
\ If not (default), either they are dropped from the source list (if `enablefilter`=true)\
|
| 204 |
+
\ or nothing is done. See the description of `enablefilter` for the summary of\
|
| 205 |
+
\ the behaviour.\n }\n \\optparm{enablefilter, Default: no}\t{boolean}\t{yes|no,\
|
| 206 |
+
\ Range: no}\t{boolean}\t{yes|no)=true, the filtering is made also for the input\
|
| 207 |
+
\ EPIC sources, and the those EPIC sources regarded as no-good are either dropped\
|
| 208 |
+
\ out of the output list (`flagepicsrcoutoffov`=false) or just flagged as OUTOFFOV\
|
| 209 |
+
\ (if `flagepicsrcoutoffov`=false) (see section~\\ref{rgssources:description:outputfiles}\
|
| 210 |
+
\ for the OUTOFFOV flag). Regardless of whether epic sources are added or not\
|
| 211 |
+
\ (`withepicset`), the task checks the positions of all sources if `enablefilter`\
|
| 212 |
+
\ is set and flags them as it is and warns about any that fall outside the FOV.\n\
|
| 213 |
+
\ \\begin{center}\n \\begin{tabular}{|l|cc|}\n \\multicolumn{3}{c}{When `enablefilter`=true}\\\
|
| 214 |
+
\\\n \\hline\n & EPIC sources & Anything else\\\\\n \\hline\n `flagepicsrcoutoffov`\
|
| 215 |
+
\ = true & Flagged & Flagged\\\\\n `flagepicsrcoutoffov` = false & Dropped &\
|
| 216 |
+
\ Flagged\\\\\n \\hline\n \\end{tabular}\n \\end{center}\n }\n **bandids**\
|
| 217 |
+
\ (Optional): yes\n(Type: integer list}\t{, Default: 2,3, Range: \n This parameter\
|
| 218 |
+
\ gives the list of energy bands accepted for the input EPIC source list. The\
|
| 219 |
+
\ RATE value of each source in the output RGS source list is the sum of the RATEs\
|
| 220 |
+
\ of the corresponding source for the energy bands specified with this parameter.\
|
| 221 |
+
\ For 1XMM-source-catalogue type ones, this list should be 2, whereas for 2XMM-source-catalogue\
|
| 222 |
+
\ type ones, this list should be 2, 3 (default). Although an arbitrary number\
|
| 223 |
+
\ of elements in the list is allowed, if it is more than 9, only the first 9 energy\
|
| 224 |
+
\ bands are stated in the `E\\_mBNDnn` header keyword and the rest is unstated\
|
| 225 |
+
\ (see section~\\ref{rgssources:description:outputfiles}) in the output list.\n\
|
| 226 |
+
\ }\n \\optparm{withboresightfudge)\t{boolean}\t{yes|no}{\n Flip the sign\
|
| 227 |
+
\ of the boresight euler\\%psi. {\\bf This parameter will be removed} after the\
|
| 228 |
+
\ boresight is fixed. \n }\n\n[INPUT FILES]\nrgssources\n1. EPIC sources set\
|
| 229 |
+
\ with a binary extension table named ‘SRCLIST‘\n (required only if ‘withepicset‘\
|
| 230 |
+
\ = ‘yes’).\n\n The following columns need to be present in this table:\n\n\
|
| 231 |
+
\ - ‘RA‘: this value is copied into the RGS column of the same name.\n\n\
|
| 232 |
+
\ - ‘DEC‘: this value is copied into the RGS column of the same\n \
|
| 233 |
+
\ name.\n\n - ‘ML_ID_SRC‘ (if the source list was made by Task: emldetect)\
|
| 234 |
+
\ or\n ‘BOX_ID_SRC‘ (if the source list was made by Task: eboxdetect):\n\
|
| 235 |
+
\ this number is included in the ‘LABEL‘ value of the source in\n \
|
| 236 |
+
\ the RGS list.\n\n - ‘ID_BAND‘: this value is used in distinguishing the\
|
| 237 |
+
\ energy band\n in calculating RATE (see below).\n\n - ‘RATE‘: the\
|
| 238 |
+
\ sum of these values in the specified energy bands\n are written in the\
|
| 239 |
+
\ output RGS list. The energy band (ID) is\n listed in the above-mentioned\
|
| 240 |
+
\ ‘ID_BAND‘ column, whereas the\n energy band IDs are specified in ‘bandids‘\
|
| 241 |
+
\ command-line\n parameter.\n\n2. RGS sources set as described in the\
|
| 242 |
+
\ ‘Output files’ section (required\n only if ‘filemode‘ = ‘modify’).\n\n3.\
|
| 243 |
+
\ The attitude history file created by Task: atthkgen (required only\n if\
|
| 244 |
+
\ ((‘filemode‘ = ‘modify’ and ‘changeattitude‘ = ‘yes’) or\n ‘filemode‘ = ‘create’)\
|
| 245 |
+
\ and ‘attstyle‘ = ‘mean’ or ‘median’.).\n\n4. The filtered attitude history\
|
| 246 |
+
\ file created by Task: attfilter\n (required only if ((‘filemode‘ = ‘modify’\
|
| 247 |
+
\ and ‘changeattitude‘ =\n ‘yes’) or ‘filemode‘ = ‘create’) and ‘attstyle‘\
|
| 248 |
+
\ = ‘expmedian’.).\n\n[OUTPUT FILES]\nrgssources\n1. RGS sources set with a binary\
|
| 249 |
+
\ extension table named ‘SRCLIST‘. The\n header has all the keywords mandatory\
|
| 250 |
+
\ for PPS products, in\n particular\n\n - ‘RA_PNT‘: The right ascension\
|
| 251 |
+
\ of the attitude in decimal\n degrees.\n\n - ‘DEC_PNT‘: The declination\
|
| 252 |
+
\ of the attitude in decimal degrees.\n\n - ‘PA_PNT‘: The position angle\
|
| 253 |
+
\ of the attitude in decimal degrees.\n\n The ‘SRCLIST‘ table has the following\
|
| 254 |
+
\ keywords:\n\n - ‘PRIMESRC‘: The ‘INDEX‘ value (see column description below)\
|
| 255 |
+
\ of\n the prime source.\n\n - ‘E_EXPRn‘: There are n ( ≤ 99) occurrences\
|
| 256 |
+
\ of this keyword, one\n for each EPIC source list added to the RGS list.\
|
| 257 |
+
\ The numbers ‘n‘\n are consecutive, starting at 1. The values of these\
|
| 258 |
+
\ keywords are\n taken from the ‘INSTRUME‘ header keyword in the input\
|
| 259 |
+
\ EPIC\n source list (that is, probably EPN, in most of the cases, which\n\
|
| 260 |
+
\ does not carry a lot of practical meaning, in fact), although it\n \
|
| 261 |
+
\ used to be the exposure IDs of the respective EPIC source files\n \
|
| 262 |
+
\ (in the old-style source lists).\n\n - ‘E_CONTn‘: Similar to the ‘E_EXPRn‘\
|
| 263 |
+
\ keyword, but this records\n the value of the ‘CONTENT‘ keyword in the\
|
| 264 |
+
\ EPIC file header.\n\n - ‘E_mBNDn‘: Similar to the ‘E_EXPRn‘ keyword, but\
|
| 265 |
+
\ this records\n the value of either ‘ID_BAND‘ (in the input RGS source\
|
| 266 |
+
\ file,\n when ‘filemode‘=‘modify’) or ‘bandids‘, which is used to select\n\
|
| 267 |
+
\ the EPIC sources and to calculate the RATE value, transmitted\n \
|
| 268 |
+
\ into the output RGS source list. Note that this used to be\n ‘E_BANDn‘(=2)\
|
| 269 |
+
\ before Ver.6.0. If ‘filemode‘=‘modify’ and if the\n input RGS source\
|
| 270 |
+
\ list has ‘E_BANDn‘ keywords, then they will be\n preserved in the output\
|
| 271 |
+
\ RGS source list (i.e., both ‘E_BANDn‘\n and ‘E_mBNDn‘ keywords may appear).\n\
|
| 272 |
+
\n - ‘E_FILTn‘: Similar to the ‘E_EXPRn‘ keyword, but this records\n \
|
| 273 |
+
\ the value of the ‘FILTER‘ keyword in the EPIC file header.\n\n The ‘SRCLIST‘\
|
| 274 |
+
\ table has the following columns:\n\n Column name: Data type: Description:\n\
|
| 275 |
+
\ ---------------- ------------ --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------\n\
|
| 276 |
+
\ ‘INDEX‘ int16 Source index number. Each source has a unique\
|
| 277 |
+
\ value, which Task: rgssources never alters.\n ‘LABEL‘ string\
|
| 278 |
+
\ Label for the source. These values are also unique to each source. Only upper\
|
| 279 |
+
\ case is used. At present, label values can only be 20 characters or less in\
|
| 280 |
+
\ length. Trailing spaces are not allowed.\n ‘RA‘ real32 \
|
| 281 |
+
\ J2000 right ascension in decimal degrees.\n ‘DEC‘ real32\
|
| 282 |
+
\ J2000 declination in decimal degrees.\n ‘RATE‘ real32 \
|
| 283 |
+
\ Counts per second.\n ‘DELTA_DISP‘ real32 Offset on the sky,\
|
| 284 |
+
\ in the dispersion direction, of the source with respect to the pointing direction.\
|
| 285 |
+
\ Given in arcminutes.\n ‘DELTA_XDSP‘ real32 Offset on the sky,\
|
| 286 |
+
\ in the cross-dispersion direction, of the source with respect to the pointing\
|
| 287 |
+
\ direction. Given in arcminutes.\n ‘FOV_PHI‘ real32 This and\
|
| 288 |
+
\ the next column give the polar coordinates of ‘DELTA_DISP‘ and ‘DELTA_XDSP‘. Units\
|
| 289 |
+
\ for both are decimal degrees. ‘FOV_PHI‘ is the angle of the source position\
|
| 290 |
+
\ from the -ve dispersion axis towards the +ve cross-dispersion axis.\n ‘FOV_R‘\
|
| 291 |
+
\ real32 \n ‘CONFUSION‘ real32 This is a measure\
|
| 292 |
+
\ of how confused the source is with respect to the prime source. See subsection\
|
| 293 |
+
\ [confusion] for a description of how it is calculated. It is a dimensionless\
|
| 294 |
+
\ number.\n ‘PROCESS‘ bool This column is used by Task: rgsregions\
|
| 295 |
+
\ to flag those sources for which spectrum extraction regions should be calculated.\
|
| 296 |
+
\ This column is no longer set by Task: rgssources, though, so all values are\
|
| 297 |
+
\ written as false in principle. An exception is the case of ‘filemode‘=‘modify’;\
|
| 298 |
+
\ in that case the PROCESS column in the input RGS source list is in principle\
|
| 299 |
+
\ preserved. Another exception is the sources added by the user (‘addusersource‘=true),\
|
| 300 |
+
\ where the value of the command-line option ‘process‘ is written as it is in\
|
| 301 |
+
\ principle. In any case, if ‘filemode‘=‘modify’ and ‘changeattitude‘=true, all\
|
| 302 |
+
\ PROCESS values are forcibly written as false regardless of the value ‘process‘\
|
| 303 |
+
\ or PROCESS in the input RGS source list.\n ‘BKG_EXCLUDE‘ bool \
|
| 304 |
+
\ This column is used by Task: rgsregions to flag those sources which should\
|
| 305 |
+
\ be excluded from the background spectrum extraction region. This column is no\
|
| 306 |
+
\ longer set by Task: rgssources, so all values are written as false.\n ‘FIXED_ON_SKY‘\
|
| 307 |
+
\ bool This column flags those sources for which the positional information\
|
| 308 |
+
\ was derived from right ascension and declination. The only sources for which\
|
| 309 |
+
\ ‘FIXED_ON_SKY‘ is false are the attitude source and any user source supplied\
|
| 310 |
+
\ with ‘userstyle‘=‘wtatt’.\n\n Column name: Data type: Description:\n\
|
| 311 |
+
\ -------------- ------------ ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------\n\
|
| 312 |
+
\ ‘EPIC_FILE‘ int16 This gives the number of the ‘E_EXPRn‘, ‘E_CONTn‘,\
|
| 313 |
+
\ ‘E_mBNDn‘ (or ‘E_BANDn‘ before Ver.6.0) and ‘E_FILTn‘ keywords appropriate to\
|
| 314 |
+
\ the source if it has been derived from an EPIC source list. Eg, for ‘EPIC_FILE‘=3,\
|
| 315 |
+
\ the details of the original list from which this source came can be found from\
|
| 316 |
+
\ the keywords ‘E_EXPR3‘, ‘E_CONT3‘, ‘E_mBND3‘ and ‘E_FILT3‘.\n ‘FLAG‘ \
|
| 317 |
+
\ int32 If non-zero, something goes wrong in the source. It is a\
|
| 318 |
+
\ binary (bit-type) form of representation for each cause – see the following\
|
| 319 |
+
\ table for detail (n.b., The representation of this FLAG column is entirely different\
|
| 320 |
+
\ from that in the input EPIC source list). Note that some of the checks may be\
|
| 321 |
+
\ bypassed if requested (by command-line parameters); for example if ‘enablefilter‘=false\
|
| 322 |
+
\ and ‘flagepicsrcoutoffov‘=false, no check for OUTOFFOV is carried out.\n\n \
|
| 323 |
+
\ The following is the description for the ‘FLAG‘ column:\n\n Name \
|
| 324 |
+
\ Bit Description\n ------------ ----- ---------------------------------------------------------------\n\
|
| 325 |
+
\ OUTOFFOV 0 The source is out of field of view.\n CONFUSED\
|
| 326 |
+
\ 1 The source may be confused with other source(s).\n BADBAND[1]\
|
| 327 |
+
\ 2 The energy band used (hence RATE) may be wrong.\n WIDESRC \
|
| 328 |
+
\ 3 The source is greater than 90 degrees away from the pointing.\n\n Note\
|
| 329 |
+
\ that the RGS source list set is also used to store the spectrum\n extraction\
|
| 330 |
+
\ regions created by Task: rgsregions. These become\n invalidated if the attitude\
|
| 331 |
+
\ is altered; in this case Task:\n rgssources deletes them. See the algorithm\
|
| 332 |
+
\ (section\n [rgssources:description:algorithm]) for details of the circumstances\n\
|
| 333 |
+
\ under which this occurs.\n\n The RGS source list table is required to\
|
| 334 |
+
\ have 1 source whose\n position is taken from the observation proposal, and\
|
| 335 |
+
\ 1 source whose\n position is equal to the RGS attitude (stored in the dataset\
|
| 336 |
+
\ header\n keywords ‘RA_PNT‘, ‘DEC_PNT‘ and ‘PA_PNT‘). The ‘LABEL‘ values of\n\
|
| 337 |
+
\ these two sources are PROPOSAL and ONAXIS respectively.\n\n[1] Since Ver.6.0,\
|
| 338 |
+
\ this flag is not set by rgssources.\n\n[ABSTRACT] rgssources\nThe task constructs\
|
| 339 |
+
\ a list of sources that are to be processed by RGS\npipeline.\n[DESCRIPTION]\
|
| 340 |
+
\ rgssources\n[ATTITUDE PARAMETERS.] rgssources\n[CCF.] rgssources\nTo access\
|
| 341 |
+
\ this, the user should set SAS_CCF in the usual way.\n[ADDING FURTHER SOURCES.]\
|
| 342 |
+
\ rgssources\n[FUTURE DEVELOPMENTS] rgssources\n-\n[CAL USAGE] rgssources\n- \
|
| 343 |
+
\ CAL_setState\n\n- CAL_getMiscellaneousDataValue"
|
| 344 |
+
- source_sentence: What are the possible warning messages listed in the excerpt?
|
| 345 |
+
sentences:
|
| 346 |
+
- 'General cross-correlation products
|
| 347 |
+
|
| 348 |
+
|
| 349 |
+
These PPS cross-correlation products list the names of all catalogues
|
| 350 |
+
|
| 351 |
+
searched (both around each EPIC position and in the whole EPIC field)
|
| 352 |
+
|
| 353 |
+
and describe the format of their output.
|
| 354 |
+
|
| 355 |
+
'
|
| 356 |
+
- 'This product is no longer made by the pipeline. A scientifically
|
| 357 |
+
|
| 358 |
+
meaningful flatfield image can not readily be constructed from onboard
|
| 359 |
+
|
| 360 |
+
flat-field images. A unit flatfield is considered to be adequate and so
|
| 361 |
+
|
| 362 |
+
creation of this product was dropped from the processing.
|
| 363 |
+
|
| 364 |
+
'
|
| 365 |
+
- "rgsregions\n## Errors\n\n \\label{rgsregions:description:errorconditions}\n\n\
|
| 366 |
+
\ **Error:** noExposureMaps.\n }\n\n **Warning:** fractionalCoverage,\n `xpsfexcl`,\
|
| 367 |
+
\ or `pdistincl`) was given a value greater\n than zero but less than one, suggesting\
|
| 368 |
+
\ that the user has forgotten\n that these parameters are specified as percentages.\n\
|
| 369 |
+
\ }\n\n **Warning:** protectedRegion\n\n **Warning:** emptyRegion\n\n"
|
| 370 |
+
- source_sentence: What happens if the number of types and scopes provided is not
|
| 371 |
+
equal in cifremove?
|
| 372 |
+
sentences:
|
| 373 |
+
- "- For each RGS detector there is a single file containing filtered\n events\
|
| 374 |
+
\ from all CCDs.\n\n- The structure of the FITS file is:\n\n 1. Primary\
|
| 375 |
+
\ header with null primary array.\n\n 2. A binary table extension containing\
|
| 376 |
+
\ event data\n ( EXTNAME=’EVENTS’).\n\n 3. Per CCD (m =1-9) a standard\
|
| 377 |
+
\ GTI extension (STDGTI0m).\n\n 4. Per CCD (m) and per CCD readout node (n=0-1),\
|
| 378 |
+
\ a bad pixel\n extension (BADPIXnm).\n\n 5. Per CCD (m) and per CCD\
|
| 379 |
+
\ readout node (n), a rejected pixel\n extension (REJPIXnm).\n\n 6.\
|
| 380 |
+
\ Per CCD (m) an exposure extension (EXPOSU0m).\n\n 7. Per CCD (m) and per\
|
| 381 |
+
\ readout node (n), an exposure map extension\n EXPMAPnm\n\n- These files\
|
| 382 |
+
\ are identified using the keyword\n\n CONTENT = 'RGS EVENT LIST'\n\n \
|
| 383 |
+
\ in the primary header.\n\n- This is a product of class RGSEXP.\n\n- The\
|
| 384 |
+
\ EVENTS extension comprises a binary table extension with the\n following\
|
| 385 |
+
\ columns:\n\n Name Type Description\n -----------------\
|
| 386 |
+
\ ---------------- -----------------------------------------------\n TIME\
|
| 387 |
+
\ 8-byte REAL Frame timestamp\n FLAG 4-byte\
|
| 388 |
+
\ INTEGER Event attribute flags\n BETA 4-byte REAL Uncorrected\
|
| 389 |
+
\ dispersion angle\n XDSP 4-byte REAL Uncorrected cross-dispersion\
|
| 390 |
+
\ angle\n CHIPX 2-byte INTEGER Chip X coordinate (pixel)\n\
|
| 391 |
+
\ CHIPY 2-byte INTEGER Chip Y coordinate (pixel)\n PHA\
|
| 392 |
+
\ 2-byte INTEGER Total telemetered energy\n SHAPE \
|
| 393 |
+
\ BYTE Event shape identifier\n GRADE BYTE \
|
| 394 |
+
\ Total number of pixels\n PI 2-byte INTEGER \
|
| 395 |
+
\ Total corrected CCD event energy\n CCDNR BYTE CCD\
|
| 396 |
+
\ ID number\n BETA_CORR 4-byte REAL Attitude corrected dispersion\
|
| 397 |
+
\ angle (radians)\n XDSP_CORR 4-byte REAL Attitude corrected\
|
| 398 |
+
\ cross-disp angle (radians)\n M_LAMBDA 4-byte REAL Wavelength\
|
| 399 |
+
\ spectral-order product\n BETA_CHANNEL 2-byte INTEGER BETA_CORR channel\n\
|
| 400 |
+
\ MLAMBDA_CHANNEL 2-byte INTEGER M_LAMBDA channel\n XDSP_CHANNEL\
|
| 401 |
+
\ 2-byte INTEGER XDSP_CORR channel\n\n- Event times are specified in\
|
| 402 |
+
\ seconds after a reference time\n specified in a header keyword (MJDREF).\n\
|
| 403 |
+
\n- The STDGTI0m extension comprises a binary table extension with the\n \
|
| 404 |
+
\ following columns:\n\n Name Type Description\n -------\
|
| 405 |
+
\ ------------- ------------------------------------------\n START 8-byte\
|
| 406 |
+
\ REAL GTI start time (s) since reference epoch\n STOP 8-byte REAL \
|
| 407 |
+
\ GTI end time (s) since reference epoch\n\n- The BADPIXnm extension contains\
|
| 408 |
+
\ a binary table extension with the\n following columns:\n\n Name \
|
| 409 |
+
\ Type Description\n --------- ---------------- --------------------------------\n\
|
| 410 |
+
\ CHIPX 2-byte INTEGER Chip X coordinate (pixel)\n CHIPY 2-byte\
|
| 411 |
+
\ INTEGER Chip Y coordinate (pixel)\n YEXTENT 2-byte INTEGER Extent\
|
| 412 |
+
\ of badness in Y (pixel)\n TYPE 2-byte INTEGER Type of badness\n\
|
| 413 |
+
\ BADFLAG 2-byte INTEGER Data source flag\n\n- The REJPIXnm extension\
|
| 414 |
+
\ contains a binary table extension with the\n following columns:\n\n \
|
| 415 |
+
\ Name Type Description\n ------- ---------------- ---------------------------\n\
|
| 416 |
+
\ FRAME 4-byte INTEGER Frame identifier\n FLAG 4-byte INTEGER\
|
| 417 |
+
\ Event attribute flags\n CHIPX 2-byte INTEGER Chip X coordinate (pixel)\n\
|
| 418 |
+
\ CHIPY 2-byte INTEGER Chip Y coordinate (pixel)\n\n- The EXPOSU0m\
|
| 419 |
+
\ extension contains a binary table extension with the\n following columns:\n\
|
| 420 |
+
\n Name Type Description\n ---------- ----------------\
|
| 421 |
+
\ ---------------------------------------------\n FRAME 4-byte INTEGER\
|
| 422 |
+
\ Frame identifier\n NLOSTEVT 2-byte INTEGER Number of lost events\
|
| 423 |
+
\ in frame\n ABORTFLG 2-byte INTEGER Abort frame flag\n FLAG \
|
| 424 |
+
\ 4-byte INTEGER Frame attributes\n TIMEDEL 4-byte REAL Frame\
|
| 425 |
+
\ integration time (s)\n TIME 8-byte REAL Seconds since MJDREF\n\
|
| 426 |
+
\ FRACEXP0 4-byte REAL Exposure fraction node 0\n FRACEXP1 \
|
| 427 |
+
\ 4-byte REAL Exposure fraction node 1\n ASPCDSP 4-byte REAL \
|
| 428 |
+
\ Aspect correction applied to BETA (radians)\n ASPCXDSP 4-byte REAL \
|
| 429 |
+
\ Aspect correction applied to XDSP (radians)\n\n- The EXPMAPnm extension\
|
| 430 |
+
\ is an image extension containing the exposure\n map for CCD m, node n.\n\n\
|
| 431 |
+
- This is a science product suitable for use in further data analysis.\n\n-\
|
| 432 |
+
\ There will be a single event file per exposure. The event lists will\n \
|
| 433 |
+
\ typically be 10 MB uncompressed\n"
|
| 434 |
+
- "The source list for a grism exposure represents a list of detections of\nall\
|
| 435 |
+
\ the zeroth order and/or first-order spectrum features in the OSW\nimage.\n\n\
|
| 436 |
+
- The source detection list is supplied in FITS format.\n\n- These files are\
|
| 437 |
+
\ identified using the keyword\n\n CONTENT = 'OM OSW GRISM SOURCE LIST'\n\
|
| 438 |
+
\n in the primary header.\n\n- This is a product of class OMSW.\n\n- The\
|
| 439 |
+
\ OGIP filetype is defined by the keywords\n\n HDUCLASS= 'OGIP ' \
|
| 440 |
+
\ / Format conforms to OGIP/GSFC conventions\n HDUCLAS1= 'SRCLIST\
|
| 441 |
+
\ ' / File contains a source list\n\n in the primary header.\n\n\
|
| 442 |
+
- The data extension (EXTNAME = ’SRCLIST’) contains a binary table\n with\
|
| 443 |
+
\ the following columns:\n\n Name Type Description\n\
|
| 444 |
+
\ -------------- ---------------- --------------------------------------------------------------\n\
|
| 445 |
+
\ SRCNUM 4-byte INTEGER Source number\n XPOS 4-byte\
|
| 446 |
+
\ REAL X-pixel position\n YPOS 4-byte REAL Y-pixel position\n\
|
| 447 |
+
\ POSERR 4-byte REAL Positional error (pixels)\n SPB_COILOSS\
|
| 448 |
+
\ 4-byte REAL Coincidence loss correction in source+background\n \
|
| 449 |
+
\ BK_COILOSS 4-byte REAL Coincidence loss correction in background\n\
|
| 450 |
+
\ FWHM_MAJ 4-byte REAL Source FWHM (ellipse major axis)\n \
|
| 451 |
+
\ FWHM_MAJ_ERR 4-byte REAL Source FWHM (major axis) error\n FWHM_MIN\
|
| 452 |
+
\ 4-byte REAL Source FWHM (ellipse minor axis)\n FWHM_MIN_ERR\
|
| 453 |
+
\ 4-byte REAL Source FWHM (minor axis) error\n PA 4-byte\
|
| 454 |
+
\ REAL Position angle of ellipse major axis\n PA_ERR 4-byte\
|
| 455 |
+
\ REAL Source position angle error\n QFLAG 16-bit INTEGER \
|
| 456 |
+
\ Quality flag\n CFLAG 8-bit INTEGER Confusion flag\n EFLAG\
|
| 457 |
+
\ 8-bit INTEGER Extension flag\n SPECTR_ID 4-byte INTEGER\
|
| 458 |
+
\ Spectrum identifier\n REL2SRCNUM 4-byte INTEGER Identifies related\
|
| 459 |
+
\ spectrum and zeroth order feature entries\n\n- This is a science product.\
|
| 460 |
+
\ The OM OSW source list is the first stage\n analysis of the OSW for grism\
|
| 461 |
+
\ data.\n\n- The grism source list is notably distinct from the normal imaging\n\
|
| 462 |
+
\ and FAST source lists because many entries are the detections of the\n \
|
| 463 |
+
\ spectra themselves, not just the zeroth order features that map to\n the\
|
| 464 |
+
\ objects on the sky. At the current time, the SSC pipeline does\n not insert\
|
| 465 |
+
\ celestial coordinates (RA and DEC) in the file though\n this is expected\
|
| 466 |
+
\ to change in a future pipeline release. The ellipse\n parameters of the detections\
|
| 467 |
+
\ largely reflect dispersion in the\n spectrum and zeroth order features, rather\
|
| 468 |
+
\ than intrinsic extension\n of the sky object.\n\n- There is one file per\
|
| 469 |
+
\ OSW per exposure. Each file is typically 24KB\n uncompressed.\n"
|
| 470 |
+
- "cifremove\n \n cif=parameter(calindexset)\n if(parameterCount(types)\
|
| 471 |
+
\ != parameterCount(scopes)){\n error(ParameterCountMismatch)\n }\n\
|
| 472 |
+
\ foreach(type-scope pair){\n if(! cif.has(type, scope)){\n \
|
| 473 |
+
\ warning(NoMatchingCcfConstituent)\n } else {\n cif.remove_entry(type,\
|
| 474 |
+
\ scope) \n }\n }\n"
|
| 475 |
+
- source_sentence: What are the task parameters of binadapt?
|
| 476 |
+
sentences:
|
| 477 |
+
- "backscale\n## Parameters\n\n\\label{backscale:description:parameters}\n\n **spectrumset**\
|
| 478 |
+
\ (Mandatory): \n Name of the input file\n \n(Type: string, Default: spectrum.ds,\
|
| 479 |
+
\ Range: )\n **badpixlocation** (Optional): \n Name of the file containing the\
|
| 480 |
+
\ bad pixels, initially this\n is the event file.\n \n(Type: string, Default:\
|
| 481 |
+
\ notSpecified, Range: )\n **withbadpixcorr** (Optional): \n Whether to use bad\
|
| 482 |
+
\ pixels and chip gaps in the calculation.\n \n(Type: boolean, Default: yes,\
|
| 483 |
+
\ Range: )\n **useodfatt** (Optional): \n Whether to use the ODF attitude file\
|
| 484 |
+
\ to construct position info.\n \n(Type: boolean, Default: no, Range: )\n **ignoreoutoffov**\
|
| 485 |
+
\ (Optional): \n Whether area outside the field of view should be included\n\
|
| 486 |
+
\ in the backscale calculation.\n \n(Type: boolean, Default: yes, Range: )\n\
|
| 487 |
+
\ **withbadpixres** (Optional): \n Whether a grid resolution has been specified\
|
| 488 |
+
\ on the command line.\n If not set then the task uses the default badpixelresolution\
|
| 489 |
+
\ set by\n the Task: arfgen\n(Type: boolean, Default: no, Range: ) task.\n \n\
|
| 490 |
+
\ **badpixelresolution** (Optional): \n The grid resolution to use when calculating\
|
| 491 |
+
\ the area. If set then this overrides\n the value used internally by Task: arfgen\n\
|
| 492 |
+
(Type: float, Default: , Range: ). A value such as 2.0, will result in \n a faster\
|
| 493 |
+
\ execution time at the expense of accuracy.\n \n% **detmaptype** (Optional):\
|
| 494 |
+
\ detmapfile.ds:\n(Type: choice, Default: flat, Range: dataset flat}\n% {\n\
|
| 495 |
+
% This is the detector map type. It should be left as the default\n% 'flat'\
|
| 496 |
+
\ in all cases except where the source region contains a\n% spatial mask. In\
|
| 497 |
+
\ this case it should be set to 'dataset' and\n% an image of the extraction\
|
| 498 |
+
\ region given in `detmaparray`.\n% }\n\n% \\optparm{detmaparray){array}{none}\n\
|
| 499 |
+
% {\n% Name of detector map dataset and array in the DAL compound notation.\n\
|
| 500 |
+
% Only used if `detmaptype` is set to `dataset`.\n% }\n\n[INPUT FILES]\n\
|
| 501 |
+
backscale\n- an EPIC spectrum file containing a datasubspace definition\n\n\
|
| 502 |
+
- an optional second file containing the bad pixel extensions\n\n[OUTPUT FILES]\n\
|
| 503 |
+
backscale\n- The input spectrum is modified\n\n[ABSTRACT] backscale\nA tool\
|
| 504 |
+
\ for calculating and writing the BACKSCAL keyword in EPIC spectra.\n[SPATIAL\
|
| 505 |
+
\ MASKS] backscale\n[CAL USAGE] backscale\nThe metatask doesn’t use the CAL directly\
|
| 506 |
+
\ but calls Task: arfgen which\nuses the routine CAL_onCcd to determine whether\
|
| 507 |
+
\ a pixel lies on a CCD.\n[FUTURE DEVELOPMENTS] backscale\nThere is scope for\
|
| 508 |
+
\ reorganising Task: arfgen to make the BACKSCAL\ncalculation a bit faster."
|
| 509 |
+
- "binadapt\n## Parameters\n\n**prefix** (Optional): Input inst+exposure ID (1S001,\
|
| 510 |
+
\ S003) OR “comb” to\nuse combimage inputs.\n\n(Type: string, Default: comb, Range:\
|
| 511 |
+
\ ) The program defaults to deriving\na filename of the form comb-elow-ehigh.fits.\
|
| 512 |
+
\ If using singular expids,\nenter that as the prefix.\n\n**elow** (Optional):\
|
| 513 |
+
\ Lower energy limit for the energy band in eV.\n\n(Type: int, Default: 350, Range:\
|
| 514 |
+
\ 0 < = elow < = 11999) **ehigh**\n(Optional): Upper energy limit for the energy\
|
| 515 |
+
\ band in eV.\n\n(Type: int, Default: 1100, Range: 1 < = ehigh < = 12000)\n\
|
| 516 |
+
**withpartbkg** (Optional): Particle background control, \"yes\" to\nsubtract\
|
| 517 |
+
\ the model (QPB) particle background image.\n\n(Type: bool, Default: no, Range:\
|
| 518 |
+
\ T/F) **withspbkg** (Optional): Soft\nproton background control, \"yes\" to subtract\
|
| 519 |
+
\ the soft proton background\nimage.\n\n(Type: bool, Default: no, Range: T/F)\
|
| 520 |
+
\ **withswcxbkg** (Optional): Solar\nwind charge exchange background control,\
|
| 521 |
+
\ \"yes\" to subtract the SWCX\nbackground image.\n\n(Type: bool, Default: no,\
|
| 522 |
+
\ Range: T/F) **withmask** (Optional): Apply\nadditional masking using input image?\n\
|
| 523 |
+
\n(Type: bool, Default: no, Range: T/F) **maskfile** (Optional): The\nfilename\
|
| 524 |
+
\ for an image to provide additional masking if desired.\n\n(Type: dataset, Default:\
|
| 525 |
+
\ default, Range: ) If left blank (AND\nwithmask=T), binadapt will derive a mask\
|
| 526 |
+
\ filename based on other\nparameters. The mask images must be the same size and\
|
| 527 |
+
\ projection as the\nother images. Since masks can come from many sources, it\
|
| 528 |
+
\ is recommended\nthe user enter withmask=T maskfile=yourmaskfile together.\n\
|
| 529 |
+
**withbinning** (Optional): Perform binning?\n\n(Type: bool, Default: yes, Range:\
|
| 530 |
+
\ T/F) **binfactor** (Optional): Binning\nfactor.\n\n(Type: int, Default: 2, Range:\
|
| 531 |
+
\ 1 < = binfactor) **withsmoothing**\n(Optional): Perform smoothing?\n\n(Type:\
|
| 532 |
+
\ bool, Default: yes, Range: T/F) **smoothcounts** (Optional):\nSmoothing factor.\n\
|
| 533 |
+
\n(Type: int, Default: 50, Range: 1 < = smoothcounts < = 100)\n**maskthresh**\
|
| 534 |
+
\ (Optional): The scale factor for excluding regions from\nthe smoothing based\
|
| 535 |
+
\ on a mask image.\n\n(Type: real, Default: 0.02, Range: 0.001 < = maskthresh)\
|
| 536 |
+
\ In the default\nmode the average exposure is calculated and then any pixel with\
|
| 537 |
+
\ exposure\nless than fraction*average value is excluded.\n[INPUT FILES]\nbinadapt\n\
|
| 538 |
+
Binadapt will create filenames based on parameters input, especially\nprefix,\
|
| 539 |
+
\ elow, and ehigh\n\nThe user can choose to enter either a prefix designating\
|
| 540 |
+
\ the\ninstrument + expid, e.g. 1S001, 2S002, S003 OR the string “comb” to use\n\
|
| 541 |
+
products from the task combimage. Either will initiate deriving all the\ninput\
|
| 542 |
+
\ filenames based on other input parameters. If no prefix is given,\nbinadapt\
|
| 543 |
+
\ will derive an input filename of the form:\ncomb-elow-ehigh.fits, the default\
|
| 544 |
+
\ output from combimage.\n\nValid input filenames derived are, in the case of\
|
| 545 |
+
\ a prefix being\nentered, e.g.:\n\n binadapt prefix=1S001 withspbkg=T withpartbkg=T\
|
| 546 |
+
\ withswcx=T withmask=T\n maskfile=mymaskimage.fits elow=400 ehigh=2000\n\n\
|
| 547 |
+
mos1S001-fovimsky-400-2000.fits (from mosspectra)\nmos1S001-expimsky-400-2000.fits\
|
| 548 |
+
\ (from mosspectra)\nmos1S001-bkgimsky-400-2000.fits (from mosback)\nmos1S001-swcximsky-400-2000.fits\
|
| 549 |
+
\ (from swcx)\nmos1S001-protimsky-400-2000.fits (from proton)\nmos1S001-maskimsky-400-2000.fits\
|
| 550 |
+
\ (from emask, et al)\n[NOTE: binadapt will, by default, create a mask file name\
|
| 551 |
+
\ as above, but\nsince masks can come from different tasks, if you have a mask\
|
| 552 |
+
\ NOT of\nthat style, simply set withmask=T and maskfile=yourmaskname to override\n\
|
| 553 |
+
the default]\n\nValid input filenames derived are, in the case of a comb being\
|
| 554 |
+
\ entered,\ne.g.:\n\n binadapt prefix=comb withspbkg=T withpartbkg=T withswcx=T\
|
| 555 |
+
\ withmask=T\n maskfile=mymaskimage.fits elow=400 ehigh=2000\n\nAll of these\
|
| 556 |
+
\ files are produced by the task combimage after running\nany/all of mosspectra/\
|
| 557 |
+
\ mosback/ swcx/ proton comb-fovimsky-400-2000.fits\ncomb-expimsky-400-2000.fits\n\
|
| 558 |
+
comb-bkgimsky-400-2000.fits\ncomb-swcximsky-400-2000.fits\ncomb-protimsky-400-2000.fits\n\
|
| 559 |
+
comb-maskimsky-400-2000.fits (from emask, et al)\nNOTE: typically, a mask produced\
|
| 560 |
+
\ by combimage will have the name style\nas above, but if you rename your files,\
|
| 561 |
+
\ simply set withmask=T and\nmaskfile=yourmaskname to override the default\n\n\
|
| 562 |
+
[OUTPUT FILES]\nbinadapt\nIf withsmoothing=T, binadapt creates an adaptively smoothed,\
|
| 563 |
+
\ exposure\ncorrected, and background subtracted (any selected) image in SKY coords:\n\
|
| 564 |
+
\nmos1S001-adaptimsky-350-1100.fits\n\nA 900x900 Real32 image of the smoothing\
|
| 565 |
+
\ FWHM:\n\nmos1S001-sizeimsky-350-1100.fits\n\nNote: both of the above are also\
|
| 566 |
+
\ binned if withbinning=T\n\nA QDP plot file of the radial profile of the data\
|
| 567 |
+
\ for the selected\nenergy band (elow and ehigh) of the selected region:\n\nmos1S001-radfilt-350-1100.qdp\n\
|
| 568 |
+
\nA histogram of the smoothing FWHM:\n\nmos1S001-size-350-1100.qdp\n\nIf withsmoothing=F,\
|
| 569 |
+
\ only these binned, exposure corrected, and\nbackground subtracted (any selected)\
|
| 570 |
+
\ images are created:\n\nThe binned count rate uncertainty image for the selected\
|
| 571 |
+
\ energy band\n(elow and ehigh) of the selected region in SKY coordinates:\n\n\
|
| 572 |
+
mos1S001-sigimsky-350-1100.fits\n\nand the binned count rate image for the selected\
|
| 573 |
+
\ energy band (elow and\nehigh) of the selected region in sky coordinates:\n\n\
|
| 574 |
+
mos1S001-rateimsky-350-1100.fits\n\nA QDP plot file of the radial profile of the\
|
| 575 |
+
\ data for the selected\nenergy band (elow and ehigh) of the selected region:\n\
|
| 576 |
+
\nmos1S001-radfilt-350-1100.qdp\n\n[FUTURE DEVELOPMENTS] binadapt"
|
| 577 |
+
- "- This extension contains the exposed fraction of each frame per CCD\n (in\
|
| 578 |
+
\ the pn the frame time is constant, and is therefore not included\n in this\
|
| 579 |
+
\ extension).\n\n- There is one extension per CCD in the relevant mode (IMAGING\
|
| 580 |
+
\ or\n TIMING) during the exposure.\n\n- The following keywords are present\
|
| 581 |
+
\ in all cases (example values\n shown):\n\n CCDID = \
|
| 582 |
+
\ 1 / CCD Identifier\n FRMTIME = 2600 / Nominal frame\
|
| 583 |
+
\ integration time\n WINDOWX0= 1 / X coordinate of bottom\
|
| 584 |
+
\ left corner of window\n WINDOWY0= 1 / Y coordinate\
|
| 585 |
+
\ of bottom left corner of window\n WINDOWDX= 600 / Size,\
|
| 586 |
+
\ along x-axis, of window\n WINDOWDY= 600 / Size, along\
|
| 587 |
+
\ y-axis, of window\n\n- In addition, the following keywords are present in\
|
| 588 |
+
\ EPIC pn EXPOSUnn\n extensions:\n\n QUADRANT= 0\
|
| 589 |
+
\ / Quadrant Identifier\n QUADMODE= 0 / Quadrant mode\n\
|
| 590 |
+
\ CCDMODE = 0 / CCD mode\n SINGLES = \
|
| 591 |
+
\ 588287 / number of single events\n DOUBLES = \
|
| 592 |
+
\ 67309 / number of double events\n TRIPLES = 2920 / number\
|
| 593 |
+
\ of triple events\n QUADRUPL= 4607 / number of quadruple\
|
| 594 |
+
\ events\n NOTRECEV= 3958 / number of not recognized events\n\
|
| 595 |
+
\ NOTRECPA= 171641 / number of not recognized patterns\n\
|
| 596 |
+
\ MAXPAT = 263 / maximum pattern size\n MIPS\
|
| 597 |
+
\ = 3 / number of MIPs found\n RECPHOTO= \
|
| 598 |
+
\ 664123 / number of recognized photons\n ANALYSED= \
|
| 599 |
+
\ 924737 / number of analysed events\n\n- For both imaging and timing mode\
|
| 600 |
+
\ MOS event lists this extension\n contains the following columns:\n\n \
|
| 601 |
+
\ Name Type Description\n --------- ------------- -------------------------------------------------\n\
|
| 602 |
+
\ TIME 8-byte REAL Frame start time (seconds since reference time)\n\
|
| 603 |
+
\ TIMEDEL 4-byte REAL Duration of frame time (seconds)\n FRACEXP\
|
| 604 |
+
\ 4-byte REAL Fractional exposure of frame\n\n- For both imaging and timing\
|
| 605 |
+
\ mode pn event lists this extension\n contains the following columns:\n\n\
|
| 606 |
+
\ Name Type Description\n --------- ------------- -------------------------------------------------\n\
|
| 607 |
+
\ TIME 8-byte REAL Frame start time (seconds since reference time)\n\
|
| 608 |
+
\ FRACEXP 4-byte REAL Fractional exposure of frame\n"
|
| 609 |
+
- source_sentence: In nearly all cases, how many source and background region spectra
|
| 610 |
+
are supplied for the RGS?
|
| 611 |
+
sentences:
|
| 612 |
+
- "Parameter dialogs\n\nEach task has an associated parameter dialog window. These\
|
| 613 |
+
\ individual\ntask GUIs are used to enter the values of the different task parameters\n\
|
| 614 |
+
and to run the task. The parameter dialog windows are opened by double-clicking any\nof the\
|
| 615 |
+
\ tasks listed under the \"task\" column.\n\nThe following parameter dialog window\
|
| 616 |
+
\ (figure [fig:gui:parameterdialog])\nillustrates some of the basic parameter\
|
| 617 |
+
\ types. Each parameter type has a\ncorresponding widget type. For example, a\
|
| 618 |
+
\ boolean parameter is entered\nusing a check-box (withexposure); a choice parameter\
|
| 619 |
+
\ is entered by using\na pop-up menu that allows to select from a set of options\
|
| 620 |
+
\ (sampling); a\nfilename parameter is entered as a string (imagesets), with the\
|
| 621 |
+
\ option\nof popping up a file browser by pressing the button with the folder\
|
| 622 |
+
\ icon\n(see § [gui:browser]).\n\nIf the task has a large number of parameters,\
|
| 623 |
+
\ the dialog window may have\nscroll-bars. The scroll bars will disappear if the\
|
| 624 |
+
\ size of the dialog\nwindow is increased sufficiently.\n\nFurther information\
|
| 625 |
+
\ on a parameter can be obtained by placing the cursor\nover the parameter widget.\
|
| 626 |
+
\ This causes a yellow tool-tip to pop-up if\nthe parameter file defines a prompt\
|
| 627 |
+
\ field for the parameter.\n\nThe parameter dialog has the following buttons:\n\
|
| 628 |
+
\n ---------- ------------------------------------------------------------------------\n\
|
| 629 |
+
\ Run Run the task with the selected parameters\n Cancel Close the\
|
| 630 |
+
\ parameter dialog window without running the task or changing\n the\
|
| 631 |
+
\ parameters\n Save Saves the value of the parameters\n Defaults Reset\
|
| 632 |
+
\ the parameters to their default values\n ---------- ------------------------------------------------------------------------\n\
|
| 633 |
+
\nWhen a task has been run, the parameter values are retained until the\nnext\
|
| 634 |
+
\ time that the task is run (within the same session). The Defaults\nbutton may\
|
| 635 |
+
\ be used to reset the parameters of a task to their default\nvalues. The \"Task\"\
|
| 636 |
+
\ menu in the main SAS GUI provides an option \"Revert\nto defaults\" to reset\
|
| 637 |
+
\ all the parameters of all the tasks to their\ndefaults.\n"
|
| 638 |
+
- "- This extension gives the good time intervals for the event list.\n\n- There\
|
| 639 |
+
\ is one extension per CCD in the relevant mode (IMAGING or\n TIMING) during\
|
| 640 |
+
\ the exposure.\n\n- The following keywords are present:\n\n HDUCLASS=\
|
| 641 |
+
\ 'OGIP ' / format conforms to OGIP standard\n HDUCLAS1= 'GTI\
|
| 642 |
+
\ ' / table contains Good Time Intervals\n HDUCLAS2= 'STANDARD'\
|
| 643 |
+
\ / standard Good Time Interval table\n\n- This extension contains\
|
| 644 |
+
\ the following columns:\n\n Name Type Description\n -------\
|
| 645 |
+
\ ------------- --------------------------------\n START 8-byte REAL \
|
| 646 |
+
\ seconds (since reference time)\n STOP 8-byte REAL seconds (since reference\
|
| 647 |
+
\ time)\n"
|
| 648 |
+
- 'RGS spectral products
|
| 649 |
+
|
| 650 |
+
|
| 651 |
+
This section describes the spectral data products to be generated from
|
| 652 |
+
|
| 653 |
+
pointed observations.
|
| 654 |
+
|
| 655 |
+
|
| 656 |
+
Source and background region spectra and a background-subtracted source
|
| 657 |
+
|
| 658 |
+
spectrum are supplied for the brightest point sources in the RGS (in
|
| 659 |
+
|
| 660 |
+
nearly all cases this is just one source). Spectral response matrices
|
| 661 |
+
|
| 662 |
+
are also supplied.
|
| 663 |
+
|
| 664 |
+
'
|
| 665 |
+
pipeline_tag: sentence-similarity
|
| 666 |
+
library_name: sentence-transformers
|
| 667 |
+
---
|
| 668 |
+
|
| 669 |
+
# SentenceTransformer based on nomic-ai/modernbert-embed-base
|
| 670 |
+
|
| 671 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [nomic-ai/modernbert-embed-base](https://huggingface.co/nomic-ai/modernbert-embed-base). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 672 |
+
|
| 673 |
+
## Model Details
|
| 674 |
+
|
| 675 |
+
### Model Description
|
| 676 |
+
- **Model Type:** Sentence Transformer
|
| 677 |
+
- **Base model:** [nomic-ai/modernbert-embed-base](https://huggingface.co/nomic-ai/modernbert-embed-base) <!-- at revision d556a88e332558790b210f7bdbe87da2fa94a8d8 -->
|
| 678 |
+
- **Maximum Sequence Length:** 8192 tokens
|
| 679 |
+
- **Output Dimensionality:** 768 dimensions
|
| 680 |
+
- **Similarity Function:** Cosine Similarity
|
| 681 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 682 |
+
<!-- - **Language:** Unknown -->
|
| 683 |
+
<!-- - **License:** Unknown -->
|
| 684 |
+
|
| 685 |
+
### Model Sources
|
| 686 |
+
|
| 687 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 688 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 689 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 690 |
+
|
| 691 |
+
### Full Model Architecture
|
| 692 |
+
|
| 693 |
+
```
|
| 694 |
+
SentenceTransformer(
|
| 695 |
+
(0): Transformer({'max_seq_length': 8192, 'do_lower_case': False}) with Transformer model: ModernBertModel
|
| 696 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 697 |
+
(2): Normalize()
|
| 698 |
+
)
|
| 699 |
+
```
|
| 700 |
+
|
| 701 |
+
## Usage
|
| 702 |
+
|
| 703 |
+
### Direct Usage (Sentence Transformers)
|
| 704 |
+
|
| 705 |
+
First install the Sentence Transformers library:
|
| 706 |
+
|
| 707 |
+
```bash
|
| 708 |
+
pip install -U sentence-transformers
|
| 709 |
+
```
|
| 710 |
+
|
| 711 |
+
Then you can load this model and run inference.
|
| 712 |
+
```python
|
| 713 |
+
from sentence_transformers import SentenceTransformer
|
| 714 |
+
|
| 715 |
+
# Download from the 🤗 Hub
|
| 716 |
+
model = SentenceTransformer("lochhonest/modernbert-finetuned-for-sas")
|
| 717 |
+
# Run inference
|
| 718 |
+
sentences = [
|
| 719 |
+
'In nearly all cases, how many source and background region spectra are supplied for the RGS?',
|
| 720 |
+
'RGS spectral products\n\nThis section describes the spectral data products to be generated from\npointed observations.\n\nSource and background region spectra and a background-subtracted source\nspectrum are supplied for the brightest point sources in the RGS (in\nnearly all cases this is just one source). Spectral response matrices\nare also supplied.\n',
|
| 721 |
+
"- This extension gives the good time intervals for the event list.\n\n- There is one extension per CCD in the relevant mode (IMAGING or\n TIMING) during the exposure.\n\n- The following keywords are present:\n\n HDUCLASS= 'OGIP ' / format conforms to OGIP standard\n HDUCLAS1= 'GTI ' / table contains Good Time Intervals\n HDUCLAS2= 'STANDARD' / standard Good Time Interval table\n\n- This extension contains the following columns:\n\n Name Type Description\n ------- ------------- --------------------------------\n START 8-byte REAL seconds (since reference time)\n STOP 8-byte REAL seconds (since reference time)\n",
|
| 722 |
+
]
|
| 723 |
+
embeddings = model.encode(sentences)
|
| 724 |
+
print(embeddings.shape)
|
| 725 |
+
# (3, 768)
|
| 726 |
+
|
| 727 |
+
# Get the similarity scores for the embeddings
|
| 728 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 729 |
+
print(similarities.shape)
|
| 730 |
+
# torch.Size([3, 3])
|
| 731 |
+
```
|
| 732 |
+
|
| 733 |
+
<!--
|
| 734 |
+
### Direct Usage (Transformers)
|
| 735 |
+
|
| 736 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 737 |
+
|
| 738 |
+
</details>
|
| 739 |
+
-->
|
| 740 |
+
|
| 741 |
+
<!--
|
| 742 |
+
### Downstream Usage (Sentence Transformers)
|
| 743 |
+
|
| 744 |
+
You can finetune this model on your own dataset.
|
| 745 |
+
|
| 746 |
+
<details><summary>Click to expand</summary>
|
| 747 |
+
|
| 748 |
+
</details>
|
| 749 |
+
-->
|
| 750 |
+
|
| 751 |
+
<!--
|
| 752 |
+
### Out-of-Scope Use
|
| 753 |
+
|
| 754 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 755 |
+
-->
|
| 756 |
+
|
| 757 |
+
<!--
|
| 758 |
+
## Bias, Risks and Limitations
|
| 759 |
+
|
| 760 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 761 |
+
-->
|
| 762 |
+
|
| 763 |
+
<!--
|
| 764 |
+
### Recommendations
|
| 765 |
+
|
| 766 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 767 |
+
-->
|
| 768 |
+
|
| 769 |
+
## Training Details
|
| 770 |
+
|
| 771 |
+
### Training Dataset
|
| 772 |
+
|
| 773 |
+
#### Unnamed Dataset
|
| 774 |
+
|
| 775 |
+
* Size: 3,619 training samples
|
| 776 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
| 777 |
+
* Approximate statistics based on the first 1000 samples:
|
| 778 |
+
| | anchor | positive |
|
| 779 |
+
|:--------|:---------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 780 |
+
| type | string | string |
|
| 781 |
+
| details | <ul><li>min: 2 tokens</li><li>mean: 15.7 tokens</li><li>max: 38 tokens</li></ul> | <ul><li>min: 2 tokens</li><li>mean: 411.84 tokens</li><li>max: 3755 tokens</li></ul> |
|
| 782 |
+
* Samples:
|
| 783 |
+
| anchor | positive |
|
| 784 |
+
|:---------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 785 |
+
| <code>What is the purpose of the document described in the preface?</code> | <code>Preface<br><br>This is the reference document describing the individual XMM-Newton<br>Survey Science Centre (SSC) data product files. It is intended to be of<br>use to software developers, archive administrators and to scientists<br>analysing XMM-Newton data. Please see the SSC data products Interface<br>Control Document (XMM-SOC-ICD-0006-SSC, issue 4.0) for a description of<br>the product group files and other related files that are sent to the<br>SOC.<br><br>This version (4.3) includes changes related to the upgrade to SAS16.0 in<br>the processing pipeline originally developped in 2012 to uniformly<br>process all the XMM data at that time, from which the 3XMM catalogue was<br>derived. Revisions and additions since version 4.2 are identified by<br>change bars at the right of each page.<br><br>This document will continue to evolve through subsequent issues, under<br>indirect control from the SAS and SSC configuration control boards.<br><br>This document is the result of the work of many people. Contributors<br>have included:<br><br>Hermann Brunner, G...</code> |
|
| 786 |
+
| <code>What version of the document is described in the preface?</code> | <code>Preface<br><br>This is the reference document describing the individual XMM-Newton<br>Survey Science Centre (SSC) data product files. It is intended to be of<br>use to software developers, archive administrators and to scientists<br>analysing XMM-Newton data. Please see the SSC data products Interface<br>Control Document (XMM-SOC-ICD-0006-SSC, issue 4.0) for a description of<br>the product group files and other related files that are sent to the<br>SOC.<br><br>This version (4.3) includes changes related to the upgrade to SAS16.0 in<br>the processing pipeline originally developped in 2012 to uniformly<br>process all the XMM data at that time, from which the 3XMM catalogue was<br>derived. Revisions and additions since version 4.2 are identified by<br>change bars at the right of each page.<br><br>This document will continue to evolve through subsequent issues, under<br>indirect control from the SAS and SSC configuration control boards.<br><br>This document is the result of the work of many people. Contributors<br>have included:<br><br>Hermann Brunner, G...</code> |
|
| 787 |
+
| <code>What is the main change in version 4.3 of the document?</code> | <code>Preface<br><br>This is the reference document describing the individual XMM-Newton<br>Survey Science Centre (SSC) data product files. It is intended to be of<br>use to software developers, archive administrators and to scientists<br>analysing XMM-Newton data. Please see the SSC data products Interface<br>Control Document (XMM-SOC-ICD-0006-SSC, issue 4.0) for a description of<br>the product group files and other related files that are sent to the<br>SOC.<br><br>This version (4.3) includes changes related to the upgrade to SAS16.0 in<br>the processing pipeline originally developped in 2012 to uniformly<br>process all the XMM data at that time, from which the 3XMM catalogue was<br>derived. Revisions and additions since version 4.2 are identified by<br>change bars at the right of each page.<br><br>This document will continue to evolve through subsequent issues, under<br>indirect control from the SAS and SSC configuration control boards.<br><br>This document is the result of the work of many people. Contributors<br>have included:<br><br>Hermann Brunner, G...</code> |
|
| 788 |
+
* Loss: [<code>CachedMultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedmultiplenegativesrankingloss) with these parameters:
|
| 789 |
+
```json
|
| 790 |
+
{
|
| 791 |
+
"scale": 20.0,
|
| 792 |
+
"similarity_fct": "get_similarity"
|
| 793 |
+
}
|
| 794 |
+
```
|
| 795 |
+
|
| 796 |
+
### Evaluation Dataset
|
| 797 |
+
|
| 798 |
+
#### Unnamed Dataset
|
| 799 |
+
|
| 800 |
+
* Size: 30 evaluation samples
|
| 801 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
| 802 |
+
* Approximate statistics based on the first 30 samples:
|
| 803 |
+
| | anchor | positive |
|
| 804 |
+
|:--------|:---------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 805 |
+
| type | string | string |
|
| 806 |
+
| details | <ul><li>min: 8 tokens</li><li>mean: 16.0 tokens</li><li>max: 24 tokens</li></ul> | <ul><li>min: 6 tokens</li><li>mean: 642.47 tokens</li><li>max: 6152 tokens</li></ul> |
|
| 807 |
+
* Samples:
|
| 808 |
+
| anchor | positive |
|
| 809 |
+
|:-------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 810 |
+
| <code>What is the purpose of the PPS cross-correlation products?</code> | <code>General cross-correlation products<br><br>These PPS cross-correlation products list the names of all catalogues<br>searched (both around each EPIC position and in the whole EPIC field)<br>and describe the format of their output.<br></code> |
|
| 811 |
+
| <code>What are the task parameters of rgssources?</code> | <code>rgssources<br>## Parameters<br><br> \label{rgssources:description:parameters}<br> <br> **filemode} {modify** (Optional): no<br>(Type: <br> Controls whether the task opens a previous source list for editing or creates a new one.<br> }<br> \optparm{changeprime} {no} {boolean} {yes|no, Default: string} {modify|create, Range: <br> Only active in `filemode`=`modify'. Unless this parameter is set, the previous prime source index number is retained.<br> }<br> \optparm{changeattitude) {boolean} {yes|no}{<br> Only active in `filemode`=`modify'. Unless this parameter is set, the previous attitude (stored in the header) is retained.<br> }<br> **srclist} {rgsset.ds** (Mandatory): yes<br>(Type: <br> The name of the rgs source list. If `filemode`=`create', the output is written to this file. If there is an existing file of this name, it will be overwritten unless SAS\_CLOBBER is unset. If `filemode`=`modify', the task looks for an existing source list of this name and modifies it.<br> }<br> **instexpid} {} {string} {, Default:...</code> |
|
| 812 |
+
| <code>How many stars were used in the U-filter analysis for the G153 pointing to create the distortion map?</code> | <code>OM distortion<br><br>The OM<br>(http://www.cosmos.esa.int/web/xmm-newton/technical-details-om) optics,<br>filters and (primarily) the detector system result in a certain amount<br>of image distortion. This effect can be corrected with a “distortion<br>map”, by comparing the expected position with the measured position for<br>a large number of stars in the OM<br>(http://www.cosmos.esa.int/web/xmm-newton/technical-details-om) field of<br>view. A U-filter analysis has been performed on the G153 pointing with<br>813 stars. The effect of applying this correction is shown in<br>Fig. [fig:uhb:distmap]. A positional r.m.s. accuracy of 0.5 − 1.5 arcsec<br>is obtained. The distortion map has been entered into the appropriate<br>CCF file and is used in http://www.cosmos.esa.int/web/xmm-newton/sas<br>(http://www.cosmos.esa.int/web/xmm-newton/sas).<br></code> |
|
| 813 |
+
* Loss: [<code>CachedMultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedmultiplenegativesrankingloss) with these parameters:
|
| 814 |
+
```json
|
| 815 |
+
{
|
| 816 |
+
"scale": 20.0,
|
| 817 |
+
"similarity_fct": "get_similarity"
|
| 818 |
+
}
|
| 819 |
+
```
|
| 820 |
+
|
| 821 |
+
### Training Hyperparameters
|
| 822 |
+
#### Non-Default Hyperparameters
|
| 823 |
+
|
| 824 |
+
- `eval_strategy`: steps
|
| 825 |
+
- `per_device_train_batch_size`: 16
|
| 826 |
+
- `per_device_eval_batch_size`: 4
|
| 827 |
+
- `num_train_epochs`: 2
|
| 828 |
+
- `lr_scheduler_type`: constant
|
| 829 |
+
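- `warmup_ratio`: 0.1 (note: not applied in practice, since the `constant` scheduler has no warmup phase; `constant_with_warmup` would be required for warmup to take effect)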
|
| 830 |
+
- `bf16`: True
|
| 831 |
+
- `batch_sampler`: no_duplicates
|
| 832 |
+
|
| 833 |
+
#### All Hyperparameters
|
| 834 |
+
<details><summary>Click to expand</summary>
|
| 835 |
+
|
| 836 |
+
- `overwrite_output_dir`: False
|
| 837 |
+
- `do_predict`: False
|
| 838 |
+
- `eval_strategy`: steps
|
| 839 |
+
- `prediction_loss_only`: True
|
| 840 |
+
- `per_device_train_batch_size`: 16
|
| 841 |
+
- `per_device_eval_batch_size`: 4
|
| 842 |
+
- `per_gpu_train_batch_size`: None
|
| 843 |
+
- `per_gpu_eval_batch_size`: None
|
| 844 |
+
- `gradient_accumulation_steps`: 1
|
| 845 |
+
- `eval_accumulation_steps`: None
|
| 846 |
+
- `torch_empty_cache_steps`: None
|
| 847 |
+
- `learning_rate`: 5e-05
|
| 848 |
+
- `weight_decay`: 0.0
|
| 849 |
+
- `adam_beta1`: 0.9
|
| 850 |
+
- `adam_beta2`: 0.999
|
| 851 |
+
- `adam_epsilon`: 1e-08
|
| 852 |
+
- `max_grad_norm`: 1.0
|
| 853 |
+
- `num_train_epochs`: 2
|
| 854 |
+
- `max_steps`: -1
|
| 855 |
+
- `lr_scheduler_type`: constant
|
| 856 |
+
- `lr_scheduler_kwargs`: {}
|
| 857 |
+
- `warmup_ratio`: 0.1
|
| 858 |
+
- `warmup_steps`: 0
|
| 859 |
+
- `log_level`: passive
|
| 860 |
+
- `log_level_replica`: warning
|
| 861 |
+
- `log_on_each_node`: True
|
| 862 |
+
- `logging_nan_inf_filter`: True
|
| 863 |
+
- `save_safetensors`: True
|
| 864 |
+
- `save_on_each_node`: False
|
| 865 |
+
- `save_only_model`: False
|
| 866 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 867 |
+
- `no_cuda`: False
|
| 868 |
+
- `use_cpu`: False
|
| 869 |
+
- `use_mps_device`: False
|
| 870 |
+
- `seed`: 42
|
| 871 |
+
- `data_seed`: None
|
| 872 |
+
- `jit_mode_eval`: False
|
| 873 |
+
- `use_ipex`: False
|
| 874 |
+
- `bf16`: True
|
| 875 |
+
- `fp16`: False
|
| 876 |
+
- `fp16_opt_level`: O1
|
| 877 |
+
- `half_precision_backend`: auto
|
| 878 |
+
- `bf16_full_eval`: False
|
| 879 |
+
- `fp16_full_eval`: False
|
| 880 |
+
- `tf32`: None
|
| 881 |
+
- `local_rank`: 0
|
| 882 |
+
- `ddp_backend`: None
|
| 883 |
+
- `tpu_num_cores`: None
|
| 884 |
+
- `tpu_metrics_debug`: False
|
| 885 |
+
- `debug`: []
|
| 886 |
+
- `dataloader_drop_last`: False
|
| 887 |
+
- `dataloader_num_workers`: 0
|
| 888 |
+
- `dataloader_prefetch_factor`: None
|
| 889 |
+
- `past_index`: -1
|
| 890 |
+
- `disable_tqdm`: False
|
| 891 |
+
- `remove_unused_columns`: True
|
| 892 |
+
- `label_names`: None
|
| 893 |
+
- `load_best_model_at_end`: False
|
| 894 |
+
- `ignore_data_skip`: False
|
| 895 |
+
- `fsdp`: []
|
| 896 |
+
- `fsdp_min_num_params`: 0
|
| 897 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 898 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 899 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 900 |
+
- `deepspeed`: None
|
| 901 |
+
- `label_smoothing_factor`: 0.0
|
| 902 |
+
- `optim`: adamw_torch
|
| 903 |
+
- `optim_args`: None
|
| 904 |
+
- `adafactor`: False
|
| 905 |
+
- `group_by_length`: False
|
| 906 |
+
- `length_column_name`: length
|
| 907 |
+
- `ddp_find_unused_parameters`: None
|
| 908 |
+
- `ddp_bucket_cap_mb`: None
|
| 909 |
+
- `ddp_broadcast_buffers`: False
|
| 910 |
+
- `dataloader_pin_memory`: True
|
| 911 |
+
- `dataloader_persistent_workers`: False
|
| 912 |
+
- `skip_memory_metrics`: True
|
| 913 |
+
- `use_legacy_prediction_loop`: False
|
| 914 |
+
- `push_to_hub`: False
|
| 915 |
+
- `resume_from_checkpoint`: None
|
| 916 |
+
- `hub_model_id`: None
|
| 917 |
+
- `hub_strategy`: every_save
|
| 918 |
+
- `hub_private_repo`: None
|
| 919 |
+
- `hub_always_push`: False
|
| 920 |
+
- `gradient_checkpointing`: False
|
| 921 |
+
- `gradient_checkpointing_kwargs`: None
|
| 922 |
+
- `include_inputs_for_metrics`: False
|
| 923 |
+
- `include_for_metrics`: []
|
| 924 |
+
- `eval_do_concat_batches`: True
|
| 925 |
+
- `fp16_backend`: auto
|
| 926 |
+
- `push_to_hub_model_id`: None
|
| 927 |
+
- `push_to_hub_organization`: None
|
| 928 |
+
- `mp_parameters`:
|
| 929 |
+
- `auto_find_batch_size`: False
|
| 930 |
+
- `full_determinism`: False
|
| 931 |
+
- `torchdynamo`: None
|
| 932 |
+
- `ray_scope`: last
|
| 933 |
+
- `ddp_timeout`: 1800
|
| 934 |
+
- `torch_compile`: False
|
| 935 |
+
- `torch_compile_backend`: None
|
| 936 |
+
- `torch_compile_mode`: None
|
| 937 |
+
- `dispatch_batches`: None
|
| 938 |
+
- `split_batches`: None
|
| 939 |
+
- `include_tokens_per_second`: False
|
| 940 |
+
- `include_num_input_tokens_seen`: False
|
| 941 |
+
- `neftune_noise_alpha`: None
|
| 942 |
+
- `optim_target_modules`: None
|
| 943 |
+
- `batch_eval_metrics`: False
|
| 944 |
+
- `eval_on_start`: False
|
| 945 |
+
- `use_liger_kernel`: False
|
| 946 |
+
- `eval_use_gather_object`: False
|
| 947 |
+
- `average_tokens_across_devices`: False
|
| 948 |
+
- `prompts`: None
|
| 949 |
+
- `batch_sampler`: no_duplicates
|
| 950 |
+
- `multi_dataset_batch_sampler`: proportional
|
| 951 |
+
|
| 952 |
+
</details>
|
| 953 |
+
|
| 954 |
+
### Training Logs
|
| 955 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
| 956 |
+
|:------:|:----:|:-------------:|:---------------:|
|
| 957 |
+
| 0.2203 | 50 | 0.2209 | - |
|
| 958 |
+
| 0.4405 | 100 | 0.1635 | 0.0402 |
|
| 959 |
+
| 0.6608 | 150 | 0.1759 | - |
|
| 960 |
+
| 0.8811 | 200 | 0.1674 | 0.1307 |
|
| 961 |
+
| 1.1013 | 250 | 0.1134 | - |
|
| 962 |
+
| 1.3216 | 300 | 0.0809 | 0.0441 |
|
| 963 |
+
| 1.5419 | 350 | 0.0571 | - |
|
| 964 |
+
| 1.7621 | 400 | 0.077 | 0.0268 |
|
| 965 |
+
| 1.9824 | 450 | 0.0557 | - |
|
| 966 |
+
|
| 967 |
+
|
| 968 |
+
### Framework Versions
|
| 969 |
+
- Python: 3.10.14
|
| 970 |
+
- Sentence Transformers: 3.4.1
|
| 971 |
+
- Transformers: 4.48.2
|
| 972 |
+
- PyTorch: 2.6.0+cu124
|
| 973 |
+
- Accelerate: 1.3.0
|
| 974 |
+
- Datasets: 3.3.1
|
| 975 |
+
- Tokenizers: 0.21.0
|
| 976 |
+
|
| 977 |
+
## Citation
|
| 978 |
+
|
| 979 |
+
### BibTeX
|
| 980 |
+
|
| 981 |
+
#### Sentence Transformers
|
| 982 |
+
```bibtex
|
| 983 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 984 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 985 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 986 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 987 |
+
month = "11",
|
| 988 |
+
year = "2019",
|
| 989 |
+
publisher = "Association for Computational Linguistics",
|
| 990 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 991 |
+
}
|
| 992 |
+
```
|
| 993 |
+
|
| 994 |
+
#### CachedMultipleNegativesRankingLoss
|
| 995 |
+
```bibtex
|
| 996 |
+
@misc{gao2021scaling,
|
| 997 |
+
title={Scaling Deep Contrastive Learning Batch Size under Memory Limited Setup},
|
| 998 |
+
author={Luyu Gao and Yunyi Zhang and Jiawei Han and Jamie Callan},
|
| 999 |
+
year={2021},
|
| 1000 |
+
eprint={2101.06983},
|
| 1001 |
+
archivePrefix={arXiv},
|
| 1002 |
+
primaryClass={cs.LG}
|
| 1003 |
+
}
|
| 1004 |
+
```
|
| 1005 |
+
|
| 1006 |
+
<!--
|
| 1007 |
+
## Glossary
|
| 1008 |
+
|
| 1009 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 1010 |
+
-->
|
| 1011 |
+
|
| 1012 |
+
<!--
|
| 1013 |
+
## Model Card Authors
|
| 1014 |
+
|
| 1015 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 1016 |
+
-->
|
| 1017 |
+
|
| 1018 |
+
<!--
|
| 1019 |
+
## Model Card Contact
|
| 1020 |
+
|
| 1021 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 1022 |
+
-->
|
config.json
ADDED
|
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "nomic-ai/modernbert-embed-base",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"ModernBertModel"
|
| 5 |
+
],
|
| 6 |
+
"attention_bias": false,
|
| 7 |
+
"attention_dropout": 0.0,
|
| 8 |
+
"bos_token_id": 50281,
|
| 9 |
+
"classifier_activation": "gelu",
|
| 10 |
+
"classifier_bias": false,
|
| 11 |
+
"classifier_dropout": 0.0,
|
| 12 |
+
"classifier_pooling": "mean",
|
| 13 |
+
"cls_token_id": 50281,
|
| 14 |
+
"decoder_bias": true,
|
| 15 |
+
"deterministic_flash_attn": false,
|
| 16 |
+
"embedding_dropout": 0.0,
|
| 17 |
+
"eos_token_id": 50282,
|
| 18 |
+
"global_attn_every_n_layers": 3,
|
| 19 |
+
"global_rope_theta": 160000.0,
|
| 20 |
+
"gradient_checkpointing": false,
|
| 21 |
+
"hidden_activation": "gelu",
|
| 22 |
+
"hidden_size": 768,
|
| 23 |
+
"initializer_cutoff_factor": 2.0,
|
| 24 |
+
"initializer_range": 0.02,
|
| 25 |
+
"intermediate_size": 1152,
|
| 26 |
+
"layer_norm_eps": 1e-05,
|
| 27 |
+
"local_attention": 128,
|
| 28 |
+
"local_rope_theta": 10000.0,
|
| 29 |
+
"max_position_embeddings": 8192,
|
| 30 |
+
"mlp_bias": false,
|
| 31 |
+
"mlp_dropout": 0.0,
|
| 32 |
+
"model_type": "modernbert",
|
| 33 |
+
"norm_bias": false,
|
| 34 |
+
"norm_eps": 1e-05,
|
| 35 |
+
"num_attention_heads": 12,
|
| 36 |
+
"num_hidden_layers": 22,
|
| 37 |
+
"pad_token_id": 50283,
|
| 38 |
+
"position_embedding_type": "absolute",
|
| 39 |
+
"reference_compile": true,
|
| 40 |
+
"repad_logits_with_grad": false,
|
| 41 |
+
"sep_token_id": 50282,
|
| 42 |
+
"sparse_pred_ignore_index": -100,
|
| 43 |
+
"sparse_prediction": false,
|
| 44 |
+
"torch_dtype": "float32",
|
| 45 |
+
"transformers_version": "4.48.2",
|
| 46 |
+
"vocab_size": 50368
|
| 47 |
+
}
|
config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "3.4.1",
|
| 4 |
+
"transformers": "4.48.2",
|
| 5 |
+
"pytorch": "2.6.0+cu124"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b9a52371c20459c83ab3b9e4dcba56b63c2b89ee64f564bceda45edf14a5516
|
| 3 |
+
size 596070136
|
modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 8192,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": true,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,945 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "|||IP_ADDRESS|||",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": true,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": false
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<|padding|>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"50254": {
|
| 20 |
+
"content": " ",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": true,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": false
|
| 26 |
+
},
|
| 27 |
+
"50255": {
|
| 28 |
+
"content": " ",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": true,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": false
|
| 34 |
+
},
|
| 35 |
+
"50256": {
|
| 36 |
+
"content": " ",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": true,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": false
|
| 42 |
+
},
|
| 43 |
+
"50257": {
|
| 44 |
+
"content": " ",
|
| 45 |
+
"lstrip": false,
|
| 46 |
+
"normalized": true,
|
| 47 |
+
"rstrip": false,
|
| 48 |
+
"single_word": false,
|
| 49 |
+
"special": false
|
| 50 |
+
},
|
| 51 |
+
"50258": {
|
| 52 |
+
"content": " ",
|
| 53 |
+
"lstrip": false,
|
| 54 |
+
"normalized": true,
|
| 55 |
+
"rstrip": false,
|
| 56 |
+
"single_word": false,
|
| 57 |
+
"special": false
|
| 58 |
+
},
|
| 59 |
+
"50259": {
|
| 60 |
+
"content": " ",
|
| 61 |
+
"lstrip": false,
|
| 62 |
+
"normalized": true,
|
| 63 |
+
"rstrip": false,
|
| 64 |
+
"single_word": false,
|
| 65 |
+
"special": false
|
| 66 |
+
},
|
| 67 |
+
"50260": {
|
| 68 |
+
"content": " ",
|
| 69 |
+
"lstrip": false,
|
| 70 |
+
"normalized": true,
|
| 71 |
+
"rstrip": false,
|
| 72 |
+
"single_word": false,
|
| 73 |
+
"special": false
|
| 74 |
+
},
|
| 75 |
+
"50261": {
|
| 76 |
+
"content": " ",
|
| 77 |
+
"lstrip": false,
|
| 78 |
+
"normalized": true,
|
| 79 |
+
"rstrip": false,
|
| 80 |
+
"single_word": false,
|
| 81 |
+
"special": false
|
| 82 |
+
},
|
| 83 |
+
"50262": {
|
| 84 |
+
"content": " ",
|
| 85 |
+
"lstrip": false,
|
| 86 |
+
"normalized": true,
|
| 87 |
+
"rstrip": false,
|
| 88 |
+
"single_word": false,
|
| 89 |
+
"special": false
|
| 90 |
+
},
|
| 91 |
+
"50263": {
|
| 92 |
+
"content": " ",
|
| 93 |
+
"lstrip": false,
|
| 94 |
+
"normalized": true,
|
| 95 |
+
"rstrip": false,
|
| 96 |
+
"single_word": false,
|
| 97 |
+
"special": false
|
| 98 |
+
},
|
| 99 |
+
"50264": {
|
| 100 |
+
"content": " ",
|
| 101 |
+
"lstrip": false,
|
| 102 |
+
"normalized": true,
|
| 103 |
+
"rstrip": false,
|
| 104 |
+
"single_word": false,
|
| 105 |
+
"special": false
|
| 106 |
+
},
|
| 107 |
+
"50265": {
|
| 108 |
+
"content": " ",
|
| 109 |
+
"lstrip": false,
|
| 110 |
+
"normalized": true,
|
| 111 |
+
"rstrip": false,
|
| 112 |
+
"single_word": false,
|
| 113 |
+
"special": false
|
| 114 |
+
},
|
| 115 |
+
"50266": {
|
| 116 |
+
"content": " ",
|
| 117 |
+
"lstrip": false,
|
| 118 |
+
"normalized": true,
|
| 119 |
+
"rstrip": false,
|
| 120 |
+
"single_word": false,
|
| 121 |
+
"special": false
|
| 122 |
+
},
|
| 123 |
+
"50267": {
|
| 124 |
+
"content": " ",
|
| 125 |
+
"lstrip": false,
|
| 126 |
+
"normalized": true,
|
| 127 |
+
"rstrip": false,
|
| 128 |
+
"single_word": false,
|
| 129 |
+
"special": false
|
| 130 |
+
},
|
| 131 |
+
"50268": {
|
| 132 |
+
"content": " ",
|
| 133 |
+
"lstrip": false,
|
| 134 |
+
"normalized": true,
|
| 135 |
+
"rstrip": false,
|
| 136 |
+
"single_word": false,
|
| 137 |
+
"special": false
|
| 138 |
+
},
|
| 139 |
+
"50269": {
|
| 140 |
+
"content": " ",
|
| 141 |
+
"lstrip": false,
|
| 142 |
+
"normalized": true,
|
| 143 |
+
"rstrip": false,
|
| 144 |
+
"single_word": false,
|
| 145 |
+
"special": false
|
| 146 |
+
},
|
| 147 |
+
"50270": {
|
| 148 |
+
"content": " ",
|
| 149 |
+
"lstrip": false,
|
| 150 |
+
"normalized": true,
|
| 151 |
+
"rstrip": false,
|
| 152 |
+
"single_word": false,
|
| 153 |
+
"special": false
|
| 154 |
+
},
|
| 155 |
+
"50271": {
|
| 156 |
+
"content": " ",
|
| 157 |
+
"lstrip": false,
|
| 158 |
+
"normalized": true,
|
| 159 |
+
"rstrip": false,
|
| 160 |
+
"single_word": false,
|
| 161 |
+
"special": false
|
| 162 |
+
},
|
| 163 |
+
"50272": {
|
| 164 |
+
"content": " ",
|
| 165 |
+
"lstrip": false,
|
| 166 |
+
"normalized": true,
|
| 167 |
+
"rstrip": false,
|
| 168 |
+
"single_word": false,
|
| 169 |
+
"special": false
|
| 170 |
+
},
|
| 171 |
+
"50273": {
|
| 172 |
+
"content": " ",
|
| 173 |
+
"lstrip": false,
|
| 174 |
+
"normalized": true,
|
| 175 |
+
"rstrip": false,
|
| 176 |
+
"single_word": false,
|
| 177 |
+
"special": false
|
| 178 |
+
},
|
| 179 |
+
"50274": {
|
| 180 |
+
"content": " ",
|
| 181 |
+
"lstrip": false,
|
| 182 |
+
"normalized": true,
|
| 183 |
+
"rstrip": false,
|
| 184 |
+
"single_word": false,
|
| 185 |
+
"special": false
|
| 186 |
+
},
|
| 187 |
+
"50275": {
|
| 188 |
+
"content": " ",
|
| 189 |
+
"lstrip": false,
|
| 190 |
+
"normalized": true,
|
| 191 |
+
"rstrip": false,
|
| 192 |
+
"single_word": false,
|
| 193 |
+
"special": false
|
| 194 |
+
},
|
| 195 |
+
"50276": {
|
| 196 |
+
"content": " ",
|
| 197 |
+
"lstrip": false,
|
| 198 |
+
"normalized": true,
|
| 199 |
+
"rstrip": false,
|
| 200 |
+
"single_word": false,
|
| 201 |
+
"special": false
|
| 202 |
+
},
|
| 203 |
+
"50277": {
|
| 204 |
+
"content": "|||EMAIL_ADDRESS|||",
|
| 205 |
+
"lstrip": false,
|
| 206 |
+
"normalized": true,
|
| 207 |
+
"rstrip": false,
|
| 208 |
+
"single_word": false,
|
| 209 |
+
"special": false
|
| 210 |
+
},
|
| 211 |
+
"50278": {
|
| 212 |
+
"content": "|||PHONE_NUMBER|||",
|
| 213 |
+
"lstrip": false,
|
| 214 |
+
"normalized": true,
|
| 215 |
+
"rstrip": false,
|
| 216 |
+
"single_word": false,
|
| 217 |
+
"special": false
|
| 218 |
+
},
|
| 219 |
+
"50279": {
|
| 220 |
+
"content": "<|endoftext|>",
|
| 221 |
+
"lstrip": false,
|
| 222 |
+
"normalized": false,
|
| 223 |
+
"rstrip": false,
|
| 224 |
+
"single_word": false,
|
| 225 |
+
"special": true
|
| 226 |
+
},
|
| 227 |
+
"50280": {
|
| 228 |
+
"content": "[UNK]",
|
| 229 |
+
"lstrip": false,
|
| 230 |
+
"normalized": false,
|
| 231 |
+
"rstrip": false,
|
| 232 |
+
"single_word": false,
|
| 233 |
+
"special": true
|
| 234 |
+
},
|
| 235 |
+
"50281": {
|
| 236 |
+
"content": "[CLS]",
|
| 237 |
+
"lstrip": false,
|
| 238 |
+
"normalized": false,
|
| 239 |
+
"rstrip": false,
|
| 240 |
+
"single_word": false,
|
| 241 |
+
"special": true
|
| 242 |
+
},
|
| 243 |
+
"50282": {
|
| 244 |
+
"content": "[SEP]",
|
| 245 |
+
"lstrip": false,
|
| 246 |
+
"normalized": false,
|
| 247 |
+
"rstrip": false,
|
| 248 |
+
"single_word": false,
|
| 249 |
+
"special": true
|
| 250 |
+
},
|
| 251 |
+
"50283": {
|
| 252 |
+
"content": "[PAD]",
|
| 253 |
+
"lstrip": false,
|
| 254 |
+
"normalized": false,
|
| 255 |
+
"rstrip": false,
|
| 256 |
+
"single_word": false,
|
| 257 |
+
"special": true
|
| 258 |
+
},
|
| 259 |
+
"50284": {
|
| 260 |
+
"content": "[MASK]",
|
| 261 |
+
"lstrip": true,
|
| 262 |
+
"normalized": false,
|
| 263 |
+
"rstrip": false,
|
| 264 |
+
"single_word": false,
|
| 265 |
+
"special": true
|
| 266 |
+
},
|
| 267 |
+
"50285": {
|
| 268 |
+
"content": "[unused0]",
|
| 269 |
+
"lstrip": false,
|
| 270 |
+
"normalized": true,
|
| 271 |
+
"rstrip": false,
|
| 272 |
+
"single_word": false,
|
| 273 |
+
"special": false
|
| 274 |
+
},
|
| 275 |
+
"50286": {
|
| 276 |
+
"content": "[unused1]",
|
| 277 |
+
"lstrip": false,
|
| 278 |
+
"normalized": true,
|
| 279 |
+
"rstrip": false,
|
| 280 |
+
"single_word": false,
|
| 281 |
+
"special": false
|
| 282 |
+
},
|
| 283 |
+
"50287": {
|
| 284 |
+
"content": "[unused2]",
|
| 285 |
+
"lstrip": false,
|
| 286 |
+
"normalized": true,
|
| 287 |
+
"rstrip": false,
|
| 288 |
+
"single_word": false,
|
| 289 |
+
"special": false
|
| 290 |
+
},
|
| 291 |
+
"50288": {
|
| 292 |
+
"content": "[unused3]",
|
| 293 |
+
"lstrip": false,
|
| 294 |
+
"normalized": true,
|
| 295 |
+
"rstrip": false,
|
| 296 |
+
"single_word": false,
|
| 297 |
+
"special": false
|
| 298 |
+
},
|
| 299 |
+
"50289": {
|
| 300 |
+
"content": "[unused4]",
|
| 301 |
+
"lstrip": false,
|
| 302 |
+
"normalized": true,
|
| 303 |
+
"rstrip": false,
|
| 304 |
+
"single_word": false,
|
| 305 |
+
"special": false
|
| 306 |
+
},
|
| 307 |
+
"50290": {
|
| 308 |
+
"content": "[unused5]",
|
| 309 |
+
"lstrip": false,
|
| 310 |
+
"normalized": true,
|
| 311 |
+
"rstrip": false,
|
| 312 |
+
"single_word": false,
|
| 313 |
+
"special": false
|
| 314 |
+
},
|
| 315 |
+
"50291": {
|
| 316 |
+
"content": "[unused6]",
|
| 317 |
+
"lstrip": false,
|
| 318 |
+
"normalized": true,
|
| 319 |
+
"rstrip": false,
|
| 320 |
+
"single_word": false,
|
| 321 |
+
"special": false
|
| 322 |
+
},
|
| 323 |
+
"50292": {
|
| 324 |
+
"content": "[unused7]",
|
| 325 |
+
"lstrip": false,
|
| 326 |
+
"normalized": true,
|
| 327 |
+
"rstrip": false,
|
| 328 |
+
"single_word": false,
|
| 329 |
+
"special": false
|
| 330 |
+
},
|
| 331 |
+
"50293": {
|
| 332 |
+
"content": "[unused8]",
|
| 333 |
+
"lstrip": false,
|
| 334 |
+
"normalized": true,
|
| 335 |
+
"rstrip": false,
|
| 336 |
+
"single_word": false,
|
| 337 |
+
"special": false
|
| 338 |
+
},
|
| 339 |
+
"50294": {
|
| 340 |
+
"content": "[unused9]",
|
| 341 |
+
"lstrip": false,
|
| 342 |
+
"normalized": true,
|
| 343 |
+
"rstrip": false,
|
| 344 |
+
"single_word": false,
|
| 345 |
+
"special": false
|
| 346 |
+
},
|
| 347 |
+
"50295": {
|
| 348 |
+
"content": "[unused10]",
|
| 349 |
+
"lstrip": false,
|
| 350 |
+
"normalized": true,
|
| 351 |
+
"rstrip": false,
|
| 352 |
+
"single_word": false,
|
| 353 |
+
"special": false
|
| 354 |
+
},
|
| 355 |
+
"50296": {
|
| 356 |
+
"content": "[unused11]",
|
| 357 |
+
"lstrip": false,
|
| 358 |
+
"normalized": true,
|
| 359 |
+
"rstrip": false,
|
| 360 |
+
"single_word": false,
|
| 361 |
+
"special": false
|
| 362 |
+
},
|
| 363 |
+
"50297": {
|
| 364 |
+
"content": "[unused12]",
|
| 365 |
+
"lstrip": false,
|
| 366 |
+
"normalized": true,
|
| 367 |
+
"rstrip": false,
|
| 368 |
+
"single_word": false,
|
| 369 |
+
"special": false
|
| 370 |
+
},
|
| 371 |
+
"50298": {
|
| 372 |
+
"content": "[unused13]",
|
| 373 |
+
"lstrip": false,
|
| 374 |
+
"normalized": true,
|
| 375 |
+
"rstrip": false,
|
| 376 |
+
"single_word": false,
|
| 377 |
+
"special": false
|
| 378 |
+
},
|
| 379 |
+
"50299": {
|
| 380 |
+
"content": "[unused14]",
|
| 381 |
+
"lstrip": false,
|
| 382 |
+
"normalized": true,
|
| 383 |
+
"rstrip": false,
|
| 384 |
+
"single_word": false,
|
| 385 |
+
"special": false
|
| 386 |
+
},
|
| 387 |
+
"50300": {
|
| 388 |
+
"content": "[unused15]",
|
| 389 |
+
"lstrip": false,
|
| 390 |
+
"normalized": true,
|
| 391 |
+
"rstrip": false,
|
| 392 |
+
"single_word": false,
|
| 393 |
+
"special": false
|
| 394 |
+
},
|
| 395 |
+
"50301": {
|
| 396 |
+
"content": "[unused16]",
|
| 397 |
+
"lstrip": false,
|
| 398 |
+
"normalized": true,
|
| 399 |
+
"rstrip": false,
|
| 400 |
+
"single_word": false,
|
| 401 |
+
"special": false
|
| 402 |
+
},
|
| 403 |
+
"50302": {
|
| 404 |
+
"content": "[unused17]",
|
| 405 |
+
"lstrip": false,
|
| 406 |
+
"normalized": true,
|
| 407 |
+
"rstrip": false,
|
| 408 |
+
"single_word": false,
|
| 409 |
+
"special": false
|
| 410 |
+
},
|
| 411 |
+
"50303": {
|
| 412 |
+
"content": "[unused18]",
|
| 413 |
+
"lstrip": false,
|
| 414 |
+
"normalized": true,
|
| 415 |
+
"rstrip": false,
|
| 416 |
+
"single_word": false,
|
| 417 |
+
"special": false
|
| 418 |
+
},
|
| 419 |
+
"50304": {
|
| 420 |
+
"content": "[unused19]",
|
| 421 |
+
"lstrip": false,
|
| 422 |
+
"normalized": true,
|
| 423 |
+
"rstrip": false,
|
| 424 |
+
"single_word": false,
|
| 425 |
+
"special": false
|
| 426 |
+
},
|
| 427 |
+
"50305": {
|
| 428 |
+
"content": "[unused20]",
|
| 429 |
+
"lstrip": false,
|
| 430 |
+
"normalized": true,
|
| 431 |
+
"rstrip": false,
|
| 432 |
+
"single_word": false,
|
| 433 |
+
"special": false
|
| 434 |
+
},
|
| 435 |
+
"50306": {
|
| 436 |
+
"content": "[unused21]",
|
| 437 |
+
"lstrip": false,
|
| 438 |
+
"normalized": true,
|
| 439 |
+
"rstrip": false,
|
| 440 |
+
"single_word": false,
|
| 441 |
+
"special": false
|
| 442 |
+
},
|
| 443 |
+
"50307": {
|
| 444 |
+
"content": "[unused22]",
|
| 445 |
+
"lstrip": false,
|
| 446 |
+
"normalized": true,
|
| 447 |
+
"rstrip": false,
|
| 448 |
+
"single_word": false,
|
| 449 |
+
"special": false
|
| 450 |
+
},
|
| 451 |
+
"50308": {
|
| 452 |
+
"content": "[unused23]",
|
| 453 |
+
"lstrip": false,
|
| 454 |
+
"normalized": true,
|
| 455 |
+
"rstrip": false,
|
| 456 |
+
"single_word": false,
|
| 457 |
+
"special": false
|
| 458 |
+
},
|
| 459 |
+
"50309": {
|
| 460 |
+
"content": "[unused24]",
|
| 461 |
+
"lstrip": false,
|
| 462 |
+
"normalized": true,
|
| 463 |
+
"rstrip": false,
|
| 464 |
+
"single_word": false,
|
| 465 |
+
"special": false
|
| 466 |
+
},
|
| 467 |
+
"50310": {
|
| 468 |
+
"content": "[unused25]",
|
| 469 |
+
"lstrip": false,
|
| 470 |
+
"normalized": true,
|
| 471 |
+
"rstrip": false,
|
| 472 |
+
"single_word": false,
|
| 473 |
+
"special": false
|
| 474 |
+
},
|
| 475 |
+
"50311": {
|
| 476 |
+
"content": "[unused26]",
|
| 477 |
+
"lstrip": false,
|
| 478 |
+
"normalized": true,
|
| 479 |
+
"rstrip": false,
|
| 480 |
+
"single_word": false,
|
| 481 |
+
"special": false
|
| 482 |
+
},
|
| 483 |
+
"50312": {
|
| 484 |
+
"content": "[unused27]",
|
| 485 |
+
"lstrip": false,
|
| 486 |
+
"normalized": true,
|
| 487 |
+
"rstrip": false,
|
| 488 |
+
"single_word": false,
|
| 489 |
+
"special": false
|
| 490 |
+
},
|
| 491 |
+
"50313": {
|
| 492 |
+
"content": "[unused28]",
|
| 493 |
+
"lstrip": false,
|
| 494 |
+
"normalized": true,
|
| 495 |
+
"rstrip": false,
|
| 496 |
+
"single_word": false,
|
| 497 |
+
"special": false
|
| 498 |
+
},
|
| 499 |
+
"50314": {
|
| 500 |
+
"content": "[unused29]",
|
| 501 |
+
"lstrip": false,
|
| 502 |
+
"normalized": true,
|
| 503 |
+
"rstrip": false,
|
| 504 |
+
"single_word": false,
|
| 505 |
+
"special": false
|
| 506 |
+
},
|
| 507 |
+
"50315": {
|
| 508 |
+
"content": "[unused30]",
|
| 509 |
+
"lstrip": false,
|
| 510 |
+
"normalized": true,
|
| 511 |
+
"rstrip": false,
|
| 512 |
+
"single_word": false,
|
| 513 |
+
"special": false
|
| 514 |
+
},
|
| 515 |
+
"50316": {
|
| 516 |
+
"content": "[unused31]",
|
| 517 |
+
"lstrip": false,
|
| 518 |
+
"normalized": true,
|
| 519 |
+
"rstrip": false,
|
| 520 |
+
"single_word": false,
|
| 521 |
+
"special": false
|
| 522 |
+
},
|
| 523 |
+
"50317": {
|
| 524 |
+
"content": "[unused32]",
|
| 525 |
+
"lstrip": false,
|
| 526 |
+
"normalized": true,
|
| 527 |
+
"rstrip": false,
|
| 528 |
+
"single_word": false,
|
| 529 |
+
"special": false
|
| 530 |
+
},
|
| 531 |
+
"50318": {
|
| 532 |
+
"content": "[unused33]",
|
| 533 |
+
"lstrip": false,
|
| 534 |
+
"normalized": true,
|
| 535 |
+
"rstrip": false,
|
| 536 |
+
"single_word": false,
|
| 537 |
+
"special": false
|
| 538 |
+
},
|
| 539 |
+
"50319": {
|
| 540 |
+
"content": "[unused34]",
|
| 541 |
+
"lstrip": false,
|
| 542 |
+
"normalized": true,
|
| 543 |
+
"rstrip": false,
|
| 544 |
+
"single_word": false,
|
| 545 |
+
"special": false
|
| 546 |
+
},
|
| 547 |
+
"50320": {
|
| 548 |
+
"content": "[unused35]",
|
| 549 |
+
"lstrip": false,
|
| 550 |
+
"normalized": true,
|
| 551 |
+
"rstrip": false,
|
| 552 |
+
"single_word": false,
|
| 553 |
+
"special": false
|
| 554 |
+
},
|
| 555 |
+
"50321": {
|
| 556 |
+
"content": "[unused36]",
|
| 557 |
+
"lstrip": false,
|
| 558 |
+
"normalized": true,
|
| 559 |
+
"rstrip": false,
|
| 560 |
+
"single_word": false,
|
| 561 |
+
"special": false
|
| 562 |
+
},
|
| 563 |
+
"50322": {
|
| 564 |
+
"content": "[unused37]",
|
| 565 |
+
"lstrip": false,
|
| 566 |
+
"normalized": true,
|
| 567 |
+
"rstrip": false,
|
| 568 |
+
"single_word": false,
|
| 569 |
+
"special": false
|
| 570 |
+
},
|
| 571 |
+
"50323": {
|
| 572 |
+
"content": "[unused38]",
|
| 573 |
+
"lstrip": false,
|
| 574 |
+
"normalized": true,
|
| 575 |
+
"rstrip": false,
|
| 576 |
+
"single_word": false,
|
| 577 |
+
"special": false
|
| 578 |
+
},
|
| 579 |
+
"50324": {
|
| 580 |
+
"content": "[unused39]",
|
| 581 |
+
"lstrip": false,
|
| 582 |
+
"normalized": true,
|
| 583 |
+
"rstrip": false,
|
| 584 |
+
"single_word": false,
|
| 585 |
+
"special": false
|
| 586 |
+
},
|
| 587 |
+
"50325": {
|
| 588 |
+
"content": "[unused40]",
|
| 589 |
+
"lstrip": false,
|
| 590 |
+
"normalized": true,
|
| 591 |
+
"rstrip": false,
|
| 592 |
+
"single_word": false,
|
| 593 |
+
"special": false
|
| 594 |
+
},
|
| 595 |
+
"50326": {
|
| 596 |
+
"content": "[unused41]",
|
| 597 |
+
"lstrip": false,
|
| 598 |
+
"normalized": true,
|
| 599 |
+
"rstrip": false,
|
| 600 |
+
"single_word": false,
|
| 601 |
+
"special": false
|
| 602 |
+
},
|
| 603 |
+
"50327": {
|
| 604 |
+
"content": "[unused42]",
|
| 605 |
+
"lstrip": false,
|
| 606 |
+
"normalized": true,
|
| 607 |
+
"rstrip": false,
|
| 608 |
+
"single_word": false,
|
| 609 |
+
"special": false
|
| 610 |
+
},
|
| 611 |
+
"50328": {
|
| 612 |
+
"content": "[unused43]",
|
| 613 |
+
"lstrip": false,
|
| 614 |
+
"normalized": true,
|
| 615 |
+
"rstrip": false,
|
| 616 |
+
"single_word": false,
|
| 617 |
+
"special": false
|
| 618 |
+
},
|
| 619 |
+
"50329": {
|
| 620 |
+
"content": "[unused44]",
|
| 621 |
+
"lstrip": false,
|
| 622 |
+
"normalized": true,
|
| 623 |
+
"rstrip": false,
|
| 624 |
+
"single_word": false,
|
| 625 |
+
"special": false
|
| 626 |
+
},
|
| 627 |
+
"50330": {
|
| 628 |
+
"content": "[unused45]",
|
| 629 |
+
"lstrip": false,
|
| 630 |
+
"normalized": true,
|
| 631 |
+
"rstrip": false,
|
| 632 |
+
"single_word": false,
|
| 633 |
+
"special": false
|
| 634 |
+
},
|
| 635 |
+
"50331": {
|
| 636 |
+
"content": "[unused46]",
|
| 637 |
+
"lstrip": false,
|
| 638 |
+
"normalized": true,
|
| 639 |
+
"rstrip": false,
|
| 640 |
+
"single_word": false,
|
| 641 |
+
"special": false
|
| 642 |
+
},
|
| 643 |
+
"50332": {
|
| 644 |
+
"content": "[unused47]",
|
| 645 |
+
"lstrip": false,
|
| 646 |
+
"normalized": true,
|
| 647 |
+
"rstrip": false,
|
| 648 |
+
"single_word": false,
|
| 649 |
+
"special": false
|
| 650 |
+
},
|
| 651 |
+
"50333": {
|
| 652 |
+
"content": "[unused48]",
|
| 653 |
+
"lstrip": false,
|
| 654 |
+
"normalized": true,
|
| 655 |
+
"rstrip": false,
|
| 656 |
+
"single_word": false,
|
| 657 |
+
"special": false
|
| 658 |
+
},
|
| 659 |
+
"50334": {
|
| 660 |
+
"content": "[unused49]",
|
| 661 |
+
"lstrip": false,
|
| 662 |
+
"normalized": true,
|
| 663 |
+
"rstrip": false,
|
| 664 |
+
"single_word": false,
|
| 665 |
+
"special": false
|
| 666 |
+
},
|
| 667 |
+
"50335": {
|
| 668 |
+
"content": "[unused50]",
|
| 669 |
+
"lstrip": false,
|
| 670 |
+
"normalized": true,
|
| 671 |
+
"rstrip": false,
|
| 672 |
+
"single_word": false,
|
| 673 |
+
"special": false
|
| 674 |
+
},
|
| 675 |
+
"50336": {
|
| 676 |
+
"content": "[unused51]",
|
| 677 |
+
"lstrip": false,
|
| 678 |
+
"normalized": true,
|
| 679 |
+
"rstrip": false,
|
| 680 |
+
"single_word": false,
|
| 681 |
+
"special": false
|
| 682 |
+
},
|
| 683 |
+
"50337": {
|
| 684 |
+
"content": "[unused52]",
|
| 685 |
+
"lstrip": false,
|
| 686 |
+
"normalized": true,
|
| 687 |
+
"rstrip": false,
|
| 688 |
+
"single_word": false,
|
| 689 |
+
"special": false
|
| 690 |
+
},
|
| 691 |
+
"50338": {
|
| 692 |
+
"content": "[unused53]",
|
| 693 |
+
"lstrip": false,
|
| 694 |
+
"normalized": true,
|
| 695 |
+
"rstrip": false,
|
| 696 |
+
"single_word": false,
|
| 697 |
+
"special": false
|
| 698 |
+
},
|
| 699 |
+
"50339": {
|
| 700 |
+
"content": "[unused54]",
|
| 701 |
+
"lstrip": false,
|
| 702 |
+
"normalized": true,
|
| 703 |
+
"rstrip": false,
|
| 704 |
+
"single_word": false,
|
| 705 |
+
"special": false
|
| 706 |
+
},
|
| 707 |
+
"50340": {
|
| 708 |
+
"content": "[unused55]",
|
| 709 |
+
"lstrip": false,
|
| 710 |
+
"normalized": true,
|
| 711 |
+
"rstrip": false,
|
| 712 |
+
"single_word": false,
|
| 713 |
+
"special": false
|
| 714 |
+
},
|
| 715 |
+
"50341": {
|
| 716 |
+
"content": "[unused56]",
|
| 717 |
+
"lstrip": false,
|
| 718 |
+
"normalized": true,
|
| 719 |
+
"rstrip": false,
|
| 720 |
+
"single_word": false,
|
| 721 |
+
"special": false
|
| 722 |
+
},
|
| 723 |
+
"50342": {
|
| 724 |
+
"content": "[unused57]",
|
| 725 |
+
"lstrip": false,
|
| 726 |
+
"normalized": true,
|
| 727 |
+
"rstrip": false,
|
| 728 |
+
"single_word": false,
|
| 729 |
+
"special": false
|
| 730 |
+
},
|
| 731 |
+
"50343": {
|
| 732 |
+
"content": "[unused58]",
|
| 733 |
+
"lstrip": false,
|
| 734 |
+
"normalized": true,
|
| 735 |
+
"rstrip": false,
|
| 736 |
+
"single_word": false,
|
| 737 |
+
"special": false
|
| 738 |
+
},
|
| 739 |
+
"50344": {
|
| 740 |
+
"content": "[unused59]",
|
| 741 |
+
"lstrip": false,
|
| 742 |
+
"normalized": true,
|
| 743 |
+
"rstrip": false,
|
| 744 |
+
"single_word": false,
|
| 745 |
+
"special": false
|
| 746 |
+
},
|
| 747 |
+
"50345": {
|
| 748 |
+
"content": "[unused60]",
|
| 749 |
+
"lstrip": false,
|
| 750 |
+
"normalized": true,
|
| 751 |
+
"rstrip": false,
|
| 752 |
+
"single_word": false,
|
| 753 |
+
"special": false
|
| 754 |
+
},
|
| 755 |
+
"50346": {
|
| 756 |
+
"content": "[unused61]",
|
| 757 |
+
"lstrip": false,
|
| 758 |
+
"normalized": true,
|
| 759 |
+
"rstrip": false,
|
| 760 |
+
"single_word": false,
|
| 761 |
+
"special": false
|
| 762 |
+
},
|
| 763 |
+
"50347": {
|
| 764 |
+
"content": "[unused62]",
|
| 765 |
+
"lstrip": false,
|
| 766 |
+
"normalized": true,
|
| 767 |
+
"rstrip": false,
|
| 768 |
+
"single_word": false,
|
| 769 |
+
"special": false
|
| 770 |
+
},
|
| 771 |
+
"50348": {
|
| 772 |
+
"content": "[unused63]",
|
| 773 |
+
"lstrip": false,
|
| 774 |
+
"normalized": true,
|
| 775 |
+
"rstrip": false,
|
| 776 |
+
"single_word": false,
|
| 777 |
+
"special": false
|
| 778 |
+
},
|
| 779 |
+
"50349": {
|
| 780 |
+
"content": "[unused64]",
|
| 781 |
+
"lstrip": false,
|
| 782 |
+
"normalized": true,
|
| 783 |
+
"rstrip": false,
|
| 784 |
+
"single_word": false,
|
| 785 |
+
"special": false
|
| 786 |
+
},
|
| 787 |
+
"50350": {
|
| 788 |
+
"content": "[unused65]",
|
| 789 |
+
"lstrip": false,
|
| 790 |
+
"normalized": true,
|
| 791 |
+
"rstrip": false,
|
| 792 |
+
"single_word": false,
|
| 793 |
+
"special": false
|
| 794 |
+
},
|
| 795 |
+
"50351": {
|
| 796 |
+
"content": "[unused66]",
|
| 797 |
+
"lstrip": false,
|
| 798 |
+
"normalized": true,
|
| 799 |
+
"rstrip": false,
|
| 800 |
+
"single_word": false,
|
| 801 |
+
"special": false
|
| 802 |
+
},
|
| 803 |
+
"50352": {
|
| 804 |
+
"content": "[unused67]",
|
| 805 |
+
"lstrip": false,
|
| 806 |
+
"normalized": true,
|
| 807 |
+
"rstrip": false,
|
| 808 |
+
"single_word": false,
|
| 809 |
+
"special": false
|
| 810 |
+
},
|
| 811 |
+
"50353": {
|
| 812 |
+
"content": "[unused68]",
|
| 813 |
+
"lstrip": false,
|
| 814 |
+
"normalized": true,
|
| 815 |
+
"rstrip": false,
|
| 816 |
+
"single_word": false,
|
| 817 |
+
"special": false
|
| 818 |
+
},
|
| 819 |
+
"50354": {
|
| 820 |
+
"content": "[unused69]",
|
| 821 |
+
"lstrip": false,
|
| 822 |
+
"normalized": true,
|
| 823 |
+
"rstrip": false,
|
| 824 |
+
"single_word": false,
|
| 825 |
+
"special": false
|
| 826 |
+
},
|
| 827 |
+
"50355": {
|
| 828 |
+
"content": "[unused70]",
|
| 829 |
+
"lstrip": false,
|
| 830 |
+
"normalized": true,
|
| 831 |
+
"rstrip": false,
|
| 832 |
+
"single_word": false,
|
| 833 |
+
"special": false
|
| 834 |
+
},
|
| 835 |
+
"50356": {
|
| 836 |
+
"content": "[unused71]",
|
| 837 |
+
"lstrip": false,
|
| 838 |
+
"normalized": true,
|
| 839 |
+
"rstrip": false,
|
| 840 |
+
"single_word": false,
|
| 841 |
+
"special": false
|
| 842 |
+
},
|
| 843 |
+
"50357": {
|
| 844 |
+
"content": "[unused72]",
|
| 845 |
+
"lstrip": false,
|
| 846 |
+
"normalized": true,
|
| 847 |
+
"rstrip": false,
|
| 848 |
+
"single_word": false,
|
| 849 |
+
"special": false
|
| 850 |
+
},
|
| 851 |
+
"50358": {
|
| 852 |
+
"content": "[unused73]",
|
| 853 |
+
"lstrip": false,
|
| 854 |
+
"normalized": true,
|
| 855 |
+
"rstrip": false,
|
| 856 |
+
"single_word": false,
|
| 857 |
+
"special": false
|
| 858 |
+
},
|
| 859 |
+
"50359": {
|
| 860 |
+
"content": "[unused74]",
|
| 861 |
+
"lstrip": false,
|
| 862 |
+
"normalized": true,
|
| 863 |
+
"rstrip": false,
|
| 864 |
+
"single_word": false,
|
| 865 |
+
"special": false
|
| 866 |
+
},
|
| 867 |
+
"50360": {
|
| 868 |
+
"content": "[unused75]",
|
| 869 |
+
"lstrip": false,
|
| 870 |
+
"normalized": true,
|
| 871 |
+
"rstrip": false,
|
| 872 |
+
"single_word": false,
|
| 873 |
+
"special": false
|
| 874 |
+
},
|
| 875 |
+
"50361": {
|
| 876 |
+
"content": "[unused76]",
|
| 877 |
+
"lstrip": false,
|
| 878 |
+
"normalized": true,
|
| 879 |
+
"rstrip": false,
|
| 880 |
+
"single_word": false,
|
| 881 |
+
"special": false
|
| 882 |
+
},
|
| 883 |
+
"50362": {
|
| 884 |
+
"content": "[unused77]",
|
| 885 |
+
"lstrip": false,
|
| 886 |
+
"normalized": true,
|
| 887 |
+
"rstrip": false,
|
| 888 |
+
"single_word": false,
|
| 889 |
+
"special": false
|
| 890 |
+
},
|
| 891 |
+
"50363": {
|
| 892 |
+
"content": "[unused78]",
|
| 893 |
+
"lstrip": false,
|
| 894 |
+
"normalized": true,
|
| 895 |
+
"rstrip": false,
|
| 896 |
+
"single_word": false,
|
| 897 |
+
"special": false
|
| 898 |
+
},
|
| 899 |
+
"50364": {
|
| 900 |
+
"content": "[unused79]",
|
| 901 |
+
"lstrip": false,
|
| 902 |
+
"normalized": true,
|
| 903 |
+
"rstrip": false,
|
| 904 |
+
"single_word": false,
|
| 905 |
+
"special": false
|
| 906 |
+
},
|
| 907 |
+
"50365": {
|
| 908 |
+
"content": "[unused80]",
|
| 909 |
+
"lstrip": false,
|
| 910 |
+
"normalized": true,
|
| 911 |
+
"rstrip": false,
|
| 912 |
+
"single_word": false,
|
| 913 |
+
"special": false
|
| 914 |
+
},
|
| 915 |
+
"50366": {
|
| 916 |
+
"content": "[unused81]",
|
| 917 |
+
"lstrip": false,
|
| 918 |
+
"normalized": true,
|
| 919 |
+
"rstrip": false,
|
| 920 |
+
"single_word": false,
|
| 921 |
+
"special": false
|
| 922 |
+
},
|
| 923 |
+
"50367": {
|
| 924 |
+
"content": "[unused82]",
|
| 925 |
+
"lstrip": false,
|
| 926 |
+
"normalized": true,
|
| 927 |
+
"rstrip": false,
|
| 928 |
+
"single_word": false,
|
| 929 |
+
"special": false
|
| 930 |
+
}
|
| 931 |
+
},
|
| 932 |
+
"clean_up_tokenization_spaces": true,
|
| 933 |
+
"cls_token": "[CLS]",
|
| 934 |
+
"extra_special_tokens": {},
|
| 935 |
+
"mask_token": "[MASK]",
|
| 936 |
+
"model_input_names": [
|
| 937 |
+
"input_ids",
|
| 938 |
+
"attention_mask"
|
| 939 |
+
],
|
| 940 |
+
"model_max_length": 8192,
|
| 941 |
+
"pad_token": "[PAD]",
|
| 942 |
+
"sep_token": "[SEP]",
|
| 943 |
+
"tokenizer_class": "PreTrainedTokenizerFast",
|
| 944 |
+
"unk_token": "[UNK]"
|
| 945 |
+
}
|