Upload folder using huggingface_hub
Browse files- 1_Pooling/config.json +10 -0
- README.md +378 -3
- config.json +24 -0
- config_sentence_transformers.json +10 -0
- config_setfit.json +7 -0
- model.safetensors +3 -0
- model_head.pkl +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +72 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
CHANGED
@@ -1,3 +1,378 @@
|
|
1 |
-
---
|
2 |
-
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: setfit
|
3 |
+
metrics:
|
4 |
+
- accuracy
|
5 |
+
pipeline_tag: text-classification
|
6 |
+
tags:
|
7 |
+
- setfit
|
8 |
+
- sentence-transformers
|
9 |
+
- text-classification
|
10 |
+
- generated_from_setfit_trainer
|
11 |
+
widget:
|
12 |
+
- text: "Consistent CFE_PSP_Main implementation\nRTEMS PSP hardcodes \"/cf/cfe_es_startup.scr\"\
|
13 |
+
, but mcp750 and pc-linux both use the CFE_PLATFORM_ES_NONVOL_STARTUP_FILE.\r\n\
|
14 |
+
\r\nInconsistent implementations.\r\n\r\nFrom #102 (solved here):\r\ncfe_psp_start.c\
|
15 |
+
\ for mcp750 VxWorks has StartupFilePath as an input parameter to CFE_PSP_Main,\
|
16 |
+
\ but calls CFE_ES_Main with CFE_PLATFORM_ES_NONVOL_STARTUP_FILE.\r\n\r\nConfusing\
|
17 |
+
\ implementation... looks like at least the pc-linux PSP only uses CFE_PLATFORM_ES_NONVOL_STARTUP_FILE\
|
18 |
+
\ (but a different prototype)."
|
19 |
+
- text: "Fix input options handling dashes\n**Describe the bug**\r\nThe \"help\" option\
|
20 |
+
\ is triggered by `-help` which only uses one dash. Full-word options should use\
|
21 |
+
\ double dashes.\r\n\r\n**To Reproduce**\r\nSee code\r\n\r\n```\r\nif ((argc !=\
|
22 |
+
\ 2) || (strncmp(argv[1], \"-help\", 100) == 0))\r\n {\r\n printf(\"\
|
23 |
+
\\ncFE TS CRC calculator: \\%s\\n\", CFE_TS_CRC_VERSION_STRING);\r\n printf(\"\
|
24 |
+
\\nUsage: cfe_ts_crc [filename]\\n\");\r\n exit(0);\r\n }\r\n```\r\n\
|
25 |
+
\r\n**Expected behavior**\r\nUse `--help` instead\r\n\r\n**Code snips**\r\nIf\
|
26 |
+
\ applicable, add references to the software.\r\n\r\n**System observed on:**\r\
|
27 |
+
\nSource code\r\n\r\n**Additional context**\r\nNone\r\n\r\n**Reporter Info**\r\
|
28 |
+
\nGerardo E. Cruz-Ortiz, NASA-GSFC"
|
29 |
+
- text: "OS_TaskExit() on VxWorks causes task table owner to be the deleted task\n\
|
30 |
+
**Describe the bug**\r\nOS_TaskExit() calls OS_ObjectIdFinalizeDelete(). This\
|
31 |
+
\ function sets the task's record->active_id to 0, which is also being used as\
|
32 |
+
\ the task ID on VxWorks. ObjectIdFinalizeDelete() subsequently calls OS_Unlock_Global,\
|
33 |
+
\ which errors out and does not clear the owner, as the task ID is now zeroed\
|
34 |
+
\ out and does not match the owner of the table. This does not occur on Linux\r\
|
35 |
+
\n\r\n**To Reproduce**\r\nSteps to reproduce the behavior:\r\nOn VxWorks, call\
|
36 |
+
\ CFE_ES_ExitChildTask with OSAL_CONFIG_DEBUG_PRINTF enabled\r\n\r\n**Expected\
|
37 |
+
\ behavior**\r\nError message should not be printed out\r\n\r\n**Code snips**\r\
|
38 |
+
\nhttps://github.com/nasa/osal/blob/1a826576f8dd9eb37f47da0e633b1d4712b8ac61/src/os/shared/src/osapi-idmap.c#L745-L777\r\
|
39 |
+
\nhttps://github.com/nasa/osal/blob/1a826576f8dd9eb37f47da0e633b1d4712b8ac61/src/os/shared/src/osapi-idmap.c#L625-L676\r\
|
40 |
+
\nhttps://github.com/nasa/osal/blob/1a826576f8dd9eb37f47da0e633b1d4712b8ac61/src/os/vxworks/src/os-impl-tasks.c#L385-L413\r\
|
41 |
+
\nhttps://github.com/nasa/osal/blob/1a826576f8dd9eb37f47da0e633b1d4712b8ac61/src/os/posix/src/os-impl-tasks.c#L736-L751\r\
|
42 |
+
\n\r\n**System observed on:**\r\n - SP0\r\n - OS: VxWorks 6.9\r\n - Versions:\
|
43 |
+
\ CFE 6.8, OSAL 5.1.0-rc1+dev16, \r\n\r\n**Additional context**\r\nSee attached\
|
44 |
+
\ screenshots for stack traces\r\n![image](https://user-images.githubusercontent.com/63735778/98269251-82b02900-1f5b-11eb-83f9-0af820169aa8.png)\r\
|
45 |
+
\n![image](https://user-images.githubusercontent.com/63735778/98269098-5b595c00-1f5b-11eb-836c-4abd911c123e.png)\r\
|
46 |
+
\n**Reporter Info**\r\nJohn N. Pham, Northrop Grumman\r\n\r\n\r\n"
|
47 |
+
- text: "Outdated License(?)\nMany files in the PSP (and one in the CFS) contain a\
|
48 |
+
\ file license header that seems to be outdated? It doesn't reference the NOSA,\
|
49 |
+
\ and seems to include restrictions that are in conflict with the NOSA (see the\
|
50 |
+
\ 2nd paragraph). Note, Working with the SourceForge cFE release.\r\n\r\nAn example:\r\
|
51 |
+
\n{{{\r\n** Copyright (c) 2004-2006, United States government as represented\
|
52 |
+
\ by the\r\n** administrator of the National Aeronautics Space Administration.\r\
|
53 |
+
\n** All rights reserved. This software(cFE) was created at NASA Goddard\r\
|
54 |
+
\n** Space Flight Center pursuant to government contracts.\r\n**\r\n** \
|
55 |
+
\ This software may be used only pursuant to a United States government\r\n\
|
56 |
+
** sponsored project and the United States government may not be charged\r\
|
57 |
+
\n** for use thereof.\r\n}}}\r\n\r\nA quick grep showed these files:\r\n\
|
58 |
+
{{{\r\nfind . -type f -exec grep -li \"This software may be used only\" {} \\\
|
59 |
+
;\r\n./CFS/hs/fsw/unit_test/cfe_psp_timer.c\r\n./cFE/psp/fsw/mcp750-vxworks6.4/inc/psp_version.h\r\
|
60 |
+
\n./cFE/psp/fsw/mcp750-vxworks6.4/inc/cfe_psp_config.h\r\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_support.c\r\
|
61 |
+
\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_start.c\r\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_ssr.c\r\
|
62 |
+
\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_voltab.c\r\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_exception.c\r\
|
63 |
+
\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_watchdog.c\r\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_timer.c\r\
|
64 |
+
\n./cFE/psp/fsw/mcp750-vxworks6.4/src/cfe_psp_memory.c\r\n./cFE/psp/fsw/inc/cfe_psp.h\r\
|
65 |
+
\n./cFE/psp/fsw/arm-linux/inc/psp_version.h\r\n./cFE/psp/fsw/arm-linux/inc/cfe_psp_config.h\r\
|
66 |
+
\n./cFE/psp/fsw/arm-linux/src/cfe_psp_support.c\r\n./cFE/psp/fsw/arm-linux/src/cfe_psp_start.c\r\
|
67 |
+
\n./cFE/psp/fsw/arm-linux/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/arm-linux/src/cfe_psp_voltab.c\r\
|
68 |
+
\n./cFE/psp/fsw/arm-linux/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/arm-linux/src/cfe_psp_watchdog.c\r\
|
69 |
+
\n./cFE/psp/fsw/arm-linux/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/arm-linux/src/cfe_psp_memory.c\r\
|
70 |
+
\n./cFE/psp/fsw/pc-cygwin/inc/psp_version.h\r\n./cFE/psp/fsw/pc-cygwin/inc/cfe_psp_config.h\r\
|
71 |
+
\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_support.c\r\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_start.c\r\
|
72 |
+
\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_voltab.c\r\
|
73 |
+
\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_watchdog.c\r\
|
74 |
+
\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/pc-cygwin/src/cfe_psp_memory.c\r\
|
75 |
+
\n./cFE/psp/fsw/mac-osx/inc/psp_version.h\r\n./cFE/psp/fsw/mac-osx/inc/cfe_psp_config.h\r\
|
76 |
+
\n./cFE/psp/fsw/mac-osx/src/cfe_psp_support.c\r\n./cFE/psp/fsw/mac-osx/src/cfe_psp_start.c\r\
|
77 |
+
\n./cFE/psp/fsw/mac-osx/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/mac-osx/src/cfe_psp_voltab.c\r\
|
78 |
+
\n./cFE/psp/fsw/mac-osx/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/mac-osx/src/cfe_psp_watchdog.c\r\
|
79 |
+
\n./cFE/psp/fsw/mac-osx/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/mac-osx/src/cfe_psp_memory.c\r\
|
80 |
+
\n./cFE/psp/fsw/pc-linux/inc/psp_version.h\r\n./cFE/psp/fsw/pc-linux/inc/cfe_psp_config.h\r\
|
81 |
+
\n./cFE/psp/fsw/pc-linux/src/cfe_psp_support.c\r\n./cFE/psp/fsw/pc-linux/src/cfe_psp_start.c\r\
|
82 |
+
\n./cFE/psp/fsw/pc-linux/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/pc-linux/src/cfe_psp_voltab.c\r\
|
83 |
+
\n./cFE/psp/fsw/pc-linux/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/pc-linux/src/cfe_psp_watchdog.c\r\
|
84 |
+
\n./cFE/psp/fsw/pc-linux/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/pc-linux/src/cfe_psp_memory.c\r\
|
85 |
+
\n./cFE/psp/fsw/grut699-vxworks6/inc/psp_version.h\r\n./cFE/psp/fsw/grut699-vxworks6/inc/cfe_psp_config.h\r\
|
86 |
+
\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_support.c\r\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_start.c\r\
|
87 |
+
\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_voltab.c\r\
|
88 |
+
\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_watchdog.c\r\
|
89 |
+
\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/grut699-vxworks6/src/cfe_psp_memory.c\r\
|
90 |
+
\n./cFE/psp/fsw/mcf5235-rtems/inc/psp_version.h\r\n./cFE/psp/fsw/mcf5235-rtems/inc/cfe_psp_config.h\r\
|
91 |
+
\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_support.c\r\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_start.c\r\
|
92 |
+
\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_ssr.c\r\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_voltab.c\r\
|
93 |
+
\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_exception.c\r\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_watchdog.c\r\
|
94 |
+
\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_timer.c\r\n./cFE/psp/fsw/mcf5235-rtems/src/cfe_psp_memory.c\r\
|
95 |
+
\n}}}\r\n"
|
96 |
+
- text: "Use a changelog to keep track of changes instead of having them in the Readme\
|
97 |
+
\ \n**Is your feature request related to a problem? Please describe.**\r\nThe\
|
98 |
+
\ version history in the Readme file clutters useful information\r\n\r\n**Describe\
|
99 |
+
\ the solution you'd like**\r\nMove the \"version history\" from `Readme.md` to\
|
100 |
+
\ `CHANGELOG.md` and start following this spec: https://keepachangelog.com/en/1.0.0/\r\
|
101 |
+
\n\r\n**Describe alternatives you've considered**\r\nMove changelog section in\
|
102 |
+
\ the readme to a section at the very bottom of the file\r\n\r\n**Additional context**\r\
|
103 |
+
\nNone\r\n\r\n**Requester Info**\r\nGerardo E. Cruz-Ortiz, NASA-GSFC\r\n"
|
104 |
+
inference: true
|
105 |
+
---
|
106 |
+
|
107 |
+
# SetFit
|
108 |
+
|
109 |
+
This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
|
110 |
+
|
111 |
+
The model has been trained using an efficient few-shot learning technique that involves:
|
112 |
+
|
113 |
+
1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
|
114 |
+
2. Training a classification head with features from the fine-tuned Sentence Transformer.
|
115 |
+
|
116 |
+
## Model Details
|
117 |
+
|
118 |
+
### Model Description
|
119 |
+
- **Model Type:** SetFit
|
120 |
+
- **Sentence Transformer:** [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2)
|
121 |
+
- **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
|
122 |
+
- **Maximum Sequence Length:** 384 tokens
|
123 |
+
- **Number of Classes:** 2 classes
|
124 |
+
<!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
|
125 |
+
<!-- - **Language:** Unknown -->
|
126 |
+
<!-- - **License:** Unknown -->
|
127 |
+
|
128 |
+
### Model Sources
|
129 |
+
|
130 |
+
- **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
|
131 |
+
- **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
|
132 |
+
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
133 |
+
|
134 |
+
### Model Labels
|
135 |
+
| Label | Examples |
|
136 |
+
|:--------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
137 |
+
| non-bug | <ul><li>"Define file subtype value behavior/expectations\n**Is your feature request related to a problem? Please describe.**\r\nNot clear if the CFE_FS_InitHeader SubType needs to be one of the FS enums or if it can be user defined by apps. Note there is no longer a shell file created by ES:\r\nhttps://github.com/nasa/cFE/blob/e80aae94e0f56b868657daba965c590766a4dc57/modules/core_api/fsw/inc/cfe_fs_extern_typedefs.h#L101-L108\r\n\r\n**Describe the solution you'd like**\r\nNeed to determine if FS should define all file subtypes, or treat it as an extendable field (or whatever). That will affect if the SHELL subtype gets removed or renamed (since there is still an app that would create it). Note right now apps don't even use `CFE_FS_InitHeader`, but they do currently set unique values.\r\n\r\n**Describe alternatives you've considered**\r\nNone\r\n\r\n**Additional context**\r\nCode review\r\n\r\n**Requester Info**\r\nJacob Hageman - NASA/GSFC\r\n"</li><li>'Disambiguate command vs message requirements \n**Is your feature request related to a problem? Please describe.**\r\n"Command" terminology has been used for both ground commands (that increment command counters) and inter-app commands (that typically do not increment command counters). So it\'s unclear in the requirement which sort of use case is intended.\r\n\r\n**Describe the solution you\'d like**\r\n"Command" is ground command with additional associated behavior (increments command counters), "Message" is typical sb message that does not increment command counter.\r\n\r\n**Describe alternatives you\'ve considered**\r\nNone\r\n\r\n**Additional context**\r\nDiscovered during requirements scrub, helps clarify what impacts command counter.\r\n\r\n**Requester Info**\r\nJacob Hageman - NASA/GSFC\r\n'</li><li>"Improve table handling\n**Is your feature request related to a problem? 
Please describe.**\r\nDoesn't actually allow table management within the task loop\r\n\r\n**Describe the solution you'd like**\r\nActually follow the table management pattern, allowing updates (should be a decent example)\r\n\r\n**Describe alternatives you've considered**\r\nN/A\r\n\r\n**Additional context**\r\nN/A\r\n\r\n**Requester Info**\r\nJacob Hageman - NASA/GSFC"</li></ul> |
|
138 |
+
| bug | <ul><li>'CFE_PLATFORM_ES_PERF_MAX_IDS not fully deprecated\n**Describe the bug**\r\nCFE_PLATFORM_ES_PERF_MAX_IDS was superseded by CFE_MISSION_ES_PERF_MAX_IDS as noted in this comment: https://github.com/nasa/cFE/search?q=CFE_PLATFORM_ES_PERF_MAX_IDS. However, sample cpu1_platform_cfg.h still contains the definition for CFE_PLATFORM_ES_PERF_MAX_IDS is still referenced in es_UT.c and comments in cfe_es_events.h and sample_perfids.h\r\n\r\n**To Reproduce**\r\nN/A\r\n\r\n**Expected behavior**\r\nEither CFE_PLATFORM_ES_PERF_MAX_IDS should be totally deprecated and all references should be replaced by CFE_MISSION_ES_PERF_MAX_IDS or (if deemed necessary) support for platform-specific max values should be re-added in the perf-log implementation.\r\n\r\n**Code snips**\r\ncfe/cmake/sample_defs/cpu1_platform_cfg.h:1978\r\ncfe/fsw/cfe-core/src/inc/cfe_es_events.h:1046\r\ncfe/fsw/cfe-core/unit-test/es_UT.c:3664\r\n\r\n**System observed on:**\r\nN/A\r\n\r\n**Additional context**\r\nN/A\r\n\r\n**Reporter Info**\r\nPJ Chapates Gateway Vehicle System Manager FSW Production, JSC\r\n'</li><li>'CF Purge Queue Command Opcode Not Defined\n**This issue was imported from the GSFC issue tracking system**\r\n\r\n_Imported from_: [GSFCCFS-1765] CF Purge Queue Command Opcode Not Defined\r\n_Originally submitted by_: Maldonado, Sergio E. (GSFC-580.0)[Arctic Slope Technical Services, Inc.] on Fri Oct 29 11:03:57 2021\r\n\r\n_Original Description_:\r\nThe command opcode for Purge Queue is not present in the CF\\_CMDS enumeration in cf\\_msg.h. It should be present with a value of 21. The command dispatch table in cf\\_cmd.c does have an entry for the command, as well as the implementation. Without the opcode defined, the command cannot be verified at the functional level. 
'</li><li>"File age check logic is wrong\n**Checklist (Please check before submitting)**\r\n\r\n* [x] I reviewed the [Contributing Guide](https://github.com/nasa/DS/blob/main/CONTRIBUTING.md).\r\n* [x] I performed a cursory search to see if the bug report is relevant, not redundant, nor in conflict with other tickets.\r\n\r\n**Describe the bug**\r\nProduces ~17 files in 10 minutes when requesting 1 file per minute\r\n\r\n**To Reproduce**\r\n1. Enable a 1 file per minute config\r\n2. Watch ~17 files get produced\r\n\r\n**Expected behavior**\r\n1 file per minute when configured to do so\r\n\r\n**Code snips**\r\nThe problem is how file age is accumulated. W/ the default config, 4 seconds are added every HK message, and another second is added every 1 second SB timeout. So within the typical 4 second scheduled HK request the file age gets incremented by 7 seconds (4 from HK processing and 3 from SB timeouts).\r\n\r\nhttps://github.com/nasa/DS/blob/ce988535edffd6b36cc1083e10988c2d0a4a38db/fsw/src/ds_app.c#L124\r\nhttps://github.com/nasa/DS/blob/ce988535edffd6b36cc1083e10988c2d0a4a38db/fsw/src/ds_app.c#L520\r\n\r\nReally the time accumulation logic is broken since it's going to vary based on receiving any other command that would cause SB not to timeout.\r\n\r\nLikely needs a functional test update to catch this issue.\r\n\r\n**System observed on:**\r\nIndependent of system\r\n\r\n**Additional context**\r\nNone\r\n\r\n**Reporter Info**\r\nJacob Hageman - NASA/GSFC"</li></ul> |
|
139 |
+
|
140 |
+
## Uses
|
141 |
+
|
142 |
+
### Direct Use for Inference
|
143 |
+
|
144 |
+
First install the SetFit library:
|
145 |
+
|
146 |
+
```bash
|
147 |
+
pip install setfit
|
148 |
+
```
|
149 |
+
|
150 |
+
Then you can load this model and run inference.
|
151 |
+
|
152 |
+
```python
|
153 |
+
from setfit import SetFitModel
|
154 |
+
|
155 |
+
# Download from the 🤗 Hub
|
156 |
+
model = SetFitModel.from_pretrained("setfit_model_id")
|
157 |
+
# Run inference
|
158 |
+
preds = model("""Consistent CFE_PSP_Main implementation
|
159 |
+
RTEMS PSP hardcodes \"/cf/cfe_es_startup.scr\", but mcp750 and pc-linux both use the CFE_PLATFORM_ES_NONVOL_STARTUP_FILE.
|
160 |
+
|
161 |
+
Inconsistent implementations.
|
162 |
+
|
163 |
+
From #102 (solved here):
|
164 |
+
cfe_psp_start.c for mcp750 VxWorks has StartupFilePath as an input parameter to CFE_PSP_Main, but calls CFE_ES_Main with CFE_PLATFORM_ES_NONVOL_STARTUP_FILE.
|
165 |
+
|
166 |
+
Confusing implementation... looks like at least the pc-linux PSP only uses CFE_PLATFORM_ES_NONVOL_STARTUP_FILE (but a different prototype).""")
|
167 |
+
```
|
168 |
+
|
169 |
+
<!--
|
170 |
+
### Downstream Use
|
171 |
+
|
172 |
+
*List how someone could finetune this model on their own dataset.*
|
173 |
+
-->
|
174 |
+
|
175 |
+
<!--
|
176 |
+
### Out-of-Scope Use
|
177 |
+
|
178 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
179 |
+
-->
|
180 |
+
|
181 |
+
<!--
|
182 |
+
## Bias, Risks and Limitations
|
183 |
+
|
184 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
185 |
+
-->
|
186 |
+
|
187 |
+
<!--
|
188 |
+
### Recommendations
|
189 |
+
|
190 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
191 |
+
-->
|
192 |
+
|
193 |
+
## Training Details
|
194 |
+
|
195 |
+
### Training Set Metrics
|
196 |
+
| Training set | Min | Median | Max |
|
197 |
+
|:-------------|:----|:---------|:-----|
|
198 |
+
| Word count | 1 | 110.5796 | 2778 |
|
199 |
+
|
200 |
+
| Label | Training Sample Count |
|
201 |
+
|:--------|:----------------------|
|
202 |
+
| bug | 662 |
|
203 |
+
| non-bug | 1517 |
|
204 |
+
|
205 |
+
### Training Hyperparameters
|
206 |
+
- batch_size: (16, 2)
|
207 |
+
- num_epochs: (1, 1)
|
208 |
+
- max_steps: -1
|
209 |
+
- sampling_strategy: oversampling
|
210 |
+
- num_iterations: 20
|
211 |
+
- body_learning_rate: (2e-05, 1e-05)
|
212 |
+
- head_learning_rate: 0.01
|
213 |
+
- loss: CosineSimilarityLoss
|
214 |
+
- distance_metric: cosine_distance
|
215 |
+
- margin: 0.25
|
216 |
+
- end_to_end: False
|
217 |
+
- use_amp: False
|
218 |
+
- warmup_proportion: 0.1
|
219 |
+
- l2_weight: 0.01
|
220 |
+
- seed: 42
|
221 |
+
- eval_max_steps: -1
|
222 |
+
- load_best_model_at_end: False
|
223 |
+
|
224 |
+
### Training Results
|
225 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
226 |
+
|:------:|:----:|:-------------:|:---------------:|
|
227 |
+
| 0.0002 | 1 | 0.4726 | - |
|
228 |
+
| 0.0092 | 50 | 0.2725 | - |
|
229 |
+
| 0.0184 | 100 | 0.2269 | - |
|
230 |
+
| 0.0275 | 150 | 0.2061 | - |
|
231 |
+
| 0.0367 | 200 | 0.2113 | - |
|
232 |
+
| 0.0459 | 250 | 0.1806 | - |
|
233 |
+
| 0.0551 | 300 | 0.1833 | - |
|
234 |
+
| 0.0642 | 350 | 0.1578 | - |
|
235 |
+
| 0.0734 | 400 | 0.1478 | - |
|
236 |
+
| 0.0826 | 450 | 0.1376 | - |
|
237 |
+
| 0.0918 | 500 | 0.1135 | - |
|
238 |
+
| 0.1010 | 550 | 0.1145 | - |
|
239 |
+
| 0.1101 | 600 | 0.1099 | - |
|
240 |
+
| 0.1193 | 650 | 0.0859 | - |
|
241 |
+
| 0.1285 | 700 | 0.0837 | - |
|
242 |
+
| 0.1377 | 750 | 0.0826 | - |
|
243 |
+
| 0.1468 | 800 | 0.0809 | - |
|
244 |
+
| 0.1560 | 850 | 0.0559 | - |
|
245 |
+
| 0.1652 | 900 | 0.0539 | - |
|
246 |
+
| 0.1744 | 950 | 0.0444 | - |
|
247 |
+
| 0.1836 | 1000 | 0.0376 | - |
|
248 |
+
| 0.1927 | 1050 | 0.0387 | - |
|
249 |
+
| 0.2019 | 1100 | 0.035 | - |
|
250 |
+
| 0.2111 | 1150 | 0.0317 | - |
|
251 |
+
| 0.2203 | 1200 | 0.029 | - |
|
252 |
+
| 0.2294 | 1250 | 0.0277 | - |
|
253 |
+
| 0.2386 | 1300 | 0.0108 | - |
|
254 |
+
| 0.2478 | 1350 | 0.0226 | - |
|
255 |
+
| 0.2570 | 1400 | 0.0105 | - |
|
256 |
+
| 0.2662 | 1450 | 0.02 | - |
|
257 |
+
| 0.2753 | 1500 | 0.016 | - |
|
258 |
+
| 0.2845 | 1550 | 0.0181 | - |
|
259 |
+
| 0.2937 | 1600 | 0.0184 | - |
|
260 |
+
| 0.3029 | 1650 | 0.0113 | - |
|
261 |
+
| 0.3120 | 1700 | 0.014 | - |
|
262 |
+
| 0.3212 | 1750 | 0.0101 | - |
|
263 |
+
| 0.3304 | 1800 | 0.0106 | - |
|
264 |
+
| 0.3396 | 1850 | 0.0101 | - |
|
265 |
+
| 0.3488 | 1900 | 0.0117 | - |
|
266 |
+
| 0.3579 | 1950 | 0.0115 | - |
|
267 |
+
| 0.3671 | 2000 | 0.0113 | - |
|
268 |
+
| 0.3763 | 2050 | 0.005 | - |
|
269 |
+
| 0.3855 | 2100 | 0.0062 | - |
|
270 |
+
| 0.3946 | 2150 | 0.0141 | - |
|
271 |
+
| 0.4038 | 2200 | 0.0096 | - |
|
272 |
+
| 0.4130 | 2250 | 0.0117 | - |
|
273 |
+
| 0.4222 | 2300 | 0.0051 | - |
|
274 |
+
| 0.4314 | 2350 | 0.0054 | - |
|
275 |
+
| 0.4405 | 2400 | 0.0049 | - |
|
276 |
+
| 0.4497 | 2450 | 0.0054 | - |
|
277 |
+
| 0.4589 | 2500 | 0.0027 | - |
|
278 |
+
| 0.4681 | 2550 | 0.0009 | - |
|
279 |
+
| 0.4772 | 2600 | 0.0021 | - |
|
280 |
+
| 0.4864 | 2650 | 0.005 | - |
|
281 |
+
| 0.4956 | 2700 | 0.0026 | - |
|
282 |
+
| 0.5048 | 2750 | 0.0025 | - |
|
283 |
+
| 0.5140 | 2800 | 0.0014 | - |
|
284 |
+
| 0.5231 | 2850 | 0.0005 | - |
|
285 |
+
| 0.5323 | 2900 | 0.0012 | - |
|
286 |
+
| 0.5415 | 2950 | 0.0027 | - |
|
287 |
+
| 0.5507 | 3000 | 0.0002 | - |
|
288 |
+
| 0.5598 | 3050 | 0.0012 | - |
|
289 |
+
| 0.5690 | 3100 | 0.0015 | - |
|
290 |
+
| 0.5782 | 3150 | 0.0001 | - |
|
291 |
+
| 0.5874 | 3200 | 0.0 | - |
|
292 |
+
| 0.5965 | 3250 | 0.0001 | - |
|
293 |
+
| 0.6057 | 3300 | 0.0011 | - |
|
294 |
+
| 0.6149 | 3350 | 0.0012 | - |
|
295 |
+
| 0.6241 | 3400 | 0.0043 | - |
|
296 |
+
| 0.6333 | 3450 | 0.0027 | - |
|
297 |
+
| 0.6424 | 3500 | 0.0007 | - |
|
298 |
+
| 0.6516 | 3550 | 0.0033 | - |
|
299 |
+
| 0.6608 | 3600 | 0.0005 | - |
|
300 |
+
| 0.6700 | 3650 | 0.0011 | - |
|
301 |
+
| 0.6791 | 3700 | 0.0023 | - |
|
302 |
+
| 0.6883 | 3750 | 0.0009 | - |
|
303 |
+
| 0.6975 | 3800 | 0.0012 | - |
|
304 |
+
| 0.7067 | 3850 | 0.0021 | - |
|
305 |
+
| 0.7159 | 3900 | 0.0003 | - |
|
306 |
+
| 0.7250 | 3950 | 0.0001 | - |
|
307 |
+
| 0.7342 | 4000 | 0.0001 | - |
|
308 |
+
| 0.7434 | 4050 | 0.0001 | - |
|
309 |
+
| 0.7526 | 4100 | 0.0023 | - |
|
310 |
+
| 0.7617 | 4150 | 0.0025 | - |
|
311 |
+
| 0.7709 | 4200 | 0.0001 | - |
|
312 |
+
| 0.7801 | 4250 | 0.0 | - |
|
313 |
+
| 0.7893 | 4300 | 0.0 | - |
|
314 |
+
| 0.7985 | 4350 | 0.001 | - |
|
315 |
+
| 0.8076 | 4400 | 0.0013 | - |
|
316 |
+
| 0.8168 | 4450 | 0.0002 | - |
|
317 |
+
| 0.8260 | 4500 | 0.0026 | - |
|
318 |
+
| 0.8352 | 4550 | 0.0002 | - |
|
319 |
+
| 0.8443 | 4600 | 0.0002 | - |
|
320 |
+
| 0.8535 | 4650 | 0.0 | - |
|
321 |
+
| 0.8627 | 4700 | 0.0001 | - |
|
322 |
+
| 0.8719 | 4750 | 0.0012 | - |
|
323 |
+
| 0.8811 | 4800 | 0.001 | - |
|
324 |
+
| 0.8902 | 4850 | 0.0001 | - |
|
325 |
+
| 0.8994 | 4900 | 0.001 | - |
|
326 |
+
| 0.9086 | 4950 | 0.0002 | - |
|
327 |
+
| 0.9178 | 5000 | 0.0002 | - |
|
328 |
+
| 0.9269 | 5050 | 0.001 | - |
|
329 |
+
| 0.9361 | 5100 | 0.0001 | - |
|
330 |
+
| 0.9453 | 5150 | 0.0021 | - |
|
331 |
+
| 0.9545 | 5200 | 0.0001 | - |
|
332 |
+
| 0.9637 | 5250 | 0.0001 | - |
|
333 |
+
| 0.9728 | 5300 | 0.0 | - |
|
334 |
+
| 0.9820 | 5350 | 0.0001 | - |
|
335 |
+
| 0.9912 | 5400 | 0.0002 | - |
|
336 |
+
|
337 |
+
### Framework Versions
|
338 |
+
- Python: 3.11.6
|
339 |
+
- SetFit: 1.1.0
|
340 |
+
- Sentence Transformers: 3.0.1
|
341 |
+
- Transformers: 4.44.2
|
342 |
+
- PyTorch: 2.4.1+cu121
|
343 |
+
- Datasets: 2.21.0
|
344 |
+
- Tokenizers: 0.19.1
|
345 |
+
|
346 |
+
## Citation
|
347 |
+
|
348 |
+
### BibTeX
|
349 |
+
```bibtex
|
350 |
+
@article{https://doi.org/10.48550/arxiv.2209.11055,
|
351 |
+
doi = {10.48550/ARXIV.2209.11055},
|
352 |
+
url = {https://arxiv.org/abs/2209.11055},
|
353 |
+
author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
|
354 |
+
keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences},
|
355 |
+
title = {Efficient Few-Shot Learning Without Prompts},
|
356 |
+
publisher = {arXiv},
|
357 |
+
year = {2022},
|
358 |
+
copyright = {Creative Commons Attribution 4.0 International}
|
359 |
+
}
|
360 |
+
```
|
361 |
+
|
362 |
+
<!--
|
363 |
+
## Glossary
|
364 |
+
|
365 |
+
*Clearly define terms in order to be accessible across audiences.*
|
366 |
+
-->
|
367 |
+
|
368 |
+
<!--
|
369 |
+
## Model Card Authors
|
370 |
+
|
371 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
372 |
+
-->
|
373 |
+
|
374 |
+
<!--
|
375 |
+
## Model Card Contact
|
376 |
+
|
377 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
378 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "sentence-transformers/all-mpnet-base-v2",
|
3 |
+
"architectures": [
|
4 |
+
"MPNetModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "mpnet",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 1,
|
20 |
+
"relative_attention_num_buckets": 32,
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.44.2",
|
23 |
+
"vocab_size": 30527
|
24 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "3.0.1",
|
4 |
+
"transformers": "4.44.2",
|
5 |
+
"pytorch": "2.4.1+cu121"
|
6 |
+
},
|
7 |
+
"prompts": {},
|
8 |
+
"default_prompt_name": null,
|
9 |
+
"similarity_fn_name": null
|
10 |
+
}
|
config_setfit.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"normalize_embeddings": false,
|
3 |
+
"labels": [
|
4 |
+
"bug",
|
5 |
+
"non-bug"
|
6 |
+
]
|
7 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c79dcbe2189baa41c858c53c5d0df8f3d5b732ad5189ba655ab36e9e12d460c
|
3 |
+
size 437967672
|
model_head.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:694d9d99075f1d1b95462040d4767345d06b6fa7eb9f4eeeeec08284622ac32f
|
3 |
+
size 7055
|
modules.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"idx": 2,
|
16 |
+
"name": "2",
|
17 |
+
"path": "2_Normalize",
|
18 |
+
"type": "sentence_transformers.models.Normalize"
|
19 |
+
}
|
20 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 384,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": false,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "[UNK]",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": false,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "<s>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "<pad>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "</s>",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "<unk>",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": true,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"104": {
|
36 |
+
"content": "[UNK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
},
|
43 |
+
"30526": {
|
44 |
+
"content": "<mask>",
|
45 |
+
"lstrip": true,
|
46 |
+
"normalized": false,
|
47 |
+
"rstrip": false,
|
48 |
+
"single_word": false,
|
49 |
+
"special": true
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"bos_token": "<s>",
|
53 |
+
"clean_up_tokenization_spaces": true,
|
54 |
+
"cls_token": "<s>",
|
55 |
+
"do_lower_case": true,
|
56 |
+
"eos_token": "</s>",
|
57 |
+
"mask_token": "<mask>",
|
58 |
+
"max_length": 128,
|
59 |
+
"model_max_length": 384,
|
60 |
+
"pad_to_multiple_of": null,
|
61 |
+
"pad_token": "<pad>",
|
62 |
+
"pad_token_type_id": 0,
|
63 |
+
"padding_side": "right",
|
64 |
+
"sep_token": "</s>",
|
65 |
+
"stride": 0,
|
66 |
+
"strip_accents": null,
|
67 |
+
"tokenize_chinese_chars": true,
|
68 |
+
"tokenizer_class": "MPNetTokenizer",
|
69 |
+
"truncation_side": "right",
|
70 |
+
"truncation_strategy": "longest_first",
|
71 |
+
"unk_token": "[UNK]"
|
72 |
+
}
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|