Corran committed on
Commit
f6dbb74
·
verified ·
1 Parent(s): a793142

Add SetFit model

Browse files
1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 384,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
README.md ADDED
The diff for this file is too large to render. See raw diff
 
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "sentence-transformers/all-MiniLM-L6-v2",
3
+ "architectures": [
4
+ "BertModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 384,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 1536,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 6,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.39.0",
23
+ "type_vocab_size": 2,
24
+ "use_cache": true,
25
+ "vocab_size": 30522
26
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "3.1.1",
4
+ "transformers": "4.39.0",
5
+ "pytorch": "2.5.1+cu121"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": null
10
+ }
config_setfit.json ADDED
@@ -0,0 +1,108 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "normalize_embeddings": false,
3
+ "labels": [
4
+ "Acknowledging limitation(s) whilst stating a finding or contribution",
5
+ "Advising cautious interpretation of the findings",
6
+ "Commenting on the findings",
7
+ "Commenting on the strengths of the current study",
8
+ "Comparing the result: contradicting previous findings",
9
+ "Comparing the result: supporting previous findings",
10
+ "Contrasting sources with \u2018however\u2019 for emphasis",
11
+ "Describing previously used methods",
12
+ "Describing questionnaire design",
13
+ "Describing the characteristics of the participants",
14
+ "Describing the limitations of the current study",
15
+ "Describing the process: adverbs of manner",
16
+ "Describing the process: expressing purpose with for",
17
+ "Describing the process: infinitive of purpose",
18
+ "Describing the process: sequence words",
19
+ "Describing the process: statistical procedures",
20
+ "Describing the process: typical verbs in the passive form",
21
+ "Describing the process: using + instrument",
22
+ "Describing the research design and the methods used",
23
+ "Describing what other writers do in their published work",
24
+ "Detailing specific limitations",
25
+ "Establishing the importance of the topic for the discipline",
26
+ "Establishing the importance of the topic for the discipline: time frame given",
27
+ "Establishing the importance of the topic for the world or society",
28
+ "Establishing the importance of the topic for the world or society: time frame given",
29
+ "Establising the importance of the topic as a problem to be addressed",
30
+ "Explaining keywords (also refer to Defining Terms)",
31
+ "Explaining the provenance of articles for review",
32
+ "Explaining the provenance of the participants",
33
+ "Explaining the significance of the current study",
34
+ "Explaining the significance of the findings or contribution of the study",
35
+ "General comments on the relevant literature",
36
+ "General reference to previous research or scholarship: highlighting negative outcomes",
37
+ "Giving reasons for personal interest in the research (sometimes found in the humanities, and the applied human sciences)",
38
+ "Giving reasons why a particular method was adopted",
39
+ "Giving reasons why a particular method was rejected",
40
+ "Highlighting inadequacies or weaknesses of previous studies (also refer to Being Critical)",
41
+ "Highlighting interesting or surprising results",
42
+ "Highlighting significant data in a table or chart",
43
+ "Identifying a controversy within the field of study",
44
+ "Identifying a knowledge gap in the field of study",
45
+ "Implications and/or recommendations for practice or policy",
46
+ "Indicating an expected outcome",
47
+ "Indicating an unexpected outcome",
48
+ "Indicating criteria for selection or inclusion in the study",
49
+ "Indicating methodological problems or limitations",
50
+ "Indicating missing, weak, or contradictory evidence",
51
+ "Indicating the methodology for the current research",
52
+ "Indicating the use of an established method",
53
+ "Introducing the limitations of the current study",
54
+ "Making recommendations for further research work",
55
+ "Noting implications of the findings",
56
+ "Noting the lack of or paucity of previous research",
57
+ "Offering an explanation for the findings",
58
+ "Outlining the structure of a short paper",
59
+ "Outlining the structure of a thesis or dissertation",
60
+ "Pointing out interesting or important findings",
61
+ "Previewing a chapter",
62
+ "Previous research: A historic perspective",
63
+ "Previous research: Approaches taken",
64
+ "Previous research: What has been established or proposed",
65
+ "Previous research: area investigated as the sentence object",
66
+ "Previous research: area investigated as the sentence subject",
67
+ "Previous research: highlighting negative outcomes",
68
+ "Providing background information: reference to the literature",
69
+ "Providing background information: reference to the purpose of the study",
70
+ "Reference to previous research: important studies",
71
+ "Referring back to the purpose of the paper or study",
72
+ "Referring back to the research aims or procedures",
73
+ "Referring to a single investigation in the past: investigation prominent",
74
+ "Referring to a single investigation in the past: researcher prominent",
75
+ "Referring to another writer\u2019s idea(s) or position",
76
+ "Referring to data in a table or chart",
77
+ "Referring to important texts in the area of interest",
78
+ "Referring to previous work to establish what is already known",
79
+ "Referring to secondary sources",
80
+ "Referring to the literature to justify a method or approach ",
81
+ "Reporting positive and negative reactions",
82
+ "Restating a result or one of several results",
83
+ "Setting out the research questions or hypotheses",
84
+ "Some ways of introducing quotations",
85
+ "Stating a negative result",
86
+ "Stating a positive result",
87
+ "Stating purpose of the current research with reference to gaps or issues in the literature",
88
+ "Stating the aims of the current research (note frequent use of past tense)",
89
+ "Stating the focus, aim, or argument of a short paper",
90
+ "Stating the purpose of the thesis, dissertation, or research article (note use of present tense)",
91
+ "Stating what is currently known about the topic",
92
+ "Suggesting general hypotheses",
93
+ "Suggesting implications for what is already known",
94
+ "Suggestions for future work",
95
+ "Summarising the literature review",
96
+ "Summarising the main research findings",
97
+ "Summarising the results section",
98
+ "Summarising the studies reviewed",
99
+ "Surveys and interviews: Introducing excerpts from interview data",
100
+ "Surveys and interviews: Reporting participants\u2019 views",
101
+ "Surveys and interviews: Reporting proportions",
102
+ "Surveys and interviews: Reporting response rates",
103
+ "Surveys and interviews: Reporting themes",
104
+ "Synthesising sources: contrasting evidence or ideas",
105
+ "Synthesising sources: supporting evidence or ideas",
106
+ "Transition: moving to the next result"
107
+ ]
108
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8511aae8825d3a996b23c7396fa18e39f8400be98c865e8a0715f18b54dbd22b
3
+ size 90864192
model_head.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd905ee574c42dae304d3561c962c107f695fbf80e3139f6aa8eeaa8d505852
3
+ size 367519
modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 256,
3
+ "do_lower_case": false
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "max_length": 128,
50
+ "model_max_length": 256,
51
+ "never_split": null,
52
+ "pad_to_multiple_of": null,
53
+ "pad_token": "[PAD]",
54
+ "pad_token_type_id": 0,
55
+ "padding_side": "right",
56
+ "sep_token": "[SEP]",
57
+ "stride": 0,
58
+ "strip_accents": null,
59
+ "tokenize_chinese_chars": true,
60
+ "tokenizer_class": "BertTokenizer",
61
+ "truncation_side": "right",
62
+ "truncation_strategy": "longest_first",
63
+ "unk_token": "[UNK]"
64
+ }
vocab.txt ADDED
The diff for this file is too large to render. See raw diff