Upload 8 files

Browse files

Files changed (9) hide show

.gitattributes +1 -0
classification_report.txt +14 -0
config.json +48 -0
label_mappings.json +1 -0
model.safetensors +3 -0
special_tokens_map.json +51 -0
tokenizer.json +3 -0
tokenizer_config.json +55 -0
training_args.bin +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

classification_report.txt ADDED Viewed

	@@ -0,0 +1,14 @@

+                          precision    recall  f1-score   support
+ business_rnd_innovation      0.938     0.833     0.882        18
+fellowships_scholarships      0.886     0.912     0.899        34
+   institutional_funding      0.750     0.600     0.667         5
+networking_collaborative      0.773     0.850     0.810        20
+  other_research_funding      1.000     0.455     0.625        11
+            out_of_scope      0.812     0.867     0.839        30
+   project_grants_public      0.864     0.895     0.879       114
+ research_infrastructure      0.714     0.714     0.714        14
+                accuracy                          0.850       246
+               macro avg      0.842     0.766     0.789       246
+            weighted avg      0.854     0.850     0.846       246

config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "architectures": [
+    "XLMRobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "business_rnd_innovation",
+    "1": "fellowships_scholarships",
+    "2": "institutional_funding",
+    "3": "networking_collaborative",
+    "4": "other_research_funding",
+    "5": "out_of_scope",
+    "6": "project_grants_public",
+    "7": "research_infrastructure"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "business_rnd_innovation": 0,
+    "fellowships_scholarships": 1,
+    "institutional_funding": 2,
+    "networking_collaborative": 3,
+    "other_research_funding": 4,
+    "out_of_scope": 5,
+    "project_grants_public": 6,
+    "research_infrastructure": 7
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 250002
+}

label_mappings.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"label_list": ["business_rnd_innovation", "fellowships_scholarships", "institutional_funding", "networking_collaborative", "other_research_funding", "out_of_scope", "project_grants_public", "research_infrastructure"], "label2id": {"business_rnd_innovation": 0, "fellowships_scholarships": 1, "institutional_funding": 2, "networking_collaborative": 3, "other_research_funding": 4, "out_of_scope": 5, "project_grants_public": 6, "research_infrastructure": 7}, "id2label": {"0": "business_rnd_innovation", "1": "fellowships_scholarships", "2": "institutional_funding", "3": "networking_collaborative", "4": "other_research_funding", "5": "out_of_scope", "6": "project_grants_public", "7": "research_infrastructure"}}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:14b03dd7a3c9cbd5eea56fbfd522aa323778ae71abbdd963d48150b451a3c02d
+size 2239643272

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ffb37461c391f096759f4a9bbbc329da0f36952f88bab061fcf84940c022e98
+size 17082999

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250001": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f729fffea91b416e475974b584fec16bbaf82c82209e0a48e3a4e9e8e3245979
+size 5841